import numpy as np


def remove_outliers(input_data, outlier_const):
    """Remove outliers from the input data using the interquartile range.

    An item is kept when it lies within the closed interval
    [Q1 - outlier_const * IQR, Q3 + outlier_const * IQR], where Q1 and Q3 are
    the 25th and 75th percentiles of the input data and IQR = Q3 - Q1.

    :param input_data: Data from which the outliers will be removed.
    :param outlier_const: Outlier constant; multiplier applied to the
        interquartile range to get the allowed distance from the quartiles.
    :type input_data: list
    :type outlier_const: float
    :returns: The input list without outliers, in the original order. An empty
        list is returned for empty input.
    :rtype: list
    """

    data = np.array(input_data)
    # Percentiles are undefined for an empty data set; nothing to filter.
    if data.size == 0:
        return list()

    upper_quartile = np.percentile(data, 75)
    lower_quartile = np.percentile(data, 25)
    # Allowed distance below the lower / above the upper quartile.
    margin = (upper_quartile - lower_quartile) * outlier_const
    lower_bound = lower_quartile - margin
    upper_bound = upper_quartile + margin

    # tolist() converts numpy scalars back to plain Python numbers.
    return [item for item in data.tolist()
            if lower_bound <= item <= upper_bound]