CSIT-1133: Cosmetic improvements in trending plots

[csit.git] / resources / tools / presentation / new / generator_CPTA.py
diff --git a/resources/tools/presentation/new/generator_CPTA.py b/resources/tools/presentation/new/generator_CPTA.py

index 1b4115f..d4ac06d 100644 (file)
--- a/resources/tools/presentation/new/generator_CPTA.py
+++ b/resources/tools/presentation/new/generator_CPTA.py
@@ -27,7 +27,7 @@ import pandas as pd
  from collections import OrderedDict
  from datetime import datetime
  
-from utils import archive_input_data, execute_command,\
+from utils import archive_input_data, execute_command, \
      classify_anomalies, Worker
  
  
@@ -87,22 +87,22 @@ def generate_cpta(spec, data):
      return ret_code
  
  
-def _generate_trending_traces(in_data, build_info, moving_win_size=10,
+def _generate_trending_traces(in_data, job_name, build_info,
                                show_trend_line=True, name="", color=""):
      """Generate the trending traces:
       - samples,
-     - trimmed moving median (trending line)
       - outliers, regress, progress
+     - average of normal samples (trending line)
  
      :param in_data: Full data set.
+    :param job_name: The name of the job which generated the data.
      :param build_info: Information about the builds.
-    :param moving_win_size: Window size.
      :param show_trend_line: Show moving median (trending plot).
      :param name: Name of the plot
      :param color: Name of the color for the plot.
      :type in_data: OrderedDict
+    :type job_name: str
      :type build_info: dict
-    :type moving_win_size: int
      :type show_trend_line: bool
      :type name: str
      :type color: str
@@ -116,10 +116,15 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
      hover_text = list()
      xaxis = list()
      for idx in data_x:
-        hover_text.append("vpp-ref: {0}<br>csit-ref: mrr-daily-build-{1}".
-                          format(build_info[str(idx)][1].rsplit('~', 1)[0],
-                                 idx))
-        date = build_info[str(idx)][0]
+        if "dpdk" in job_name:
+            hover_text.append("dpdk-ref: {0}<br>csit-ref: mrr-weekly-build-{1}".
+                              format(build_info[job_name][str(idx)][1].
+                                     rsplit('~', 1)[0], idx))
+        elif "vpp" in job_name:
+            hover_text.append("vpp-ref: {0}<br>csit-ref: mrr-daily-build-{1}".
+                              format(build_info[job_name][str(idx)][1].
+                                     rsplit('~', 1)[0], idx))
+        date = build_info[job_name][str(idx)][0]
          xaxis.append(datetime(int(date[0:4]), int(date[4:6]), int(date[6:8]),
                                int(date[9:11]), int(date[12:])))
  
@@ -131,9 +136,8 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
      anomalies_colors = list()
      anomalies_avgs = list()
      anomaly_color = {
-        "outlier": 0.0,
-        "regression": 0.33,
-        "normal": 0.66,
+        "regression": 0.0,
+        "normal": 0.5,
          "progression": 1.0
      }
      if anomaly_classification:
@@ -145,7 +149,7 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
                  anomalies_colors.append(
                      anomaly_color[anomaly_classification[idx]])
                  anomalies_avgs.append(avgs[idx])
-        anomalies_colors.extend([0.0, 0.33, 0.66, 1.0])
+        anomalies_colors.extend([0.0, 0.5, 1.0])
  
      # Create traces
  
@@ -156,8 +160,9 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
          line={
              "width": 1
          },
+        showlegend=True,
          legendgroup=name,
-        name="{name}-thput".format(name=name),
+        name="{name}".format(name=name),
          marker={
              "size": 5,
              "color": color,
@@ -178,6 +183,7 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
                  "width": 1,
                  "color": color,
              },
+            showlegend=False,
              legendgroup=name,
              name='{name}-trend'.format(name=name)
          )
@@ -188,20 +194,18 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
          y=anomalies_avgs,
          mode='markers',
          hoverinfo="none",
-        showlegend=True,
+        showlegend=False,
          legendgroup=name,
          name="{name}-anomalies".format(name=name),
          marker={
              "size": 15,
              "symbol": "circle-open",
              "color": anomalies_colors,
-            "colorscale": [[0.00, "grey"],
-                           [0.25, "grey"],
-                           [0.25, "red"],
-                           [0.50, "red"],
-                           [0.50, "white"],
-                           [0.75, "white"],
-                           [0.75, "green"],
+            "colorscale": [[0.00, "red"],
+                           [0.33, "red"],
+                           [0.33, "white"],
+                           [0.66, "white"],
+                           [0.66, "green"],
                             [1.00, "green"]],
              "showscale": True,
              "line": {
@@ -216,8 +220,8 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
                      "size": 14
                  },
                  "tickmode": 'array',
-                "tickvals": [0.125, 0.375, 0.625, 0.875],
-                "ticktext": ["Outlier", "Regression", "Normal", "Progression"],
+                "tickvals": [0.167, 0.500, 0.833],
+                "ticktext": ["Regression", "Normal", "Progression"],
                  "ticks": "",
                  "ticklen": 0,
                  "tickangle": -90,
@@ -227,7 +231,10 @@ def _generate_trending_traces(in_data, build_info, moving_win_size=10,
      )
      traces.append(trace_anomalies)
  
-    return traces, anomaly_classification[-1]
+    if anomaly_classification:
+        return traces, anomaly_classification[-1]
+    else:
+        return traces, None
  
  
  def _generate_all_charts(spec, input_data):
@@ -250,7 +257,7 @@ def _generate_all_charts(spec, input_data):
          logs.append(("INFO", "  Generating the chart '{0}' ...".
                       format(graph.get("title", ""))))
  
-        job_name = spec.cpta["data"].keys()[0]
+        job_name = graph["data"].keys()[0]
  
          csv_tbl = list()
          res = list()
@@ -264,8 +271,10 @@ def _generate_all_charts(spec, input_data):
              return
  
          chart_data = dict()
-        for job in data:
-            for index, bld in job.items():
+        for job, job_data in data.iteritems():
+            if job != job_name:
+                continue
+            for index, bld in job_data.items():
                  for test_name, test in bld.items():
                      if chart_data.get(test_name, None) is None:
                          chart_data[test_name] = OrderedDict()
@@ -278,7 +287,7 @@ def _generate_all_charts(spec, input_data):
          # Add items to the csv table:
          for tst_name, tst_data in chart_data.items():
              tst_lst = list()
-            for bld in builds_lst:
+            for bld in builds_dict[job_name]:
                  itm = tst_data.get(int(bld), '')
                  tst_lst.append(str(itm))
              csv_tbl.append("{0},".format(tst_name) + ",".join(tst_lst) + '\n')
@@ -294,8 +303,8 @@ def _generate_all_charts(spec, input_data):
              test_name = test_name.split('.')[-1]
              trace, rslt = _generate_trending_traces(
                  test_data,
+                job_name=job_name,
                  build_info=build_info,
-                moving_win_size=win_size,
                  name='-'.join(test_name.split('-')[3:-1]),
                  color=COLORS[index])
              traces.extend(trace)
@@ -320,30 +329,32 @@ def _generate_all_charts(spec, input_data):
                  logs.append(("WARNING", "No data for the plot. Skipped."))
  
          data_out = {
+            "job_name": job_name,
              "csv_table": csv_tbl,
              "results": res,
              "logs": logs
          }
          data_q.put(data_out)
  
-    job_name = spec.cpta["data"].keys()[0]
-
-    builds_lst = list()
-    for build in spec.input["builds"][job_name]:
-        status = build["status"]
-        if status != "failed" and status != "not found":
-            builds_lst.append(str(build["build"]))
-
-    # Get "build ID": "date" dict:
-    build_info = OrderedDict()
-    for build in builds_lst:
-        try:
-            build_info[build] = (
-                input_data.metadata(job_name, build)["generated"][:14],
-                input_data.metadata(job_name, build)["version"]
+    builds_dict = dict()
+    for job in spec.input["builds"].keys():
+        if builds_dict.get(job, None) is None:
+            builds_dict[job] = list()
+        for build in spec.input["builds"][job]:
+            status = build["status"]
+            if status != "failed" and status != "not found":
+                builds_dict[job].append(str(build["build"]))
+
+    # Create the per-job "build ID": ("generated", "version") dict:
+    build_info = dict()
+    for job_name, job_data in builds_dict.items():
+        if build_info.get(job_name, None) is None:
+            build_info[job_name] = OrderedDict()
+        for build in job_data:
+            build_info[job_name][build] = (
+                input_data.metadata(job_name, build).get("generated", ""),
+                input_data.metadata(job_name, build).get("version", "")
              )
-        except KeyError:
-            build_info[build] = ("", "")
  
      work_queue = multiprocessing.JoinableQueue()
      manager = multiprocessing.Manager()
@@ -368,21 +379,24 @@ def _generate_all_charts(spec, input_data):
      anomaly_classifications = list()
  
      # Create the header:
-    csv_table = list()
-    header = "Build Number:," + ",".join(builds_lst) + '\n'
-    csv_table.append(header)
-    build_dates = [x[0] for x in build_info.values()]
-    header = "Build Date:," + ",".join(build_dates) + '\n'
-    csv_table.append(header)
-    vpp_versions = [x[1] for x in build_info.values()]
-    header = "VPP Version:," + ",".join(vpp_versions) + '\n'
-    csv_table.append(header)
+    csv_tables = dict()
+    for job_name in builds_dict.keys():
+        if csv_tables.get(job_name, None) is None:
+            csv_tables[job_name] = list()
+        header = "Build Number:," + ",".join(builds_dict[job_name]) + '\n'
+        csv_tables[job_name].append(header)
+        build_dates = [x[0] for x in build_info[job_name].values()]
+        header = "Build Date:," + ",".join(build_dates) + '\n'
+        csv_tables[job_name].append(header)
+        versions = [x[1] for x in build_info[job_name].values()]
+        header = "Version:," + ",".join(versions) + '\n'
+        csv_tables[job_name].append(header)
  
      while not data_queue.empty():
          result = data_queue.get()
  
          anomaly_classifications.extend(result["results"])
-        csv_table.extend(result["csv_table"])
+        csv_tables[result["job_name"]].extend(result["csv_table"])
  
          for item in result["logs"]:
              if item[0] == "INFO":
@@ -404,33 +418,34 @@ def _generate_all_charts(spec, input_data):
          worker.join()
  
      # Write the tables:
-    file_name = spec.cpta["output-file"] + "-trending"
-    with open("{0}.csv".format(file_name), 'w') as file_handler:
-        file_handler.writelines(csv_table)
-
-    txt_table = None
-    with open("{0}.csv".format(file_name), 'rb') as csv_file:
-        csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
-        line_nr = 0
-        for row in csv_content:
-            if txt_table is None:
-                txt_table = prettytable.PrettyTable(row)
-            else:
-                if line_nr > 1:
-                    for idx, item in enumerate(row):
-                        try:
-                            row[idx] = str(round(float(item) / 1000000, 2))
-                        except ValueError:
-                            pass
-                try:
-                    txt_table.add_row(row)
-                except Exception as err:
-                    logging.warning("Error occurred while generating TXT table:"
-                                    "\n{0}".format(err))
-            line_nr += 1
-        txt_table.align["Build Number:"] = "l"
-    with open("{0}.txt".format(file_name), "w") as txt_file:
-        txt_file.write(str(txt_table))
+    for job_name, csv_table in csv_tables.items():
+        file_name = spec.cpta["output-file"] + "-" + job_name + "-trending"
+        with open("{0}.csv".format(file_name), 'w') as file_handler:
+            file_handler.writelines(csv_table)
+
+        txt_table = None
+        with open("{0}.csv".format(file_name), 'rb') as csv_file:
+            csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
+            line_nr = 0
+            for row in csv_content:
+                if txt_table is None:
+                    txt_table = prettytable.PrettyTable(row)
+                else:
+                    if line_nr > 1:
+                        for idx, item in enumerate(row):
+                            try:
+                                row[idx] = str(round(float(item) / 1000000, 2))
+                            except ValueError:
+                                pass
+                    try:
+                        txt_table.add_row(row)
+                    except Exception as err:
+                        logging.warning("Error occurred while generating TXT "
+                                        "table:\n{0}".format(err))
+                line_nr += 1
+            txt_table.align["Build Number:"] = "l"
+        with open("{0}.txt".format(file_name), "w") as txt_file:
+            txt_file.write(str(txt_table))
  
      # Evaluate result:
      if anomaly_classifications: