PAL: Update to RF 5.0 and pandas.Series
diff --git a/resources/tools/presentation/input_data_parser.py b/resources/tools/presentation/input_data_parser.py
index 00c2380..7f1ccd3 100644
@@ -1,4 +1,4 @@
-# Copyright (c) 2021 Cisco and/or its affiliates.
+# Copyright (c) 2022 Cisco and/or its affiliates.
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at:
@@ -287,8 +287,6 @@ class ExecutionChecker(ResultVisitor):
     )
     REGEX_TC_TAG = re.compile(r'\d+[tT]\d+[cC]')
 
-    REGEX_TC_NAME_OLD = re.compile(r'-\d+[tT]\d+[cC]-')
-
     REGEX_TC_NAME_NEW = re.compile(r'-\d+[cC]-')
 
     REGEX_TC_NUMBER = re.compile(r'tc\d{2}-')
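
Note on the removed pattern: REGEX_TC_NAME_OLD matched test names that already carried the full threads/cores marker (e.g. "-2t1c-"); after this change only the tag-based rewrite in start_test remains. A minimal sketch of what the two surviving patterns match (sample strings are illustrative):

```python
import re

REGEX_TC_TAG = re.compile(r'\d+[tT]\d+[cC]')   # matches a tag such as "2T1C"
REGEX_TC_NAME_NEW = re.compile(r'-\d+[cC]-')   # matches "-1c-" inside a name

assert REGEX_TC_TAG.search("2T1C")
assert REGEX_TC_NAME_NEW.search("64b-1c-ethip4-ip4base-ndrpdr")
assert not REGEX_TC_NAME_NEW.search("64b-2t1c-ethip4-ip4base-ndrpdr")
```
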
@@ -299,7 +297,7 @@ class ExecutionChecker(ResultVisitor):
         r'hostname=\"(\d{1,3}.\d{1,3}.\d{1,3}.\d{1,3})\",hook=\"(.*)\"'
     )
 
-    def __init__(self, metadata, mapping, ignore, for_output):
+    def __init__(self, metadata, mapping, ignore, process_oper):
         """Initialisation.
 
         :param metadata: Key-value pairs to be included in "metadata" part of
@@ -307,11 +305,12 @@ class ExecutionChecker(ResultVisitor):
         :param mapping: Mapping of the old names of test cases to the new
             (actual) one.
         :param ignore: List of TCs to be ignored.
-        :param for_output: Output to be generated from downloaded data.
+        :param process_oper: If True, operational data (show run, telemetry) is
+            processed.
         :type metadata: dict
         :type mapping: dict
         :type ignore: list
-        :type for_output: str
+        :type process_oper: bool
         """
 
         # Type of message to parse out from the test messages
@@ -332,7 +331,7 @@ class ExecutionChecker(ResultVisitor):
         # Ignore list
         self._ignore = ignore
 
-        self._for_output = for_output
+        self._process_oper = process_oper
 
         # Number of PAPI History messages found:
         # 0 - no message
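
The string-valued for_output (the old code special-cased the value "trending") is reduced to a single boolean. A runnable sketch of the new gating, using a stand-in class (the real one is ExecutionChecker above):

```python
class CheckerSketch:
    """Stand-in for ExecutionChecker, showing the process_oper gate."""

    def __init__(self, process_oper):
        # True: keep operational data ("show run", telemetry); False: skip it.
        self._process_oper = process_oper

    def visit_test_kw(self, kw_name):
        if not self._process_oper:
            return "skipped"
        return f"processed {kw_name}"

assert CheckerSketch(False).visit_test_kw("Show Running Config") == "skipped"
```
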
@@ -362,7 +361,6 @@ class ExecutionChecker(ResultVisitor):
         # Dictionary defining the methods used to parse different types of
         # messages
         self.parse_msg = {
-            u"timestamp": self._get_timestamp,
             u"vpp-version": self._get_vpp_version,
             u"dpdk-version": self._get_dpdk_version,
             u"teardown-papi-history": self._get_papi_history,
@@ -480,7 +478,8 @@ class ExecutionChecker(ResultVisitor):
             return u"Test Failed."
 
         def _process_lat(in_str_1, in_str_2):
-            """Extract min, avg, max values from latency string.
+            """Extract P50, P90 and P99 latencies or min, avg, max values from
+            latency string.
 
             :param in_str_1: Latency string for one direction produced by robot
                 framework.
@@ -501,13 +500,13 @@ class ExecutionChecker(ResultVisitor):
             try:
                 hdr_lat_1 = hdrh.histogram.HdrHistogram.decode(in_list_1[3])
             except hdrh.codec.HdrLengthException:
-                return None
+                hdr_lat_1 = None
 
             in_list_2[3] += u"=" * (len(in_list_2[3]) % 4)
             try:
                 hdr_lat_2 = hdrh.histogram.HdrHistogram.decode(in_list_2[3])
             except hdrh.codec.HdrLengthException:
-                return None
+                hdr_lat_2 = None
 
             if hdr_lat_1 and hdr_lat_2:
                 hdr_lat = (
@@ -518,11 +517,17 @@ class ExecutionChecker(ResultVisitor):
                     hdr_lat_2.get_value_at_percentile(90.0),
                     hdr_lat_2.get_value_at_percentile(99.0)
                 )
-
                 if all(hdr_lat):
                     return hdr_lat
 
-            return None
+            hdr_lat = (
+                int(in_list_1[0]), int(in_list_1[1]), int(in_list_1[2]),
+                int(in_list_2[0]), int(in_list_2[1]), int(in_list_2[2])
+            )
+            for item in hdr_lat:
+                if item in (-1, 4294967295, 0):
+                    return None
+            return hdr_lat
 
         try:
             out_msg = (
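
The handler no longer bails out on the first failed histogram decode; it now falls back to the integer min/avg/max fields, rejecting the whole tuple if any value is a sentinel (-1, 0, or 4294967295, i.e. UINT32_MAX). A self-contained sketch of the percentile path, assuming the hdrh package; base64 padding is restored to a multiple of four before decoding:

```python
from hdrh.codec import HdrLengthException
from hdrh.histogram import HdrHistogram

def percentiles_or_none(encoded):
    """Return (P50, P90, P99) from a base64 HDR histogram, or None."""
    encoded += "=" * (-len(encoded) % 4)   # restore stripped base64 padding
    try:
        hist = HdrHistogram.decode(encoded)
    except HdrLengthException:
        return None                        # caller falls back to min/avg/max
    return tuple(
        hist.get_value_at_percentile(pct) for pct in (50.0, 90.0, 99.0)
    )
```
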
@@ -614,18 +619,6 @@ class ExecutionChecker(ResultVisitor):
             finally:
                 self._msg_type = None
 
-    def _get_timestamp(self, msg):
-        """Called when extraction of timestamp is required.
-
-        :param msg: Message to process.
-        :type msg: Message
-        :returns: Nothing.
-        """
-
-        self._timestamp = msg.timestamp[:14]
-        self._data[u"metadata"][u"generated"] = self._timestamp
-        self._msg_type = None
-
     def _get_papi_history(self, msg):
         """Called when extraction of PAPI command history is required.
 
@@ -1050,7 +1043,7 @@ class ExecutionChecker(ResultVisitor):
                                   u"level": len(suite.longname.split(u"."))
                               }
 
-        suite.keywords.visit(self)
+        suite.setup.visit(self)
 
     def end_suite(self, suite):
         """Called when suite ends.
@@ -1068,7 +1061,7 @@ class ExecutionChecker(ResultVisitor):
         :returns: Nothing.
         """
         if self.start_test(test) is not False:
-            test.keywords.visit(self)
+            test.body.visit(self)
             self.end_test(test)
 
     def start_test(self, test):
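
These two hunks are the core of the RF 5.0 migration: the result model no longer exposes test.keywords or suite.keywords; a test carries a generic body, and suite setup is visited via suite.setup. A minimal sketch against robot.api (the output path is illustrative):

```python
from robot.api import ExecutionResult, ResultVisitor

class BodyLister(ResultVisitor):
    """Walk the RF 5.0 result model: tests have .body, not .keywords."""

    def visit_test(self, test):
        for item in test.body:             # keywords, messages, FOR/IF, ...
            print(type(item).__name__)

result = ExecutionResult("output.xml")     # illustrative path
result.visit(BodyLister())
```
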
@@ -1136,38 +1129,36 @@ class ExecutionChecker(ResultVisitor):
         else:
             test_result[u"msg"] = test.message
 
-        if u"PERFTEST" in tags:
+        if u"PERFTEST" in tags and u"TREX" not in tags:
             # Replace info about cores (e.g. -1c-) with the info about threads
             # and cores (e.g. -1t1c-) in the long test case names and in the
             # test case names if necessary.
-            groups = re.search(self.REGEX_TC_NAME_OLD, self._test_id)
-            if not groups:
-                tag_count = 0
-                tag_tc = str()
-                for tag in test_result[u"tags"]:
-                    groups = re.search(self.REGEX_TC_TAG, tag)
-                    if groups:
-                        tag_count += 1
-                        tag_tc = tag
-
-                if tag_count == 1:
-                    self._test_id = re.sub(
-                        self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
-                        self._test_id, count=1
-                    )
-                    test_result[u"name"] = re.sub(
-                        self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
-                        test_result["name"], count=1
-                    )
-                else:
-                    test_result[u"status"] = u"FAIL"
-                    self._data[u"tests"][self._test_id] = test_result
-                    logging.debug(
-                        f"The test {self._test_id} has no or more than one "
-                        f"multi-threading tags.\n"
-                        f"Tags: {test_result[u'tags']}"
-                    )
-                    return
+            tag_count = 0
+            tag_tc = str()
+            for tag in test_result[u"tags"]:
+                groups = re.search(self.REGEX_TC_TAG, tag)
+                if groups:
+                    tag_count += 1
+                    tag_tc = tag
+
+            if tag_count == 1:
+                self._test_id = re.sub(
+                    self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
+                    self._test_id, count=1
+                )
+                test_result[u"name"] = re.sub(
+                    self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
+                    test_result["name"], count=1
+                )
+            else:
+                test_result[u"status"] = u"FAIL"
+                self._data[u"tests"][self._test_id] = test_result
+                logging.debug(
+                    f"The test {self._test_id} has none or more than one "
+                    f"multi-threading tag.\n"
+                    f"Tags: {test_result[u'tags']}"
+                )
+                return
 
         if u"DEVICETEST" in tags:
             test_result[u"type"] = u"DEVICETEST"
@@ -1211,20 +1202,15 @@ class ExecutionChecker(ResultVisitor):
             if test.status == u"PASS":
                 test_result[u"throughput"], test_result[u"status"] = \
                     self._get_plr_throughput(test.message)
+        elif u"LDP_NGINX" in tags:
+            test_result[u"type"] = u"LDP_NGINX"
+            test_result[u"result"], test_result[u"status"] = \
+                self._get_vsap_data(test.message, tags)
         elif u"HOSTSTACK" in tags:
             test_result[u"type"] = u"HOSTSTACK"
             if test.status == u"PASS":
                 test_result[u"result"], test_result[u"status"] = \
                     self._get_hoststack_data(test.message, tags)
-        elif u"LDP_NGINX" in tags:
-            test_result[u"type"] = u"LDP_NGINX"
-            test_result[u"result"], test_result[u"status"] = \
-                self._get_vsap_data(test.message, tags)
-        # elif u"TCP" in tags:  # This might be not used
-        #     test_result[u"type"] = u"TCP"
-        #     if test.status == u"PASS":
-        #         groups = re.search(self.REGEX_TCP, test.message)
-        #         test_result[u"result"] = int(groups.group(2))
         elif u"RECONF" in tags:
             test_result[u"type"] = u"RECONF"
             if test.status == u"PASS":
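
Moving the LDP_NGINX branch above HOSTSTACK only matters if an LDP_NGINX test can also carry the HOSTSTACK tag; that overlap is an assumption inferred from the reordering, but the general rule holds: in an elif chain over overlapping tag sets, the more specific type must be tested first or its branch is unreachable.

```python
# Illustrative tag set; the HOSTSTACK/LDP_NGINX overlap is assumed.
tags = {"HOSTSTACK", "LDP_NGINX"}

if "LDP_NGINX" in tags:        # specific branch first
    test_type = "LDP_NGINX"
elif "HOSTSTACK" in tags:
    test_type = "HOSTSTACK"

assert test_type == "LDP_NGINX"
```
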
@@ -1294,7 +1280,7 @@ class ExecutionChecker(ResultVisitor):
         :type test_kw: Keyword
         :returns: Nothing.
         """
-        for keyword in test_kw.keywords:
+        for keyword in test_kw.body:
             if self.start_test_kw(keyword) is not False:
                 self.visit_test_kw(keyword)
                 self.end_test_kw(keyword)
@@ -1307,7 +1293,7 @@ class ExecutionChecker(ResultVisitor):
         :type test_kw: Keyword
         :returns: Nothing.
         """
-        if self._for_output == u"trending":
+        if not self._process_oper:
             return
 
         if test_kw.name.count(u"Run Telemetry On All Duts"):
@@ -1336,7 +1322,7 @@ class ExecutionChecker(ResultVisitor):
         :type setup_kw: Keyword
         :returns: Nothing.
         """
-        for keyword in setup_kw.keywords:
+        for keyword in setup_kw.body:
             if self.start_setup_kw(keyword) is not False:
                 self.visit_setup_kw(keyword)
                 self.end_setup_kw(keyword)
@@ -1355,9 +1341,6 @@ class ExecutionChecker(ResultVisitor):
         elif setup_kw.name.count(u"Install Dpdk Framework On All Duts") and \
                 not self._version:
             self._msg_type = u"dpdk-version"
-        elif setup_kw.name.count(u"Set Global Variable") \
-                and not self._timestamp:
-            self._msg_type = u"timestamp"
         elif setup_kw.name.count(u"Setup Framework") and not self._testbed:
             self._msg_type = u"testbed"
         else:
@@ -1380,7 +1363,7 @@ class ExecutionChecker(ResultVisitor):
         :type teardown_kw: Keyword
         :returns: Nothing.
         """
-        for keyword in teardown_kw.keywords:
+        for keyword in teardown_kw.body:
             if self.start_teardown_kw(keyword) is not False:
                 self.visit_teardown_kw(keyword)
                 self.end_teardown_kw(keyword)
@@ -1467,7 +1450,7 @@ class InputData:
         self._for_output = for_output
 
         # Data store:
-        self._input_data = pd.Series()
+        self._input_data = pd.Series(dtype="object")
 
     @property
     def data(self):
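
The pandas half of the update: constructing an empty Series without a dtype has emitted a DeprecationWarning since pandas 1.0 ("The default dtype for empty Series will be 'object' instead of 'float64' in a future version"), so every empty store below is now created with an explicit object dtype:

```python
import pandas as pd

store = pd.Series(dtype="object")              # no warning, explicit dtype
store["job-name"] = pd.Series(dtype="object")  # nested, label-indexed
store["job-name"]["42"] = {"metadata": {}, "suites": {}, "tests": {}}

print(store["job-name"]["42"]["tests"])
```
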
@@ -1539,11 +1522,30 @@ class InputData:
                     f"Error occurred while parsing output.xml: {repr(err)}"
                 )
                 return None
+
+        process_oper = False
+        if u"-vpp-perf-report-coverage-" in job:
+            process_oper = True
+        # elif u"-vpp-perf-report-iterative-" in job:
+        #     # Exceptions for TBs where we do not have coverage data:
+        #     for item in (u"-2n-icx", ):
+        #         if item in job:
+        #             process_oper = True
+        #             break
         checker = ExecutionChecker(
-            metadata, self._cfg.mapping, self._cfg.ignore, self._for_output
+            metadata, self._cfg.mapping, self._cfg.ignore, process_oper
         )
         result.visit(checker)
 
+        checker.data[u"metadata"][u"tests_total"] = \
+            result.statistics.total.all.total
+        checker.data[u"metadata"][u"tests_passed"] = \
+            result.statistics.total.all.passed
+        checker.data[u"metadata"][u"tests_failed"] = \
+            result.statistics.total.all.failed
+        checker.data[u"metadata"][u"elapsedtime"] = result.suite.elapsedtime
+        checker.data[u"metadata"][u"generated"] = result.suite.endtime[:14]
+
         return checker.data
 
     def _download_and_parse_build(self, job, build, repeat, pid=10000):
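
This hunk is why the _get_timestamp handler (and its "Set Global Variable" trigger, removed further down) could go: the totals, elapsed time and generation timestamp are now read directly off the parsed result. Standalone, the same reads look like this (path illustrative; attribute chain as used in the hunk above):

```python
from robot.api import ExecutionResult

result = ExecutionResult("output.xml")       # illustrative path
stats = result.statistics.total.all

print(stats.total, stats.passed, stats.failed)
print(result.suite.elapsedtime)              # milliseconds
print(result.suite.endtime[:14])             # "YYYYMMDD HH:MM"
```
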
@@ -1663,7 +1665,7 @@ class InputData:
                     })
 
                     if self._input_data.get(job, None) is None:
-                        self._input_data[job] = pd.Series()
+                        self._input_data[job] = pd.Series(dtype="object")
                     self._input_data[job][str(build_nr)] = build_data
                     self._cfg.set_input_file_name(
                         job, build_nr, result[u"build"][u"file-name"]
@@ -1742,7 +1744,7 @@ class InputData:
         })
 
         if self._input_data.get(job, None) is None:
-            self._input_data[job] = pd.Series()
+            self._input_data[job] = pd.Series(dtype="object")
         self._input_data[job][str(build_nr)] = build_data
 
         self._cfg.set_input_state(job, build_nr, u"processed")
@@ -1899,12 +1901,12 @@ class InputData:
                 params.extend((u"type", u"status"))
 
         data_to_filter = data if data else element[u"data"]
-        data = pd.Series()
+        data = pd.Series(dtype="object")
         try:
             for job, builds in data_to_filter.items():
-                data[job] = pd.Series()
+                data[job] = pd.Series(dtype="object")
                 for build in builds:
-                    data[job][str(build)] = pd.Series()
+                    data[job][str(build)] = pd.Series(dtype="object")
                     try:
                         data_dict = dict(
                             self.data[job][str(build)][data_set].items())
@@ -1915,7 +1917,8 @@ class InputData:
 
                     for test_id, test_data in data_dict.items():
                         if eval(cond, {u"tags": test_data.get(u"tags", u"")}):
-                            data[job][str(build)][test_id] = pd.Series()
+                            data[job][str(build)][test_id] = \
+                                pd.Series(dtype="object")
                             if params is None:
                                 for param, val in test_data.items():
                                     data[job][str(build)][test_id][param] = val
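
The filter itself is unchanged by this patch: the tag expression from the specification is evaluated as a Python expression with only tags in scope. A sketch (the condition string is illustrative):

```python
cond = "'PERFTEST' in tags and 'NDRPDR' in tags"
test_data = {"tags": ["PERFTEST", "NDRPDR", "2T1C"]}

if eval(cond, {"tags": test_data.get("tags", "")}):
    print("test selected")
```
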
@@ -1999,12 +2002,12 @@ class InputData:
         else:
             tests = include
 
-        data = pd.Series()
+        data = pd.Series(dtype="object")
         try:
             for job, builds in element[u"data"].items():
-                data[job] = pd.Series()
+                data[job] = pd.Series(dtype="object")
                 for build in builds:
-                    data[job][str(build)] = pd.Series()
+                    data[job][str(build)] = pd.Series(dtype="object")
                     for test in tests:
                         try:
                             reg_ex = re.compile(str(test).lower())
@@ -2013,7 +2016,8 @@ class InputData:
                                 if re.match(reg_ex, str(test_id).lower()):
                                     test_data = self.data[job][
                                         str(build)][data_set][test_id]
-                                    data[job][str(build)][test_id] = pd.Series()
+                                    data[job][str(build)][test_id] = \
+                                        pd.Series(dtype="object")
                                     if params is None:
                                         for param, val in test_data.items():
                                             data[job][str(build)][test_id]\
@@ -2068,7 +2072,7 @@ class InputData:
 
         logging.info(u"    Merging data ...")
 
-        merged_data = pd.Series()
+        merged_data = pd.Series(dtype="object")
         for builds in data.values:
             for item in builds.values:
                 for item_id, item_data in item.items():