Report: Add mrr stdev to comp tables

[csit.git] / resources / tools / presentation / input_data_parser.py
diff --git a/resources/tools/presentation/input_data_parser.py b/resources/tools/presentation/input_data_parser.py

index 5d9234e..987b996 100644 (file)
--- a/resources/tools/presentation/input_data_parser.py
+++ b/resources/tools/presentation/input_data_parser.py
@@ -25,10 +25,12 @@ import resource
  import logging
  
  from collections import OrderedDict
-from os import remove
+from os import remove, walk, listdir
+from os.path import isfile, isdir, join
  from datetime import datetime as dt
  from datetime import timedelta
  from json import loads
+from json.decoder import JSONDecodeError
  
  import hdrh.histogram
  import hdrh.codec
@@ -40,6 +42,7 @@ from robot import errors
  
  from resources.libraries.python import jumpavg
  from input_data_files import download_and_unzip_data_file
+from pal_errors import PresentationError
  
  
  # Separator used in file names
@@ -220,6 +223,8 @@ class ExecutionChecker(ResultVisitor):
          r'Latency at 50% PDR:.*\[\'(.*)\', \'(.*)\'\].*\n'
          r'Latency at 10% PDR:.*\[\'(.*)\', \'(.*)\'\].*\n'
      )
+    REGEX_MRR_MSG_INFO = re.compile(r'.*\[(.*)\]')
+
      # TODO: Remove when not needed
      REGEX_NDRPDR_LAT_BASE = re.compile(
          r'LATENCY.*\[\'(.*)\', \'(.*)\'\]\s\n.*\n.*\n'
@@ -355,15 +360,34 @@ class ExecutionChecker(ResultVisitor):
          """
          return self._data
  
+    def _get_data_from_mrr_test_msg(self, msg):
+        """Get info from message of MRR performance tests.
+
+        :param msg: Message to be processed.
+        :type msg: str
+        :returns: Processed message or original message if a problem occurs.
+        :rtype: str
+        """
+
+        groups = re.search(self.REGEX_MRR_MSG_INFO, msg)
+        if not groups or groups.lastindex != 1:
+            return u"Test Failed."
+
+        try:
+            data = groups.group(1).split(u", ")
+        except (AttributeError, IndexError, ValueError, KeyError):
+            return u"Test Failed."
+
+        out_str = u"["
+        try:
+            for item in data:
+                out_str += f"{(float(item) / 1e6):.2f}, "
+            return out_str[:-2] + u"]"
+        except (AttributeError, IndexError, ValueError, KeyError):
+            return u"Test Failed."
+
      def _get_data_from_perf_test_msg(self, msg):
-        """Get
-            - NDR_LOWER
-            - LATENCY
-            - NDR_UPPER
-            - PDR_LOWER
-            - LATENCY
-            - PDR_UPPER
-        from message of NDRPDR performance tests.
+        """Get info from message of NDRPDR performance tests.
  
          :param msg: Message to be processed.
          :type msg: str
@@ -373,7 +397,7 @@ class ExecutionChecker(ResultVisitor):
  
          groups = re.search(self.REGEX_PERF_MSG_INFO, msg)
          if not groups or groups.lastindex != 10:
-            return msg
+            return u"Test Failed."
  
          try:
              data = {
@@ -389,7 +413,7 @@ class ExecutionChecker(ResultVisitor):
                  u"pdr_lat_10_2": groups.group(10),
              }
          except (AttributeError, IndexError, ValueError, KeyError):
-            return msg
+            return u"Test Failed."
  
          def _process_lat(in_str_1, in_str_2):
              """Extract min, avg, max values from latency string.
@@ -400,65 +424,75 @@ class ExecutionChecker(ResultVisitor):
                  robot framework.
              :type in_str_1: str
              :type in_str_2: str
-            :returns: Processed latency string or empty string if a problem
-                occurs.
-            :rtype: tuple(str, str)
+            :returns: Processed latency string or None if a problem occurs.
+            :rtype: tuple
              """
              in_list_1 = in_str_1.split('/', 3)
              in_list_2 = in_str_2.split('/', 3)
  
              if len(in_list_1) != 4 and len(in_list_2) != 4:
-                return u""
+                return None
  
              in_list_1[3] += u"=" * (len(in_list_1[3]) % 4)
              try:
                  hdr_lat_1 = hdrh.histogram.HdrHistogram.decode(in_list_1[3])
              except hdrh.codec.HdrLengthException:
-                return u""
+                return None
  
              in_list_2[3] += u"=" * (len(in_list_2[3]) % 4)
              try:
                  hdr_lat_2 = hdrh.histogram.HdrHistogram.decode(in_list_2[3])
              except hdrh.codec.HdrLengthException:
-                return u""
+                return None
  
              if hdr_lat_1 and hdr_lat_2:
-                hdr_lat_1_50 = hdr_lat_1.get_value_at_percentile(50.0)
-                hdr_lat_1_90 = hdr_lat_1.get_value_at_percentile(90.0)
-                hdr_lat_1_99 = hdr_lat_1.get_value_at_percentile(99.0)
-                hdr_lat_2_50 = hdr_lat_2.get_value_at_percentile(50.0)
-                hdr_lat_2_90 = hdr_lat_2.get_value_at_percentile(90.0)
-                hdr_lat_2_99 = hdr_lat_2.get_value_at_percentile(99.0)
-
-                if (hdr_lat_1_50 + hdr_lat_1_90 + hdr_lat_1_99 +
-                        hdr_lat_2_50 + hdr_lat_2_90 + hdr_lat_2_99):
-                    return (
-                        f"{hdr_lat_1_50} {hdr_lat_1_90} {hdr_lat_1_99} , "
-                        f"{hdr_lat_2_50} {hdr_lat_2_90} {hdr_lat_2_99}"
-                    )
+                hdr_lat = (
+                    hdr_lat_1.get_value_at_percentile(50.0),
+                    hdr_lat_1.get_value_at_percentile(90.0),
+                    hdr_lat_1.get_value_at_percentile(99.0),
+                    hdr_lat_2.get_value_at_percentile(50.0),
+                    hdr_lat_2.get_value_at_percentile(90.0),
+                    hdr_lat_2.get_value_at_percentile(99.0)
+                )
  
-            return u""
+                if all(hdr_lat):
+                    return hdr_lat
+
+            return None
  
          try:
-            pdr_lat_10 = _process_lat(data[u'pdr_lat_10_1'],
-                                      data[u'pdr_lat_10_2'])
-            pdr_lat_50 = _process_lat(data[u'pdr_lat_50_1'],
-                                      data[u'pdr_lat_50_2'])
-            pdr_lat_90 = _process_lat(data[u'pdr_lat_90_1'],
-                                      data[u'pdr_lat_90_2'])
-            pdr_lat_10 = f"\n3. {pdr_lat_10}" if pdr_lat_10 else u""
-            pdr_lat_50 = f"\n4. {pdr_lat_50}" if pdr_lat_50 else u""
-            pdr_lat_90 = f"\n5. {pdr_lat_90}" if pdr_lat_90 else u""
-
-            return (
-                f"1. {(data[u'ndr_low'] / 1e6):.2f} {data[u'ndr_low_b']:.2f}"
-                f"\n2. {(data[u'pdr_low'] / 1e6):.2f} {data[u'pdr_low_b']:.2f}"
-                f"{pdr_lat_10}"
-                f"{pdr_lat_50}"
-                f"{pdr_lat_90}"
+            out_msg = (
+                f"1. {(data[u'ndr_low'] / 1e6):5.2f}      "
+                f"{data[u'ndr_low_b']:5.2f}"
+                f"\n2. {(data[u'pdr_low'] / 1e6):5.2f}      "
+                f"{data[u'pdr_low_b']:5.2f}"
+            )
+            latency = (
+                _process_lat(data[u'pdr_lat_10_1'], data[u'pdr_lat_10_2']),
+                _process_lat(data[u'pdr_lat_50_1'], data[u'pdr_lat_50_2']),
+                _process_lat(data[u'pdr_lat_90_1'], data[u'pdr_lat_90_2'])
              )
+            if all(latency):
+                max_len = len(str(max((max(item) for item in latency))))
+                max_len = 4 if max_len < 4 else max_len
+
+                for idx, lat in enumerate(latency):
+                    if not idx:
+                        out_msg += u"\n"
+                    out_msg += (
+                        f"\n{idx + 3}. "
+                        f"{lat[0]:{max_len}d} "
+                        f"{lat[1]:{max_len}d} "
+                        f"{lat[2]:{max_len}d}      "
+                        f"{lat[3]:{max_len}d} "
+                        f"{lat[4]:{max_len}d} "
+                        f"{lat[5]:{max_len}d} "
+                    )
+
+            return out_msg
+
          except (AttributeError, IndexError, ValueError, KeyError):
-            return msg
+            return u"Test Failed."
  
      def _get_testbed(self, msg):
          """Called when extraction of testbed IP is required.
@@ -840,6 +874,40 @@ class ExecutionChecker(ResultVisitor):
  
          return latency, u"FAIL"
  
+    @staticmethod
+    def _get_hoststack_data(msg, tags):
+        """Get data from the hoststack test message.
+
+        :param msg: The test message to be parsed.
+        :param tags: Test tags.
+        :type msg: str
+        :type tags: list
+        :returns: Parsed data as a JSON dict and the status (PASS/FAIL).
+        :rtype: tuple(dict, str)
+        """
+        result = dict()
+        status = u"FAIL"
+
+        msg = msg.replace(u"'", u'"').replace(u" ", u"")
+        if u"LDPRELOAD" in tags:
+            try:
+                result = loads(msg)
+                status = u"PASS"
+            except JSONDecodeError:
+                pass
+        elif u"VPPECHO" in tags:
+            try:
+                msg_lst = msg.replace(u"}{", u"} {").split(u" ")
+                result = dict(
+                    client=loads(msg_lst[0]),
+                    server=loads(msg_lst[1])
+                )
+                status = u"PASS"
+            except (JSONDecodeError, IndexError):
+                pass
+
+        return result, status
+
      def visit_suite(self, suite):
          """Implements traversing through the suite and its direct children.
  
@@ -947,13 +1015,24 @@ class ExecutionChecker(ResultVisitor):
              replace(u'\r', u'').\
              replace(u'[', u' |br| [').\
              replace(u' |br| [', u'[', 1)
-        test_result[u"msg"] = self._get_data_from_perf_test_msg(test.message).\
-            replace(u'\n', u' |br| ').\
-            replace(u'\r', u'').\
-            replace(u'"', u"'")
          test_result[u"type"] = u"FUNC"
          test_result[u"status"] = test.status
  
+        if test.status == u"PASS":
+            if u"NDRPDR" in tags:
+                test_result[u"msg"] = self._get_data_from_perf_test_msg(
+                    test.message).replace(u'\n', u' |br| ').\
+                    replace(u'\r', u'').replace(u'"', u"'")
+            elif u"MRR" in tags or u"FRMOBL" in tags or u"BMRR" in tags:
+                test_result[u"msg"] = self._get_data_from_mrr_test_msg(
+                    test.message).replace(u'\n', u' |br| ').\
+                    replace(u'\r', u'').replace(u'"', u"'")
+            else:
+                test_result[u"msg"] = test.message.replace(u'\n', u' |br| ').\
+                    replace(u'\r', u'').replace(u'"', u"'")
+        else:
+            test_result[u"msg"] = u"Test Failed."
+
          if u"PERFTEST" in tags:
              # Replace info about cores (e.g. -1c-) with the info about threads
              # and cores (e.g. -1t1c-) in the long test case names and in the
@@ -969,14 +1048,14 @@ class ExecutionChecker(ResultVisitor):
                          tag_tc = tag
  
                  if tag_count == 1:
-                    self._test_id = re.sub(self.REGEX_TC_NAME_NEW,
-                                           f"-{tag_tc.lower()}-",
-                                           self._test_id,
-                                           count=1)
-                    test_result[u"name"] = re.sub(self.REGEX_TC_NAME_NEW,
-                                                  f"-{tag_tc.lower()}-",
-                                                  test_result["name"],
-                                                  count=1)
+                    self._test_id = re.sub(
+                        self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
+                        self._test_id, count=1
+                    )
+                    test_result[u"name"] = re.sub(
+                        self.REGEX_TC_NAME_NEW, f"-{tag_tc.lower()}-",
+                        test_result["name"], count=1
+                    )
                  else:
                      test_result[u"status"] = u"FAIL"
                      self._data[u"tests"][self._test_id] = test_result
@@ -998,6 +1077,10 @@ class ExecutionChecker(ResultVisitor):
                  test_result[u"type"] = u"SOAK"
                  test_result[u"throughput"], test_result[u"status"] = \
                      self._get_plr_throughput(test.message)
+            elif u"HOSTSTACK" in tags:
+                test_result[u"type"] = u"HOSTSTACK"
+                test_result[u"result"], test_result[u"status"] = \
+                    self._get_hoststack_data(test.message, tags)
              elif u"TCP" in tags:
                  test_result[u"type"] = u"TCP"
                  groups = re.search(self.REGEX_TCP, test.message)
@@ -1017,6 +1100,7 @@ class ExecutionChecker(ResultVisitor):
                      # Use whole list in CSIT-1180.
                      stats = jumpavg.AvgStdevStats.for_runs(items_float)
                      test_result[u"result"][u"receive-rate"] = stats.avg
+                    test_result[u"result"][u"receive-stdev"] = stats.stdev
                  else:
                      groups = re.search(self.REGEX_MRR, test.message)
                      test_result[u"result"][u"receive-rate"] = \
@@ -1110,7 +1194,8 @@ class ExecutionChecker(ResultVisitor):
                  test_kw.name.count(u"Show Runtime Counters On All Duts"):
              self._msg_type = u"test-show-runtime"
              self._sh_run_counter += 1
-        elif test_kw.name.count(u"Install Dpdk Test") and not self._version:
+        elif test_kw.name.count(u"Install Dpdk Test On All Duts") and \
+                not self._version:
              self._msg_type = u"dpdk-version"
          else:
              return
@@ -1222,7 +1307,6 @@ class ExecutionChecker(ResultVisitor):
          :type msg: Message
          :returns: Nothing.
          """
-
          if self._msg_type:
              self.parse_msg[self._msg_type](msg)
  
@@ -1284,7 +1368,6 @@ class InputData:
          :returns: Metadata
          :rtype: pandas.Series
          """
-
          return self.data[job][build][u"metadata"]
  
      def suites(self, job, build):
@@ -1297,7 +1380,6 @@ class InputData:
          :returns: Suites.
          :rtype: pandas.Series
          """
-
          return self.data[job][str(build)][u"suites"]
  
      def tests(self, job, build):
@@ -1310,7 +1392,6 @@ class InputData:
          :returns: Tests.
          :rtype: pandas.Series
          """
-
          return self.data[job][build][u"tests"]
  
      def _parse_tests(self, job, build, log):
@@ -1494,6 +1575,122 @@ class InputData:
  
          logging.info(u"Done.")
  
+    def process_local_file(self, local_file, job=u"local", build_nr=1,
+                           replace=True):
+        """Process local XML file given as a command-line parameter.
+
+        :param local_file: The file to process.
+        :param job: Job name.
+        :param build_nr: Build number.
+        :param replace: If True, the information about jobs and builds is
+            replaced by the new one, otherwise the new jobs and builds are
+            added.
+        :type local_file: str
+        :type job: str
+        :type build_nr: int
+        :type replace: bool
+        :raises: PresentationError if an error occurs.
+        """
+        if not isfile(local_file):
+            raise PresentationError(f"The file {local_file} does not exist.")
+
+        build = {
+            u"build": build_nr,
+            u"status": u"failed",
+            u"file-name": local_file
+        }
+        if replace:
+            self._cfg.builds = dict()
+        self._cfg.add_build(job, build)
+
+        logging.info(f"Processing {job}: {build_nr:2d}: {local_file}")
+        data = self._parse_tests(job, build, list())
+        if data is None:
+            raise PresentationError(
+                f"Error occurred while parsing the file {local_file}"
+            )
+
+        build_data = pd.Series({
+            u"metadata": pd.Series(
+                list(data[u"metadata"].values()),
+                index=list(data[u"metadata"].keys())
+            ),
+            u"suites": pd.Series(
+                list(data[u"suites"].values()),
+                index=list(data[u"suites"].keys())
+            ),
+            u"tests": pd.Series(
+                list(data[u"tests"].values()),
+                index=list(data[u"tests"].keys())
+            )
+        })
+
+        if self._input_data.get(job, None) is None:
+            self._input_data[job] = pd.Series()
+        self._input_data[job][str(build_nr)] = build_data
+
+        self._cfg.set_input_state(job, build_nr, u"processed")
+
+    def process_local_directory(self, local_dir, replace=True):
+        """Process local directory with XML file(s). The directory is processed
+        as a 'job' and the XML files in it as builds.
+        If the given directory contains only sub-directories, these
+        sub-directories processed as jobs and corresponding XML files as builds
+        of their job.
+
+        :param local_dir: Local directory to process.
+        :param replace: If True, the information about jobs and builds is
+            replaced by the new one, otherwise the new jobs and builds are
+            added.
+        :type local_dir: str
+        :type replace: bool
+        """
+        if not isdir(local_dir):
+            raise PresentationError(
+                f"The directory {local_dir} does not exist."
+            )
+
+        # Check if the given directory includes only files, or only directories
+        _, dirnames, filenames = next(walk(local_dir))
+
+        if filenames and not dirnames:
+            filenames.sort()
+            # local_builds:
+            # key: dir (job) name, value: list of file names (builds)
+            local_builds = {
+                local_dir: [join(local_dir, name) for name in filenames]
+            }
+
+        elif dirnames and not filenames:
+            dirnames.sort()
+            # local_builds:
+            # key: dir (job) name, value: list of file names (builds)
+            local_builds = dict()
+            for dirname in dirnames:
+                builds = [
+                    join(local_dir, dirname, name)
+                    for name in listdir(join(local_dir, dirname))
+                    if isfile(join(local_dir, dirname, name))
+                ]
+                if builds:
+                    local_builds[dirname] = sorted(builds)
+
+        elif not filenames and not dirnames:
+            raise PresentationError(f"The directory {local_dir} is empty.")
+        else:
+            raise PresentationError(
+                f"The directory {local_dir} can include only files or only "
+                f"directories, not both.\nThe directory {local_dir} includes "
+                f"file(s):\n{filenames}\nand directories:\n{dirnames}"
+            )
+
+        if replace:
+            self._cfg.builds = dict()
+
+        for job, files in local_builds.items():
+            for idx, local_file in enumerate(files):
+                self.process_local_file(local_file, job, idx + 1, replace=False)
+
      @staticmethod
      def _end_of_tag(tag_filter, start=0, closer=u"'"):
          """Return the index of character in the string which is the end of tag.
@@ -1507,7 +1704,6 @@ class InputData:
          :returns: The index of the tag closer.
          :rtype: int
          """
-
          try:
              idx_opener = tag_filter.index(closer, start)
              return tag_filter.index(closer, idx_opener + 1)
@@ -1523,7 +1719,6 @@ class InputData:
          :returns: Conditional statement which can be evaluated.
          :rtype: str
          """
-
          index = 0
          while True:
              index = InputData._end_of_tag(tag_filter, index)
@@ -1537,7 +1732,6 @@ class InputData:
          """Filter required data from the given jobs and builds.
  
          The output data structure is:
-
          - job 1
            - build 1
              - test (or suite) 1 ID:
@@ -1640,7 +1834,6 @@ class InputData:
          """Filter required data from the given jobs and builds.
  
          The output data structure is:
-
          - job 1
            - build 1
              - test (or suite) 1 ID:
@@ -1754,7 +1947,6 @@ class InputData:
              for item in builds.values:
                  for item_id, item_data in item.items():
                      merged_data[item_id] = item_data
-
          return merged_data
  
      def print_all_oper_data(self):