resources/tools/presentation/generator_tables.py

   1 # Copyright (c) 2017 Cisco and/or its affiliates.
   2 # Licensed under the Apache License, Version 2.0 (the "License");
   3 # you may not use this file except in compliance with the License.
   4 # You may obtain a copy of the License at:
   5 #
   6 #     http://www.apache.org/licenses/LICENSE-2.0
   7 #
   8 # Unless required by applicable law or agreed to in writing, software
   9 # distributed under the License is distributed on an "AS IS" BASIS,
  10 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  11 # See the License for the specific language governing permissions and
  12 # limitations under the License.
  13
  14 """Algorithms to generate tables.
  15 """
  16
  17
  18 import logging
  19 import csv
  20 import prettytable
  21 import pandas as pd
  22
  23 from string import replace
  24 from math import isnan
  25 from xml.etree import ElementTree as ET
  26
  27 from errors import PresentationError
  28 from utils import mean, stdev, relative_change, remove_outliers, split_outliers
  29
  30
  31 def generate_tables(spec, data):
  32     """Generate all tables specified in the specification file.
  33
  34     :param spec: Specification read from the specification file.
  35     :param data: Data to process.
  36     :type spec: Specification
  37     :type data: InputData
  38     """
  39
  40     logging.info("Generating the tables ...")
  41     for table in spec.tables:
  42         try:
  43             eval(table["algorithm"])(table, data)
  44         except NameError:
  45             logging.error("The algorithm '{0}' is not defined.".
  46                           format(table["algorithm"]))
  47     logging.info("Done.")
  48
  49
  50 def table_details(table, input_data):
  51     """Generate the table(s) with algorithm: table_detailed_test_results
  52     specified in the specification file.
  53
  54     :param table: Table to generate.
  55     :param input_data: Data to process.
  56     :type table: pandas.Series
  57     :type input_data: InputData
  58     """
  59
  60     logging.info("  Generating the table {0} ...".
  61                  format(table.get("title", "")))
  62
  63     # Transform the data
  64     data = input_data.filter_data(table)
  65
  66     # Prepare the header of the tables
  67     header = list()
  68     for column in table["columns"]:
  69         header.append('"{0}"'.format(str(column["title"]).replace('"', '""')))
  70
  71     # Generate the data for the table according to the model in the table
  72     # specification
  73     job = table["data"].keys()[0]
  74     build = str(table["data"][job][0])
  75     try:
  76         suites = input_data.suites(job, build)
  77     except KeyError:
  78         logging.error("    No data available. The table will not be generated.")
  79         return
  80
  81     for suite_longname, suite in suites.iteritems():
  82         # Generate data
  83         suite_name = suite["name"]
  84         table_lst = list()
  85         for test in data[job][build].keys():
  86             if data[job][build][test]["parent"] in suite_name:
  87                 row_lst = list()
  88                 for column in table["columns"]:
  89                     try:
  90                         col_data = str(data[job][build][test][column["data"].
  91                                        split(" ")[1]]).replace('"', '""')
  92                         if column["data"].split(" ")[1] in ("vat-history",
  93                                                             "show-run"):
  94                             col_data = replace(col_data, " |br| ", "",
  95                                                maxreplace=1)
  96                             col_data = " |prein| {0} |preout| ".\
  97                                 format(col_data[:-5])
  98                         row_lst.append('"{0}"'.format(col_data))
  99                     except KeyError:
 100                         row_lst.append("No data")
 101                 table_lst.append(row_lst)
 102
 103         # Write the data to file
 104         if table_lst:
 105             file_name = "{0}_{1}{2}".format(table["output-file"], suite_name,
 106                                             table["output-file-ext"])
 107             logging.info("      Writing file: '{}'".format(file_name))
 108             with open(file_name, "w") as file_handler:
 109                 file_handler.write(",".join(header) + "\n")
 110                 for item in table_lst:
 111                     file_handler.write(",".join(item) + "\n")
 112
 113     logging.info("  Done.")
 114
 115
 116 def table_merged_details(table, input_data):
 117     """Generate the table(s) with algorithm: table_merged_details
 118     specified in the specification file.
 119
 120     :param table: Table to generate.
 121     :param input_data: Data to process.
 122     :type table: pandas.Series
 123     :type input_data: InputData
 124     """
 125
 126     logging.info("  Generating the table {0} ...".
 127                  format(table.get("title", "")))
 128
 129     # Transform the data
 130     data = input_data.filter_data(table)
 131     data = input_data.merge_data(data)
 132     data.sort_index(inplace=True)
 133
 134     suites = input_data.filter_data(table, data_set="suites")
 135     suites = input_data.merge_data(suites)
 136
 137     # Prepare the header of the tables
 138     header = list()
 139     for column in table["columns"]:
 140         header.append('"{0}"'.format(str(column["title"]).replace('"', '""')))
 141
 142     for _, suite in suites.iteritems():
 143         # Generate data
 144         suite_name = suite["name"]
 145         table_lst = list()
 146         for test in data.keys():
 147             if data[test]["parent"] in suite_name:
 148                 row_lst = list()
 149                 for column in table["columns"]:
 150                     try:
 151                         col_data = str(data[test][column["data"].
 152                                        split(" ")[1]]).replace('"', '""')
 153                         if column["data"].split(" ")[1] in ("vat-history",
 154                                                             "show-run"):
 155                             col_data = replace(col_data, " |br| ", "",
 156                                                maxreplace=1)
 157                             col_data = " |prein| {0} |preout| ".\
 158                                 format(col_data[:-5])
 159                         row_lst.append('"{0}"'.format(col_data))
 160                     except KeyError:
 161                         row_lst.append("No data")
 162                 table_lst.append(row_lst)
 163
 164         # Write the data to file
 165         if table_lst:
 166             file_name = "{0}_{1}{2}".format(table["output-file"], suite_name,
 167                                             table["output-file-ext"])
 168             logging.info("      Writing file: '{}'".format(file_name))
 169             with open(file_name, "w") as file_handler:
 170                 file_handler.write(",".join(header) + "\n")
 171                 for item in table_lst:
 172                     file_handler.write(",".join(item) + "\n")
 173
 174     logging.info("  Done.")
 175
 176
 177 def table_performance_improvements(table, input_data):
 178     """Generate the table(s) with algorithm: table_performance_improvements
 179     specified in the specification file.
 180
 181     :param table: Table to generate.
 182     :param input_data: Data to process.
 183     :type table: pandas.Series
 184     :type input_data: InputData
 185     """
 186
 187     def _write_line_to_file(file_handler, data):
 188         """Write a line to the .csv file.
 189
 190         :param file_handler: File handler for the csv file. It must be open for
 191          writing text.
 192         :param data: Item to be written to the file.
 193         :type file_handler: BinaryIO
 194         :type data: list
 195         """
 196
 197         line_lst = list()
 198         for item in data:
 199             if isinstance(item["data"], str):
 200                 # Remove -?drdisc from the end
 201                 if item["data"].endswith("drdisc"):
 202                     item["data"] = item["data"][:-8]
 203                 line_lst.append(item["data"])
 204             elif isinstance(item["data"], float):
 205                 line_lst.append("{:.1f}".format(item["data"]))
 206             elif item["data"] is None:
 207                 line_lst.append("")
 208         file_handler.write(",".join(line_lst) + "\n")
 209
 210     logging.info("  Generating the table {0} ...".
 211                  format(table.get("title", "")))
 212
 213     # Read the template
 214     file_name = table.get("template", None)
 215     if file_name:
 216         try:
 217             tmpl = _read_csv_template(file_name)
 218         except PresentationError:
 219             logging.error("  The template '{0}' does not exist. Skipping the "
 220                           "table.".format(file_name))
 221             return None
 222     else:
 223         logging.error("The template is not defined. Skipping the table.")
 224         return None
 225
 226     # Transform the data
 227     data = input_data.filter_data(table)
 228
 229     # Prepare the header of the tables
 230     header = list()
 231     for column in table["columns"]:
 232         header.append(column["title"])
 233
 234     # Generate the data for the table according to the model in the table
 235     # specification
 236     tbl_lst = list()
 237     for tmpl_item in tmpl:
 238         tbl_item = list()
 239         for column in table["columns"]:
 240             cmd = column["data"].split(" ")[0]
 241             args = column["data"].split(" ")[1:]
 242             if cmd == "template":
 243                 try:
 244                     val = float(tmpl_item[int(args[0])])
 245                 except ValueError:
 246                     val = tmpl_item[int(args[0])]
 247                 tbl_item.append({"data": val})
 248             elif cmd == "data":
 249                 jobs = args[0:-1]
 250                 operation = args[-1]
 251                 data_lst = list()
 252                 for job in jobs:
 253                     for build in data[job]:
 254                         try:
 255                             data_lst.append(float(build[tmpl_item[0]]
 256                                                   ["throughput"]["value"]))
 257                         except (KeyError, TypeError):
 258                             # No data, ignore
 259                             continue
 260                 if data_lst:
 261                     tbl_item.append({"data": (eval(operation)(data_lst)) /
 262                                              1000000})
 263                 else:
 264                     tbl_item.append({"data": None})
 265             elif cmd == "operation":
 266                 operation = args[0]
 267                 try:
 268                     nr1 = float(tbl_item[int(args[1])]["data"])
 269                     nr2 = float(tbl_item[int(args[2])]["data"])
 270                     if nr1 and nr2:
 271                         tbl_item.append({"data": eval(operation)(nr1, nr2)})
 272                     else:
 273                         tbl_item.append({"data": None})
 274                 except (IndexError, ValueError, TypeError):
 275                     logging.error("No data for {0}".format(tbl_item[0]["data"]))
 276                     tbl_item.append({"data": None})
 277                     continue
 278             else:
 279                 logging.error("Not supported command {0}. Skipping the table.".
 280                               format(cmd))
 281                 return None
 282         tbl_lst.append(tbl_item)
 283
 284     # Sort the table according to the relative change
 285     tbl_lst.sort(key=lambda rel: rel[-1]["data"], reverse=True)
 286
 287     # Create the tables and write them to the files
 288     file_names = [
 289         "{0}_ndr_top{1}".format(table["output-file"], table["output-file-ext"]),
 290         "{0}_pdr_top{1}".format(table["output-file"], table["output-file-ext"]),
 291         "{0}_ndr_low{1}".format(table["output-file"], table["output-file-ext"]),
 292         "{0}_pdr_low{1}".format(table["output-file"], table["output-file-ext"])
 293     ]
 294
 295     for file_name in file_names:
 296         logging.info("    Writing the file '{0}'".format(file_name))
 297         with open(file_name, "w") as file_handler:
 298             file_handler.write(",".join(header) + "\n")
 299             for item in tbl_lst:
 300                 if isinstance(item[-1]["data"], float):
 301                     rel_change = round(item[-1]["data"], 1)
 302                 else:
 303                     rel_change = item[-1]["data"]
 304                 if "ndr_top" in file_name \
 305                         and "ndr" in item[0]["data"] \
 306                         and rel_change >= 10.0:
 307                     _write_line_to_file(file_handler, item)
 308                 elif "pdr_top" in file_name \
 309                         and "pdr" in item[0]["data"] \
 310                         and rel_change >= 10.0:
 311                     _write_line_to_file(file_handler, item)
 312                 elif "ndr_low" in file_name \
 313                         and "ndr" in item[0]["data"] \
 314                         and rel_change < 10.0:
 315                     _write_line_to_file(file_handler, item)
 316                 elif "pdr_low" in file_name \
 317                         and "pdr" in item[0]["data"] \
 318                         and rel_change < 10.0:
 319                     _write_line_to_file(file_handler, item)
 320
 321     logging.info("  Done.")
 322
 323
 324 def _read_csv_template(file_name):
 325     """Read the template from a .csv file.
 326
 327     :param file_name: Name / full path / relative path of the file to read.
 328     :type file_name: str
 329     :returns: Data from the template as list (lines) of lists (items on line).
 330     :rtype: list
 331     :raises: PresentationError if it is not possible to read the file.
 332     """
 333
 334     try:
 335         with open(file_name, 'r') as csv_file:
 336             tmpl_data = list()
 337             for line in csv_file:
 338                 tmpl_data.append(line[:-1].split(","))
 339         return tmpl_data
 340     except IOError as err:
 341         raise PresentationError(str(err), level="ERROR")
 342
 343
 344 def table_performance_comparison(table, input_data):
 345     """Generate the table(s) with algorithm: table_performance_comparison
 346     specified in the specification file.
 347
 348     :param table: Table to generate.
 349     :param input_data: Data to process.
 350     :type table: pandas.Series
 351     :type input_data: InputData
 352     """
 353
 354     logging.info("  Generating the table {0} ...".
 355                  format(table.get("title", "")))
 356
 357     # Transform the data
 358     data = input_data.filter_data(table, continue_on_error=True)
 359
 360     # Prepare the header of the tables
 361     try:
 362         header = ["Test case",
 363                   "{0} Throughput [Mpps]".format(table["reference"]["title"]),
 364                   "{0} stdev [Mpps]".format(table["reference"]["title"]),
 365                   "{0} Throughput [Mpps]".format(table["compare"]["title"]),
 366                   "{0} stdev [Mpps]".format(table["compare"]["title"]),
 367                   "Change [%]"]
 368         header_str = ",".join(header) + "\n"
 369     except (AttributeError, KeyError) as err:
 370         logging.error("The model is invalid, missing parameter: {0}".
 371                       format(err))
 372         return
 373
 374     # Prepare data to the table:
 375     tbl_dict = dict()
 376     for job, builds in table["reference"]["data"].items():
 377         for build in builds:
 378             for tst_name, tst_data in data[job][str(build)].iteritems():
 379                 if tbl_dict.get(tst_name, None) is None:
 380                     name = "{0}-{1}".format(tst_data["parent"].split("-")[0],
 381                                             "-".join(tst_data["name"].
 382                                                      split("-")[1:]))
 383                     tbl_dict[tst_name] = {"name": name,
 384                                           "ref-data": list(),
 385                                           "cmp-data": list()}
 386                 try:
 387                     tbl_dict[tst_name]["ref-data"].\
 388                         append(tst_data["throughput"]["value"])
 389                 except TypeError:
 390                     pass  # No data in output.xml for this test
 391
 392     for job, builds in table["compare"]["data"].items():
 393         for build in builds:
 394             for tst_name, tst_data in data[job][str(build)].iteritems():
 395                 try:
 396                     tbl_dict[tst_name]["cmp-data"].\
 397                         append(tst_data["throughput"]["value"])
 398                 except KeyError:
 399                     pass
 400                 except TypeError:
 401                     tbl_dict.pop(tst_name, None)
 402
 403     tbl_lst = list()
 404     for tst_name in tbl_dict.keys():
 405         item = [tbl_dict[tst_name]["name"], ]
 406         if tbl_dict[tst_name]["ref-data"]:
 407             data_t = remove_outliers(tbl_dict[tst_name]["ref-data"],
 408                                      outlier_const=table["outlier-const"])
 409             # TODO: Specify window size.
 410             if data_t:
 411                 item.append(round(mean(data_t) / 1000000, 2))
 412                 item.append(round(stdev(data_t) / 1000000, 2))
 413             else:
 414                 item.extend([None, None])
 415         else:
 416             item.extend([None, None])
 417         if tbl_dict[tst_name]["cmp-data"]:
 418             data_t = remove_outliers(tbl_dict[tst_name]["cmp-data"],
 419                                      outlier_const=table["outlier-const"])
 420             # TODO: Specify window size.
 421             if data_t:
 422                 item.append(round(mean(data_t) / 1000000, 2))
 423                 item.append(round(stdev(data_t) / 1000000, 2))
 424             else:
 425                 item.extend([None, None])
 426         else:
 427             item.extend([None, None])
 428         if item[1] is not None and item[3] is not None:
 429             item.append(int(relative_change(float(item[1]), float(item[3]))))
 430         if len(item) == 6:
 431             tbl_lst.append(item)
 432
 433     # Sort the table according to the relative change
 434     tbl_lst.sort(key=lambda rel: rel[-1], reverse=True)
 435
 436     # Generate tables:
 437     # All tests in csv:
 438     tbl_names = ["{0}-ndr-1t1c-full{1}".format(table["output-file"],
 439                                                table["output-file-ext"]),
 440                  "{0}-ndr-2t2c-full{1}".format(table["output-file"],
 441                                                table["output-file-ext"]),
 442                  "{0}-ndr-4t4c-full{1}".format(table["output-file"],
 443                                                table["output-file-ext"]),
 444                  "{0}-pdr-1t1c-full{1}".format(table["output-file"],
 445                                                table["output-file-ext"]),
 446                  "{0}-pdr-2t2c-full{1}".format(table["output-file"],
 447                                                table["output-file-ext"]),
 448                  "{0}-pdr-4t4c-full{1}".format(table["output-file"],
 449                                                table["output-file-ext"])
 450                  ]
 451     for file_name in tbl_names:
 452         logging.info("      Writing file: '{0}'".format(file_name))
 453         with open(file_name, "w") as file_handler:
 454             file_handler.write(header_str)
 455             for test in tbl_lst:
 456                 if (file_name.split("-")[-3] in test[0] and    # NDR vs PDR
 457                         file_name.split("-")[-2] in test[0]):  # cores
 458                     test[0] = "-".join(test[0].split("-")[:-1])
 459                     file_handler.write(",".join([str(item) for item in test]) +
 460                                        "\n")
 461
 462     # All tests in txt:
 463     tbl_names_txt = ["{0}-ndr-1t1c-full.txt".format(table["output-file"]),
 464                      "{0}-ndr-2t2c-full.txt".format(table["output-file"]),
 465                      "{0}-ndr-4t4c-full.txt".format(table["output-file"]),
 466                      "{0}-pdr-1t1c-full.txt".format(table["output-file"]),
 467                      "{0}-pdr-2t2c-full.txt".format(table["output-file"]),
 468                      "{0}-pdr-4t4c-full.txt".format(table["output-file"])
 469                      ]
 470
 471     for i, txt_name in enumerate(tbl_names_txt):
 472         txt_table = None
 473         logging.info("      Writing file: '{0}'".format(txt_name))
 474         with open(tbl_names[i], 'rb') as csv_file:
 475             csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
 476             for row in csv_content:
 477                 if txt_table is None:
 478                     txt_table = prettytable.PrettyTable(row)
 479                 else:
 480                     txt_table.add_row(row)
 481             txt_table.align["Test case"] = "l"
 482         with open(txt_name, "w") as txt_file:
 483             txt_file.write(str(txt_table))
 484
 485     # Selected tests in csv:
 486     input_file = "{0}-ndr-1t1c-full{1}".format(table["output-file"],
 487                                                table["output-file-ext"])
 488     with open(input_file, "r") as in_file:
 489         lines = list()
 490         for line in in_file:
 491             lines.append(line)
 492
 493     output_file = "{0}-ndr-1t1c-top{1}".format(table["output-file"],
 494                                                table["output-file-ext"])
 495     logging.info("      Writing file: '{0}'".format(output_file))
 496     with open(output_file, "w") as out_file:
 497         out_file.write(header_str)
 498         for i, line in enumerate(lines[1:]):
 499             if i == table["nr-of-tests-shown"]:
 500                 break
 501             out_file.write(line)
 502
 503     output_file = "{0}-ndr-1t1c-bottom{1}".format(table["output-file"],
 504                                                   table["output-file-ext"])
 505     logging.info("      Writing file: '{0}'".format(output_file))
 506     with open(output_file, "w") as out_file:
 507         out_file.write(header_str)
 508         for i, line in enumerate(lines[-1:0:-1]):
 509             if i == table["nr-of-tests-shown"]:
 510                 break
 511             out_file.write(line)
 512
 513     input_file = "{0}-pdr-1t1c-full{1}".format(table["output-file"],
 514                                                table["output-file-ext"])
 515     with open(input_file, "r") as in_file:
 516         lines = list()
 517         for line in in_file:
 518             lines.append(line)
 519
 520     output_file = "{0}-pdr-1t1c-top{1}".format(table["output-file"],
 521                                                table["output-file-ext"])
 522     logging.info("      Writing file: '{0}'".format(output_file))
 523     with open(output_file, "w") as out_file:
 524         out_file.write(header_str)
 525         for i, line in enumerate(lines[1:]):
 526             if i == table["nr-of-tests-shown"]:
 527                 break
 528             out_file.write(line)
 529
 530     output_file = "{0}-pdr-1t1c-bottom{1}".format(table["output-file"],
 531                                                   table["output-file-ext"])
 532     logging.info("      Writing file: '{0}'".format(output_file))
 533     with open(output_file, "w") as out_file:
 534         out_file.write(header_str)
 535         for i, line in enumerate(lines[-1:0:-1]):
 536             if i == table["nr-of-tests-shown"]:
 537                 break
 538             out_file.write(line)
 539
 540
 541 def table_performance_comparison_mrr(table, input_data):
 542     """Generate the table(s) with algorithm: table_performance_comparison_mrr
 543     specified in the specification file.
 544
 545     :param table: Table to generate.
 546     :param input_data: Data to process.
 547     :type table: pandas.Series
 548     :type input_data: InputData
 549     """
 550
 551     logging.info("  Generating the table {0} ...".
 552                  format(table.get("title", "")))
 553
 554     # Transform the data
 555     data = input_data.filter_data(table, continue_on_error=True)
 556
 557     # Prepare the header of the tables
 558     try:
 559         header = ["Test case",
 560                   "{0} Throughput [Mpps]".format(table["reference"]["title"]),
 561                   "{0} stdev [Mpps]".format(table["reference"]["title"]),
 562                   "{0} Throughput [Mpps]".format(table["compare"]["title"]),
 563                   "{0} stdev [Mpps]".format(table["compare"]["title"]),
 564                   "Change [%]"]
 565         header_str = ",".join(header) + "\n"
 566     except (AttributeError, KeyError) as err:
 567         logging.error("The model is invalid, missing parameter: {0}".
 568                       format(err))
 569         return
 570
 571     # Prepare data to the table:
 572     tbl_dict = dict()
 573     for job, builds in table["reference"]["data"].items():
 574         for build in builds:
 575             for tst_name, tst_data in data[job][str(build)].iteritems():
 576                 if tbl_dict.get(tst_name, None) is None:
 577                     name = "{0}-{1}".format(tst_data["parent"].split("-")[0],
 578                                             "-".join(tst_data["name"].
 579                                                      split("-")[1:]))
 580                     tbl_dict[tst_name] = {"name": name,
 581                                           "ref-data": list(),
 582                                           "cmp-data": list()}
 583                 try:
 584                     tbl_dict[tst_name]["ref-data"].\
 585                         append(tst_data["result"]["throughput"])
 586                 except TypeError:
 587                     pass  # No data in output.xml for this test
 588
 589     for job, builds in table["compare"]["data"].items():
 590         for build in builds:
 591             for tst_name, tst_data in data[job][str(build)].iteritems():
 592                 try:
 593                     tbl_dict[tst_name]["cmp-data"].\
 594                         append(tst_data["result"]["throughput"])
 595                 except KeyError:
 596                     pass
 597                 except TypeError:
 598                     tbl_dict.pop(tst_name, None)
 599
 600     tbl_lst = list()
 601     for tst_name in tbl_dict.keys():
 602         item = [tbl_dict[tst_name]["name"], ]
 603         if tbl_dict[tst_name]["ref-data"]:
 604             data_t = remove_outliers(tbl_dict[tst_name]["ref-data"],
 605                                      outlier_const=table["outlier-const"])
 606             # TODO: Specify window size.
 607             if data_t:
 608                 item.append(round(mean(data_t) / 1000000, 2))
 609                 item.append(round(stdev(data_t) / 1000000, 2))
 610             else:
 611                 item.extend([None, None])
 612         else:
 613             item.extend([None, None])
 614         if tbl_dict[tst_name]["cmp-data"]:
 615             data_t = remove_outliers(tbl_dict[tst_name]["cmp-data"],
 616                                      outlier_const=table["outlier-const"])
 617             # TODO: Specify window size.
 618             if data_t:
 619                 item.append(round(mean(data_t) / 1000000, 2))
 620                 item.append(round(stdev(data_t) / 1000000, 2))
 621             else:
 622                 item.extend([None, None])
 623         else:
 624             item.extend([None, None])
 625         if item[1] is not None and item[3] is not None and item[1] != 0:
 626             item.append(int(relative_change(float(item[1]), float(item[3]))))
 627         if len(item) == 6:
 628             tbl_lst.append(item)
 629
 630     # Sort the table according to the relative change
 631     tbl_lst.sort(key=lambda rel: rel[-1], reverse=True)
 632
 633     # Generate tables:
 634     # All tests in csv:
 635     tbl_names = ["{0}-1t1c-full{1}".format(table["output-file"],
 636                                            table["output-file-ext"]),
 637                  "{0}-2t2c-full{1}".format(table["output-file"],
 638                                            table["output-file-ext"]),
 639                  "{0}-4t4c-full{1}".format(table["output-file"],
 640                                            table["output-file-ext"])
 641                  ]
 642     for file_name in tbl_names:
 643         logging.info("      Writing file: '{0}'".format(file_name))
 644         with open(file_name, "w") as file_handler:
 645             file_handler.write(header_str)
 646             for test in tbl_lst:
 647                 if file_name.split("-")[-2] in test[0]:  # cores
 648                     test[0] = "-".join(test[0].split("-")[:-1])
 649                     file_handler.write(",".join([str(item) for item in test]) +
 650                                        "\n")
 651
 652     # All tests in txt:
 653     tbl_names_txt = ["{0}-1t1c-full.txt".format(table["output-file"]),
 654                      "{0}-2t2c-full.txt".format(table["output-file"]),
 655                      "{0}-4t4c-full.txt".format(table["output-file"])
 656                      ]
 657
 658     for i, txt_name in enumerate(tbl_names_txt):
 659         txt_table = None
 660         logging.info("      Writing file: '{0}'".format(txt_name))
 661         with open(tbl_names[i], 'rb') as csv_file:
 662             csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
 663             for row in csv_content:
 664                 if txt_table is None:
 665                     txt_table = prettytable.PrettyTable(row)
 666                 else:
 667                     txt_table.add_row(row)
 668             txt_table.align["Test case"] = "l"
 669         with open(txt_name, "w") as txt_file:
 670             txt_file.write(str(txt_table))
 671
 672
 673 def table_performance_trending_dashboard(table, input_data):
 674     """Generate the table(s) with algorithm: table_performance_comparison
 675     specified in the specification file.
 676
 677     :param table: Table to generate.
 678     :param input_data: Data to process.
 679     :type table: pandas.Series
 680     :type input_data: InputData
 681     """
 682
 683     logging.info("  Generating the table {0} ...".
 684                  format(table.get("title", "")))
 685
 686     # Transform the data
 687     data = input_data.filter_data(table, continue_on_error=True)
 688
 689     # Prepare the header of the tables
 690     header = ["Test Case",
 691               "Throughput Trend [Mpps]",
 692               "Long Trend Compliance",
 693               "Trend Compliance",
 694               "Top Anomaly [Mpps]",
 695               "Change [%]",
 696               "Outliers [Number]"
 697               ]
 698     header_str = ",".join(header) + "\n"
 699
 700     # Prepare data to the table:
 701     tbl_dict = dict()
 702     for job, builds in table["data"].items():
 703         for build in builds:
 704             for tst_name, tst_data in data[job][str(build)].iteritems():
 705                 if tbl_dict.get(tst_name, None) is None:
 706                     name = "{0}-{1}".format(tst_data["parent"].split("-")[0],
 707                                             "-".join(tst_data["name"].
 708                                                      split("-")[1:]))
 709                     tbl_dict[tst_name] = {"name": name,
 710                                           "data": dict()}
 711                 try:
 712                     tbl_dict[tst_name]["data"][str(build)] =  \
 713                         tst_data["result"]["throughput"]
 714                 except (TypeError, KeyError):
 715                     pass  # No data in output.xml for this test
 716
 717     tbl_lst = list()
 718     for tst_name in tbl_dict.keys():
 719         if len(tbl_dict[tst_name]["data"]) > 2:
 720
 721             pd_data = pd.Series(tbl_dict[tst_name]["data"])
 722             win_size = min(pd_data.size, table["window"])
 723             # Test name:
 724             name = tbl_dict[tst_name]["name"]
 725
 726             median = pd_data.rolling(window=win_size, min_periods=2).median()
 727             median_idx = pd_data.size - table["long-trend-window"]
 728             median_idx = 0 if median_idx < 0 else median_idx
 729             max_median = max(median.values[median_idx:])
 730             trimmed_data, _ = split_outliers(pd_data, outlier_const=1.5,
 731                                              window=win_size)
 732             stdev_t = pd_data.rolling(window=win_size, min_periods=2).std()
 733
 734             rel_change_lst = [None, ]
 735             classification_lst = [None, ]
 736             median_lst = [None, ]
 737             sample_lst = [None, ]
 738             first = True
 739             for build_nr, value in pd_data.iteritems():
 740                 if first:
 741                     first = False
 742                     continue
 743                 # Relative changes list:
 744                 if not isnan(value) \
 745                         and not isnan(median[build_nr]) \
 746                         and median[build_nr] != 0:
 747                     rel_change_lst.append(round(
 748                         relative_change(float(median[build_nr]), float(value)),
 749                         2))
 750                 else:
 751                     rel_change_lst.append(None)
 752
 753                 # Classification list:
 754                 if isnan(trimmed_data[build_nr]) \
 755                         or isnan(median[build_nr]) \
 756                         or isnan(stdev_t[build_nr]) \
 757                         or isnan(value):
 758                     classification_lst.append("outlier")
 759                 elif value < (median[build_nr] - 3 * stdev_t[build_nr]):
 760                     classification_lst.append("regression")
 761                 elif value > (median[build_nr] + 3 * stdev_t[build_nr]):
 762                     classification_lst.append("progression")
 763                 else:
 764                     classification_lst.append("normal")
 765                 sample_lst.append(value)
 766                 median_lst.append(median[build_nr])
 767
 768             last_idx = len(classification_lst) - 1
 769             first_idx = last_idx - int(table["evaluated-window"])
 770             if first_idx < 0:
 771                 first_idx = 0
 772
 773             nr_outliers = 0
 774             consecutive_outliers = 0
 775             failure = False
 776             for item in classification_lst[first_idx:]:
 777                 if item == "outlier":
 778                     nr_outliers += 1
 779                     consecutive_outliers += 1
 780                     if consecutive_outliers == 3:
 781                         failure = True
 782                 else:
 783                     consecutive_outliers = 0
 784
 785             if failure:
 786                 classification = "failure"
 787             elif "regression" in classification_lst[first_idx:]:
 788                 classification = "regression"
 789             elif "progression" in classification_lst[first_idx:]:
 790                 classification = "progression"
 791             else:
 792                 classification = "normal"
 793
 794             if classification == "normal":
 795                 index = len(classification_lst) - 1
 796             else:
 797                 tmp_classification = "outlier" if classification == "failure" \
 798                     else classification
 799                 index = None
 800                 for idx in range(first_idx, len(classification_lst)):
 801                     if classification_lst[idx] == tmp_classification:
 802                         if rel_change_lst[idx]:
 803                             index = idx
 804                             break
 805                 if index is None:
 806                     continue
 807                 for idx in range(index+1, len(classification_lst)):
 808                     if classification_lst[idx] == tmp_classification:
 809                         if rel_change_lst[idx]:
 810                             if (abs(rel_change_lst[idx]) >
 811                                     abs(rel_change_lst[index])):
 812                                 index = idx
 813
 814             logging.info("{}".format(name))
 815             logging.info("sample_lst: {} - {}".format(len(sample_lst), sample_lst))
 816             logging.info("median_lst: {} - {}".format(len(median_lst), median_lst))
 817             logging.info("rel_change: {} - {}".format(len(rel_change_lst), rel_change_lst))
 818             logging.info("classn_lst: {} - {}".format(len(classification_lst), classification_lst))
 819             logging.info("index:      {}".format(index))
 820             logging.info("classifica: {}".format(classification))
 821
 822             try:
 823                 trend = round(float(median_lst[-1]) / 1000000, 2) \
 824                     if not isnan(median_lst[-1]) else '-'
 825                 sample = round(float(sample_lst[index]) / 1000000, 2) \
 826                     if not isnan(sample_lst[index]) else '-'
 827                 rel_change = rel_change_lst[index] \
 828                     if rel_change_lst[index] is not None else '-'
 829                 if not isnan(max_median):
 830                     if not isnan(sample_lst[index]):
 831                         long_trend_threshold = max_median * \
 832                                                (table["long-trend-threshold"] / 100)
 833                         if sample_lst[index] < long_trend_threshold:
 834                             long_trend_classification = "failure"
 835                         else:
 836                             long_trend_classification = '-'
 837                     else:
 838                         long_trend_classification = "failure"
 839                 else:
 840                     long_trend_classification = '-'
 841                 tbl_lst.append([name,
 842                                 trend,
 843                                 long_trend_classification,
 844                                 classification,
 845                                 '-' if classification == "normal" else sample,
 846                                 '-' if classification == "normal" else rel_change,
 847                                 nr_outliers])
 848             except IndexError as err:
 849                 logging.error("{}".format(err))
 850                 continue
 851
 852     # Sort the table according to the classification
 853     tbl_sorted = list()
 854     for long_trend_class in ("failure", '-'):
 855         tbl_long = [item for item in tbl_lst if item[2] == long_trend_class]
 856         for classification in \
 857                 ("failure", "regression", "progression", "normal"):
 858             tbl_tmp = [item for item in tbl_long if item[3] == classification]
 859             tbl_tmp.sort(key=lambda rel: rel[0])
 860             tbl_sorted.extend(tbl_tmp)
 861
 862     file_name = "{0}{1}".format(table["output-file"], table["output-file-ext"])
 863
 864     logging.info("      Writing file: '{0}'".format(file_name))
 865     with open(file_name, "w") as file_handler:
 866         file_handler.write(header_str)
 867         for test in tbl_sorted:
 868             file_handler.write(",".join([str(item) for item in test]) + '\n')
 869
 870     txt_file_name = "{0}.txt".format(table["output-file"])
 871     txt_table = None
 872     logging.info("      Writing file: '{0}'".format(txt_file_name))
 873     with open(file_name, 'rb') as csv_file:
 874         csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
 875         for row in csv_content:
 876             if txt_table is None:
 877                 txt_table = prettytable.PrettyTable(row)
 878             else:
 879                 txt_table.add_row(row)
 880         txt_table.align["Test case"] = "l"
 881     with open(txt_file_name, "w") as txt_file:
 882         txt_file.write(str(txt_table))
 883
 884
 885 def table_performance_trending_dashboard_html(table, input_data):
 886     """Generate the table(s) with algorithm:
 887     table_performance_trending_dashboard_html specified in the specification
 888     file.
 889
 890     :param table: Table to generate.
 891     :param input_data: Data to process.
 892     :type table: pandas.Series
 893     :type input_data: InputData
 894     """
 895
 896     logging.info("  Generating the table {0} ...".
 897                  format(table.get("title", "")))
 898
 899     try:
 900         with open(table["input-file"], 'rb') as csv_file:
 901             csv_content = csv.reader(csv_file, delimiter=',', quotechar='"')
 902             csv_lst = [item for item in csv_content]
 903     except KeyError:
 904         logging.warning("The input file is not defined.")
 905         return
 906     except csv.Error as err:
 907         logging.warning("Not possible to process the file '{0}'.\n{1}".
 908                         format(table["input-file"], err))
 909         return
 910
 911     # Table:
 912     dashboard = ET.Element("table", attrib=dict(width="100%", border='0'))
 913
 914     # Table header:
 915     tr = ET.SubElement(dashboard, "tr", attrib=dict(bgcolor="#7eade7"))
 916     for idx, item in enumerate(csv_lst[0]):
 917         alignment = "left" if idx == 0 else "center"
 918         th = ET.SubElement(tr, "th", attrib=dict(align=alignment))
 919         th.text = item
 920
 921     # Rows:
 922     for r_idx, row in enumerate(csv_lst[1:]):
 923         background = "#D4E4F7" if r_idx % 2 else "white"
 924         tr = ET.SubElement(dashboard, "tr", attrib=dict(bgcolor=background))
 925
 926         # Columns:
 927         for c_idx, item in enumerate(row):
 928             alignment = "left" if c_idx == 0 else "center"
 929             td = ET.SubElement(tr, "td", attrib=dict(align=alignment))
 930             # Name:
 931             url = "../trending/"
 932             file_name = ""
 933             anchor = "#"
 934             feature = ""
 935             if c_idx == 0:
 936                 if "memif" in item:
 937                     file_name = "container_memif.html"
 938
 939                 elif "vhost" in item:
 940                     if "l2xcbase" in item or "l2bdbasemaclrn" in item:
 941                         file_name = "vm_vhost_l2.html"
 942                     elif "ip4base" in item:
 943                         file_name = "vm_vhost_ip4.html"
 944
 945                 elif "ipsec" in item:
 946                     file_name = "ipsec.html"
 947
 948                 elif "ethip4lispip" in item or "ethip4vxlan" in item:
 949                     file_name = "ip4_tunnels.html"
 950
 951                 elif "ip4base" in item or "ip4scale" in item:
 952                     file_name = "ip4.html"
 953                     if "iacl" in item or "snat" in item or "cop" in item:
 954                         feature = "-features"
 955
 956                 elif "ip6base" in item or "ip6scale" in item:
 957                     file_name = "ip6.html"
 958
 959                 elif "l2xcbase" in item or "l2xcscale" in item \
 960                         or "l2bdbasemaclrn" in item or "l2bdscale" in item \
 961                         or "l2dbbasemaclrn" in item or "l2dbscale" in item:
 962                     file_name = "l2.html"
 963                     if "iacl" in item:
 964                         feature = "-features"
 965
 966                 if "x520" in item:
 967                     anchor += "x520-"
 968                 elif "x710" in item:
 969                     anchor += "x710-"
 970                 elif "xl710" in item:
 971                     anchor += "xl710-"
 972
 973                 if "64b" in item:
 974                     anchor += "64b-"
 975                 elif "78b" in item:
 976                     anchor += "78b"
 977                 elif "imix" in item:
 978                     anchor += "imix-"
 979                 elif "9000b" in item:
 980                     anchor += "9000b-"
 981                 elif "1518" in item:
 982                     anchor += "1518b-"
 983
 984                 if "1t1c" in item:
 985                     anchor += "1t1c"
 986                 elif "2t2c" in item:
 987                     anchor += "2t2c"
 988                 elif "4t4c" in item:
 989                     anchor += "4t4c"
 990
 991                 url = url + file_name + anchor + feature
 992
 993                 ref = ET.SubElement(td, "a", attrib=dict(href=url))
 994                 ref.text = item
 995
 996             if c_idx == 3:
 997                 if item == "regression":
 998                     td.set("bgcolor", "#eca1a6")
 999                 elif item == "failure":
1000                     td.set("bgcolor", "#d6cbd3")
1001                 elif item == "progression":
1002                     td.set("bgcolor", "#bdcebe")
1003             if c_idx > 0:
1004                 td.text = item
1005
1006     try:
1007         with open(table["output-file"], 'w') as html_file:
1008             logging.info("      Writing file: '{0}'".
1009                          format(table["output-file"]))
1010             html_file.write(".. raw:: html\n\n\t")
1011             html_file.write(ET.tostring(dashboard))
1012             html_file.write("\n\t<p><br><br></p>\n")
1013     except KeyError:
1014         logging.warning("The output file is not defined.")
1015         return