fixed performance issue (moved STRECH case to low priority cases)
author: imarom <[email protected]>
Wed, 26 Oct 2016 13:00:50 +0000 (15:00 +0200)
committer: imarom <[email protected]>
Wed, 26 Oct 2016 13:22:47 +0000 (15:22 +0200)
Signed-off-by: imarom <[email protected]>
linux_dpdk/d [changed mode: 0644->0755]
scripts/automation/regression/setups/trex09/benchmark.yaml
scripts/automation/regression/stateless_tests/stl_performance_test.py
src/bp_sim.cpp
src/bp_sim.h

old mode 100644 (file)
new mode 100755 (executable)
index ed51a46..f157d8f 100644 (file)
@@ -209,24 +209,24 @@ test_performance_syn_attack_single_cpu:
 
 test_performance_vm_multi_cpus:
     cfg:
-        core_count             : 3
+        core_count             : 2
         mult                   : "90%"
         mpps_per_core_golden   :
-                                  min: 15.9
-                                  max: 16.5
+                                  min: 15.7
+                                  max: 16.3
 
 
 test_performance_vm_multi_cpus_cached:
     cfg:
-        core_count             : 3
+        core_count             : 2
         mult                   : "90%"
         mpps_per_core_golden   :
-                                  min: 29.6
-                                  max: 30.5
+                                  min: 28.8
+                                  max: 29.5
 
 test_performance_syn_attack_multi_cpus:
     cfg:
-        core_count             : 3
+        core_count             : 2
         mult                   : "90%"
         mpps_per_core_golden   :
                                   min: 13.0
index a77c5c2..27c61cc 100644 (file)
@@ -180,7 +180,7 @@ class STLPerformance_Test(CStlGeneral_Test):
         setup_cfg = self.get_benchmark_param('cfg')
         scenario_cfg = {}
 
-        scenario_cfg['name']        = "VM - 64 bytes, two CPUs"
+        scenario_cfg['name']        = "VM - 64 bytes, multi CPUs"
         scenario_cfg['streams']     = self.build_perf_profile_vm(64)
 
         scenario_cfg['core_count']           = setup_cfg['core_count']
@@ -191,12 +191,12 @@ class STLPerformance_Test(CStlGeneral_Test):
 
 
 
-    # two CPUs, VM, cached, 64 bytes
+    # multi CPUs, VM, cached, 64 bytes
     def test_performance_vm_multi_cpus_cached (self):
         setup_cfg = self.get_benchmark_param('cfg')
         scenario_cfg = {}
 
-        scenario_cfg['name']        = "VM - 64 bytes, single CPU, cache size 1024"
+        scenario_cfg['name']        = "VM - 64 bytes, multi CPU, cache size 1024"
         scenario_cfg['streams']     = self.build_perf_profile_vm(64, cache_size = 1024)
 
 
@@ -207,12 +207,12 @@ class STLPerformance_Test(CStlGeneral_Test):
         self.execute_single_scenario(scenario_cfg)
 
 
-    # two CPUs, syn attack, 64 bytes
+    # multi CPUs, syn attack, 64 bytes
     def test_performance_syn_attack_multi_cpus (self):
         setup_cfg = self.get_benchmark_param('cfg')
         scenario_cfg = {}
 
-        scenario_cfg['name']        = "syn attack - 64 bytes, two CPUs"
+        scenario_cfg['name']        = "syn attack - 64 bytes, multi CPUs"
         scenario_cfg['streams']     = self.build_perf_profile_syn_attack(64)
 
         scenario_cfg['core_count']           = setup_cfg['core_count']
@@ -254,6 +254,10 @@ class STLPerformance_Test(CStlGeneral_Test):
         self.c.add_streams(ports = [0], streams = scenario_cfg['streams'])
 
         # use one core
+        cores_per_port = self.c.system_info.get('dp_core_count_per_port', 0)
+        if cores_per_port < scenario_cfg['core_count']:
+            assert 0, "test configuration requires {0} cores but only {1} per port are available".format(scenario_cfg['core_count'], cores_per_port)
+
         core_mask = (2 ** scenario_cfg['core_count']) - 1
         self.c.start(ports = [0], mult = scenario_cfg['mult'], core_mask = [core_mask])
 
index c4cb092..db273b1 100755 (executable)
@@ -3787,22 +3787,6 @@ inline int CNodeGenerator::flush_file_realtime(dsec_t max_time,
             }
             break;
 
-         /* a case called when a time strech happens */
-         case scSTRECH:
-             {
-                 dsec_t dt = cur_time - n_time;
-                 handle_time_strech(cur_time, dt, offset, thread);
-
-                 /* re-read the top of the queue - it might have changed with messaging */
-                 node = m_p_queue.top();
-                 n_time = node->m_time + offset;
-
-                 /* go back to INIT */
-                 state = scINIT;
-
-             }
-             break;
-
          case scWORK:
             {
                 int node_count = 0;
@@ -3831,14 +3815,42 @@ inline int CNodeGenerator::flush_file_realtime(dsec_t max_time,
                 do_sleep(cur_time,thread,n_time); // estimate  loop
                 state=scWORK;
                 break;
+
+
          default:
-             assert(0);
+             handle_slow_operations(state, node, cur_time, n_time, offset, thread);
+             break;
         } /* switch */
+
     }/* while*/
 
     return (teardown(thread,always,old_offset,offset));
 }
 
+
+FORCE_NO_INLINE void CNodeGenerator::handle_slow_operations(sch_state_t &state,
+                                                            CGenNode * &node,
+                                                            dsec_t &cur_time,
+                                                            dsec_t &n_time,
+                                                            dsec_t &offset,
+                                                            CFlowGenListPerThread *thread) {
+    switch (state) {
+    case scSTRECH:
+        {
+            handle_time_strech(node, cur_time, n_time, offset, thread);
+
+            /* go back to work */
+            state = scWORK;
+
+        }
+        break;
+
+    default:
+        assert(0);
+    }
+
+}
+
 /**
  * when time is streched - the flow_sync node 
  * might be postpond too much 
@@ -3849,18 +3861,26 @@ inline int CNodeGenerator::flush_file_realtime(dsec_t max_time,
  * @author imarom (7/31/2016)
  * 
  */
-FORCE_NO_INLINE void CNodeGenerator::handle_time_strech(dsec_t cur_time,
-                                                        dsec_t dt,
-                                                        dsec_t &offset,
-                                                        CFlowGenListPerThread *thread) {
+void CNodeGenerator::handle_time_strech(CGenNode * &node,
+                                        dsec_t &cur_time,
+                                        dsec_t &n_time,
+                                        dsec_t &offset,
+                                        CFlowGenListPerThread *thread) {
+
+
+    /* fix the time offset */
+    dsec_t dt = cur_time - n_time;
+    offset += dt;
 
     /* check if flow sync message was delayed too much */
     if ( (cur_time - m_last_sync_time_sec) > SYNC_TIME_OUT ) {
         handle_maintenance(thread);
+
+        /* re-read the top of the queue - it might have changed with messaging */
+        node = m_p_queue.top();
+        n_time = node->m_time + offset;
     }
 
-    /* fix the time offset */
-    offset += dt;
 }
 
 int CNodeGenerator::flush_file_sim(dsec_t max_time,
index 0af27b9..f7a1e73 100755 (executable)
@@ -2142,7 +2142,19 @@ private:
                             CFlowGenListPerThread * thread,
                             double &old_offset);
 
-        FORCE_NO_INLINE void handle_time_strech(dsec_t cur_time, dsec_t dt, dsec_t &offset,  CFlowGenListPerThread * thread);
+        FORCE_NO_INLINE void handle_slow_operations(sch_state_t &state,
+                                                    CGenNode * &node,
+                                                    dsec_t &cur_time,
+                                                    dsec_t &n_time,
+                                                    dsec_t &offset,
+                                                    CFlowGenListPerThread *thread);
+
+        void handle_time_strech(CGenNode * &node,
+                                dsec_t &cur_time,
+                                dsec_t &n_time,
+                                dsec_t &offset,
+                                CFlowGenListPerThread *thread);
+
 
 private:        
     void handle_command(CGenNode *node, CFlowGenListPerThread *thread, bool &exit_scheduler);