Remove C11 memcpy checks from perf-critical code
[vpp.git] / src / vnet / devices / netmap / node.c
index 68ea783..dde706f 100644 (file)
@@ -57,7 +57,7 @@ format_netmap_input_trace (u8 * s, va_list * args)
   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
   netmap_input_trace_t *t = va_arg (*args, netmap_input_trace_t *);
-  uword indent = format_get_indent (s);
+  u32 indent = format_get_indent (s);
 
   s = format (s, "netmap: hw_if_index %d next-index %d",
              t->hw_if_index, t->next_index);
@@ -98,22 +98,22 @@ netmap_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
   u32 n_free_bufs;
   struct netmap_ring *ring;
   int cur_ring;
-  u32 cpu_index = os_get_cpu_number ();
+  u32 thread_index = vm->thread_index;
   u32 n_buffer_bytes = vlib_buffer_free_list_buffer_size (vm,
                                                          VLIB_BUFFER_DEFAULT_FREE_LIST_INDEX);
 
   if (nif->per_interface_next_index != ~0)
     next_index = nif->per_interface_next_index;
 
-  n_free_bufs = vec_len (nm->rx_buffers[cpu_index]);
+  n_free_bufs = vec_len (nm->rx_buffers[thread_index]);
   if (PREDICT_FALSE (n_free_bufs < VLIB_FRAME_SIZE))
     {
-      vec_validate (nm->rx_buffers[cpu_index],
+      vec_validate (nm->rx_buffers[thread_index],
                    VLIB_FRAME_SIZE + n_free_bufs - 1);
       n_free_bufs +=
-       vlib_buffer_alloc (vm, &nm->rx_buffers[cpu_index][n_free_bufs],
+       vlib_buffer_alloc (vm, &nm->rx_buffers[thread_index][n_free_bufs],
                           VLIB_FRAME_SIZE);
-      _vec_len (nm->rx_buffers[cpu_index]) = n_free_bufs;
+      _vec_len (nm->rx_buffers[thread_index]) = n_free_bufs;
     }
 
   cur_ring = nif->first_rx_ring;
@@ -163,21 +163,20 @@ netmap_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
                  vlib_buffer_t *b0;
                  /* grab free buffer */
                  u32 last_empty_buffer =
-                   vec_len (nm->rx_buffers[cpu_index]) - 1;
+                   vec_len (nm->rx_buffers[thread_index]) - 1;
                  prev_bi0 = bi0;
-                 bi0 = nm->rx_buffers[cpu_index][last_empty_buffer];
+                 bi0 = nm->rx_buffers[thread_index][last_empty_buffer];
                  b0 = vlib_get_buffer (vm, bi0);
-                 _vec_len (nm->rx_buffers[cpu_index]) = last_empty_buffer;
+                 _vec_len (nm->rx_buffers[thread_index]) = last_empty_buffer;
                  n_free_bufs--;
 
                  /* copy data */
                  u32 bytes_to_copy =
                    data_len > n_buffer_bytes ? n_buffer_bytes : data_len;
                  b0->current_data = 0;
-                 clib_memcpy (vlib_buffer_get_current (b0),
-                              (u8 *) NETMAP_BUF (ring,
-                                                 slot->buf_idx) + offset,
-                              bytes_to_copy);
+                 clib_memcpy_fast (vlib_buffer_get_current (b0),
+                                   (u8 *) NETMAP_BUF (ring, slot->buf_idx) +
+                                   offset, bytes_to_copy);
 
                  /* fill buffer header */
                  b0->current_length = bytes_to_copy;
@@ -247,9 +246,9 @@ netmap_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
   vlib_increment_combined_counter
     (vnet_get_main ()->interface_main.combined_sw_if_counters
      + VNET_INTERFACE_COUNTER_RX,
-     os_get_cpu_number (), nif->hw_if_index, n_rx_packets, n_rx_bytes);
+     vlib_get_thread_index (), nif->hw_if_index, n_rx_packets, n_rx_bytes);
 
-  vnet_device_increment_rx_packets (cpu_index, n_rx_packets);
+  vnet_device_increment_rx_packets (thread_index, n_rx_packets);
 
   return n_rx_packets;
 }
@@ -260,7 +259,7 @@ netmap_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
 {
   int i;
   u32 n_rx_packets = 0;
-  u32 cpu_index = os_get_cpu_number ();
+  u32 thread_index = vm->thread_index;
   netmap_main_t *nm = &netmap_main;
   netmap_if_t *nmi;
 
@@ -269,7 +268,7 @@ netmap_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
       nmi = vec_elt_at_index (nm->interfaces, i);
       if (nmi->is_admin_up &&
          (i % nm->input_cpu_count) ==
-         (cpu_index - nm->input_cpu_first_index))
+         (thread_index - nm->input_cpu_first_index))
        n_rx_packets += netmap_device_input_fn (vm, node, frame, nmi);
     }