[aarch64] Fixes CLI crashes on dpaa2 platform.
[vpp.git] / src / vnet / devices / af_packet / node.c
index 69fc11c..ec7c273 100644 (file)
@@ -1,5 +1,4 @@
-/*
- *------------------------------------------------------------------
+/*------------------------------------------------------------------
  * af_packet.c - linux kernel packet interface
  *
  * Copyright (c) 2016 Cisco and/or its affiliates.
@@ -18,6 +17,7 @@
  */
 
 #include <linux/if_packet.h>
+#include <linux/virtio_net.h>
 
 #include <vlib/vlib.h>
 #include <vlib/unix/unix.h>
@@ -58,7 +58,7 @@ format_af_packet_input_trace (u8 * s, va_list * args)
   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
   af_packet_input_trace_t *t = va_arg (*args, af_packet_input_trace_t *);
-  uword indent = format_get_indent (s);
+  u32 indent = format_get_indent (s);
 
   s = format (s, "af_packet: hw_if_index %d next-index %d",
              t->hw_if_index, t->next_index);
@@ -124,7 +124,7 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
   u32 frame_num = apif->rx_req->tp_frame_nr;
   u8 *block_start = apif->rx_ring + block * block_size;
   uword n_trace = vlib_get_trace_count (vm, node);
-  u32 cpu_index = os_get_cpu_number ();
+  u32 thread_index = vlib_get_thread_index ();
   u32 n_buffer_bytes = vlib_buffer_free_list_buffer_size (vm,
                                                          VLIB_BUFFER_DEFAULT_FREE_LIST_INDEX);
   u32 min_bufs = apif->rx_req->tp_frame_size / n_buffer_bytes;
@@ -132,15 +132,15 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
   if (apif->per_interface_next_index != ~0)
     next_index = apif->per_interface_next_index;
 
-  n_free_bufs = vec_len (apm->rx_buffers[cpu_index]);
+  n_free_bufs = vec_len (apm->rx_buffers[thread_index]);
   if (PREDICT_FALSE (n_free_bufs < VLIB_FRAME_SIZE))
     {
-      vec_validate (apm->rx_buffers[cpu_index],
+      vec_validate (apm->rx_buffers[thread_index],
                    VLIB_FRAME_SIZE + n_free_bufs - 1);
       n_free_bufs +=
-       vlib_buffer_alloc (vm, &apm->rx_buffers[cpu_index][n_free_bufs],
+       vlib_buffer_alloc (vm, &apm->rx_buffers[thread_index][n_free_bufs],
                           VLIB_FRAME_SIZE);
-      _vec_len (apm->rx_buffers[cpu_index]) = n_free_bufs;
+      _vec_len (apm->rx_buffers[thread_index]) = n_free_bufs;
     }
 
   rx_frame = apif->next_rx_frame;
@@ -155,30 +155,101 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
       while ((tph->tp_status & TP_STATUS_USER) && (n_free_bufs > min_bufs) &&
             n_left_to_next)
        {
+
+         struct virtio_net_hdr *vh =
+           (struct virtio_net_hdr *) (((u8 *) tph) + tph->tp_mac -
+                                      sizeof (struct virtio_net_hdr));
          u32 data_len = tph->tp_snaplen;
          u32 offset = 0;
          u32 bi0 = 0, first_bi0 = 0, prev_bi0;
+         u32 vlan_len = 0;
+         ip_csum_t wsum = 0;
+         u16 *wsum_addr = NULL;
+         u32 do_vnet = apm->flags & AF_PACKET_USES_VNET_HEADERS;
+         u32 do_csum = tph->tp_status & TP_STATUS_CSUMNOTREADY;
 
          while (data_len)
            {
              /* grab free buffer */
              u32 last_empty_buffer =
-               vec_len (apm->rx_buffers[cpu_index]) - 1;
+               vec_len (apm->rx_buffers[thread_index]) - 1;
              prev_bi0 = bi0;
-             bi0 = apm->rx_buffers[cpu_index][last_empty_buffer];
+             bi0 = apm->rx_buffers[thread_index][last_empty_buffer];
              b0 = vlib_get_buffer (vm, bi0);
-             _vec_len (apm->rx_buffers[cpu_index]) = last_empty_buffer;
+             _vec_len (apm->rx_buffers[thread_index]) = last_empty_buffer;
              n_free_bufs--;
 
              /* copy data */
              u32 bytes_to_copy =
                data_len > n_buffer_bytes ? n_buffer_bytes : data_len;
+             u32 bytes_copied = 0;
              b0->current_data = 0;
-             clib_memcpy (vlib_buffer_get_current (b0),
-                          (u8 *) tph + tph->tp_mac + offset, bytes_to_copy);
+             /* Kernel removes VLAN headers, so reconstruct VLAN */
+             if (PREDICT_FALSE (tph->tp_status & TP_STATUS_VLAN_VALID))
+               {
+                 if (PREDICT_TRUE (offset == 0))
+                   {
+                     clib_memcpy (vlib_buffer_get_current (b0),
+                                  (u8 *) tph + tph->tp_mac,
+                                  sizeof (ethernet_header_t));
+                     ethernet_header_t *eth = vlib_buffer_get_current (b0);
+                     ethernet_vlan_header_t *vlan =
+                       (ethernet_vlan_header_t *) (eth + 1);
+                     vlan->priority_cfi_and_id =
+                       clib_host_to_net_u16 (tph->tp_vlan_tci);
+                     vlan->type = eth->type;
+                     eth->type = clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
+                     vlan_len = sizeof (ethernet_vlan_header_t);
+                     bytes_copied = sizeof (ethernet_header_t);
+                   }
+               }
+             /* Check if the incoming skb is marked as CSUM_PARTIAL.
+              * If VNET headers are enabled, TP_STATUS_CSUMNOTREADY is
+              * equivalent to the vnet csum flag.
+              */
+             if (PREDICT_TRUE ((do_vnet != 0) && (do_csum != 0)))
+               {
+                 wsum_addr = (u16 *) (((u8 *) vlib_buffer_get_current (b0)) +
+                                      vlan_len + vh->csum_start +
+                                      vh->csum_offset);
+                 if (bytes_copied <= vh->csum_start)
+                   {
+                     clib_memcpy (((u8 *) vlib_buffer_get_current (b0)) +
+                                  bytes_copied + vlan_len,
+                                  (u8 *) tph + tph->tp_mac + offset +
+                                  bytes_copied,
+                                  (vh->csum_start - bytes_copied));
+                     wsum =
+                       ip_csum_and_memcpy (wsum,
+                                           ((u8 *)
+                                            vlib_buffer_get_current (b0)) +
+                                           vh->csum_start + vlan_len,
+                                           (u8 *) tph + tph->tp_mac +
+                                           offset + vh->csum_start,
+                                           (bytes_to_copy - vh->csum_start));
+                   }
+                 else
+                   {
+                     wsum =
+                       ip_csum_and_memcpy (wsum,
+                                           ((u8 *)
+                                            vlib_buffer_get_current (b0)) +
+                                           bytes_copied + vlan_len,
+                                           (u8 *) tph + tph->tp_mac +
+                                           offset + bytes_copied,
+                                           (bytes_to_copy - bytes_copied));
+                   }
+               }
+             else
+               {
+                 clib_memcpy (((u8 *) vlib_buffer_get_current (b0)) +
+                              bytes_copied + vlan_len,
+                              (u8 *) tph + tph->tp_mac + offset +
+                              bytes_copied, (bytes_to_copy - bytes_copied));
+               }
 
              /* fill buffer header */
-             b0->current_length = bytes_to_copy;
+             b0->current_length = bytes_to_copy + vlan_len;
 
              if (offset == 0)
                {
@@ -195,6 +266,10 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
              offset += bytes_to_copy;
              data_len -= bytes_to_copy;
            }
+         if (PREDICT_TRUE ((do_vnet != 0) && (do_csum != 0)))
+           {
+             *wsum_addr = ~ip_csum_fold (wsum);
+           }
          n_rx_packets++;
          n_rx_bytes += tph->tp_snaplen;
          to_next[0] = first_bi0;
@@ -216,8 +291,7 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
            }
 
          /* redirect if feature path enabled */
-         vnet_feature_start_device_input_x1 (apif->sw_if_index, &next0, b0,
-                                             0);
+         vnet_feature_start_device_input_x1 (apif->sw_if_index, &next0, b0);
 
          /* enque and take next packet */
          vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
@@ -237,9 +311,9 @@ af_packet_device_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
   vlib_increment_combined_counter
     (vnet_get_main ()->interface_main.combined_sw_if_counters
      + VNET_INTERFACE_COUNTER_RX,
-     os_get_cpu_number (), apif->hw_if_index, n_rx_packets, n_rx_bytes);
+     vlib_get_thread_index (), apif->hw_if_index, n_rx_packets, n_rx_bytes);
 
-  vnet_device_increment_rx_packets (cpu_index, n_rx_packets);
+  vnet_device_increment_rx_packets (thread_index, n_rx_packets);
   return n_rx_packets;
 }
 
@@ -247,20 +321,18 @@ static uword
 af_packet_input_fn (vlib_main_t * vm, vlib_node_runtime_t * node,
                    vlib_frame_t * frame)
 {
-  int i;
   u32 n_rx_packets = 0;
-  u32 cpu_index = os_get_cpu_number ();
   af_packet_main_t *apm = &af_packet_main;
-  af_packet_if_t *apif;
+  vnet_device_input_runtime_t *rt = (void *) node->runtime_data;
+  vnet_device_and_queue_t *dq;
 
-  for (i = 0; i < vec_len (apm->interfaces); i++)
-    {
-      apif = vec_elt_at_index (apm->interfaces, i);
-      if (apif->is_admin_up &&
-         (i % apm->input_cpu_count) ==
-         (cpu_index - apm->input_cpu_first_index))
-       n_rx_packets += af_packet_device_input_fn (vm, node, frame, apif);
-    }
+  foreach_device_and_queue (dq, rt->devices_and_queues)
+  {
+    af_packet_if_t *apif;
+    apif = vec_elt_at_index (apm->interfaces, dq->dev_instance);
+    if (apif->is_admin_up)
+      n_rx_packets += af_packet_device_input_fn (vm, node, frame, apif);
+  }
 
   return n_rx_packets;
 }
@@ -272,9 +344,6 @@ VLIB_REGISTER_NODE (af_packet_input_node) = {
   .sibling_of = "device-input",
   .format_trace = format_af_packet_input_trace,
   .type = VLIB_NODE_TYPE_INPUT,
-  /**
-   * default state is INTERRUPT mode, switch to POLLING if worker threads are enabled
-   */
   .state = VLIB_NODE_STATE_INTERRUPT,
   .n_errors = AF_PACKET_INPUT_N_ERROR,
   .error_strings = af_packet_input_error_strings,