vcl: add DSCP support in VCL

[vpp.git] / src / vnet / interface_output.c
diff --git a/src/vnet/interface_output.c b/src/vnet/interface_output.c

index 7d058c2..5b43f7e 100644 (file)
--- a/src/vnet/interface_output.c
+++ b/src/vnet/interface_output.c
@@ -47,6 +47,9 @@
  #include <vnet/feature/feature.h>
  #include <vnet/classify/pcap_classify.h>
  #include <vnet/interface_output.h>
+#include <vppinfra/vector/mask_compare.h>
+#include <vppinfra/vector/compress.h>
+#include <vppinfra/vector/count_equal.h>
  
  typedef struct
  {
@@ -173,8 +176,7 @@ static_always_inline uword
  vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
                                    vlib_combined_counter_main_t *ccm,
                                    vlib_buffer_t **b, u32 config_index, u8 arc,
-                                  u32 n_left, int do_tx_offloads,
-                                  int arc_or_subif)
+                                  u32 n_left, int processing_level)
  {
    u32 n_bytes = 0;
    u32 n_bytes0, n_bytes1, n_bytes2, n_bytes3;
@@ -190,7 +192,7 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
        vlib_prefetch_buffer_header (b[6], LOAD);
        vlib_prefetch_buffer_header (b[7], LOAD);
  
-      if (do_tx_offloads)
+      if (processing_level >= 1)
         or_flags = b[0]->flags | b[1]->flags | b[2]->flags | b[3]->flags;
  
        /* Be grumpy about zero length buffers for benefit of
@@ -205,7 +207,7 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
        n_bytes += n_bytes2 = vlib_buffer_length_in_chain (vm, b[2]);
        n_bytes += n_bytes3 = vlib_buffer_length_in_chain (vm, b[3]);
  
-      if (arc_or_subif)
+      if (processing_level >= 2)
         {
           u32 tx_swif0, tx_swif1, tx_swif2, tx_swif3;
           tx_swif0 = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
@@ -239,7 +241,7 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
             }
         }
  
-      if (do_tx_offloads && (or_flags & VNET_BUFFER_F_OFFLOAD))
+      if (processing_level >= 1 && (or_flags & VNET_BUFFER_F_OFFLOAD))
         {
           vnet_interface_output_handle_offload (vm, b[0]);
           vnet_interface_output_handle_offload (vm, b[1]);
@@ -259,7 +261,7 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
  
        n_bytes += n_bytes0 = vlib_buffer_length_in_chain (vm, b[0]);
  
-      if (arc_or_subif)
+      if (processing_level >= 2)
         {
           u32 tx_swif0 = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
  
@@ -273,7 +275,7 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
             vlib_increment_combined_counter (ccm, ti, tx_swif0, 1, n_bytes0);
         }
  
-      if (do_tx_offloads)
+      if (processing_level >= 1)
         vnet_interface_output_handle_offload (vm, b[0]);
  
        n_left -= 1;
@@ -283,25 +285,33 @@ vnet_interface_output_node_inline (vlib_main_t *vm, u32 sw_if_index,
    return n_bytes;
  }
  
-static_always_inline void vnet_interface_pcap_tx_trace
-  (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame,
-   int sw_if_index_from_buffer)
+static_always_inline void
+vnet_interface_pcap_tx_trace (vlib_main_t *vm, vlib_node_runtime_t *node,
+                             vlib_frame_t *frame, int in_interface_ouput)
  {
    vnet_main_t *vnm = vnet_get_main ();
    u32 n_left_from, *from;
-  u32 sw_if_index;
+  u32 sw_if_index = ~0, hw_if_index = ~0;
    vnet_pcap_t *pp = &vnm->pcap;
  
    if (PREDICT_TRUE (pp->pcap_tx_enable == 0))
      return;
  
-  if (sw_if_index_from_buffer == 0)
+  if (in_interface_ouput)
+    {
+      /* interface-output is called right before interface-output-template.
+       * We only want to capture packets here if there is a per-interface
+       * filter, in case it matches the sub-interface sw_if_index.
+       * If there is no per-interface filter configured, let the
+       * interface-output-template node deal with it */
+      if (pp->pcap_sw_if_index == 0)
+       return;
+    }
+  else
      {
        vnet_interface_output_runtime_t *rt = (void *) node->runtime_data;
        sw_if_index = rt->sw_if_index;
      }
-  else
-    sw_if_index = ~0;
  
    n_left_from = frame->n_vectors;
    from = vlib_frame_vector_args (frame);
@@ -313,14 +323,91 @@ static_always_inline void vnet_interface_pcap_tx_trace
        from++;
        n_left_from--;
  
-      if (sw_if_index_from_buffer)
-       sw_if_index = vnet_buffer (b0)->sw_if_index[VLIB_TX];
+      if (in_interface_ouput)
+       {
+         const u32 sii = vnet_buffer (b0)->sw_if_index[VLIB_TX];
+         if (PREDICT_FALSE (sii != sw_if_index))
+           {
+             const vnet_hw_interface_t *hi =
+               vnet_get_sup_hw_interface (vnm, sii);
+             hw_if_index = hi->sw_if_index;
+             sw_if_index = sii;
+           }
+         if (hw_if_index == sw_if_index)
+           continue; /* defer to interface-output-template */
+       }
  
        if (vnet_is_packet_pcaped (pp, b0, sw_if_index))
         pcap_add_buffer (&pp->pcap_main, vm, bi0, pp->max_bytes_per_pkt);
      }
  }
  
+static_always_inline void
+store_tx_frame_scalar_data (vnet_hw_if_output_node_runtime_t *r,
+                           vnet_hw_if_tx_frame_t *tf)
+{
+  if (r)
+    clib_memcpy_fast (tf, &r->frame, sizeof (vnet_hw_if_tx_frame_t));
+}
+
+static_always_inline void
+enqueu_to_tx_node (vlib_main_t *vm, vlib_node_runtime_t *node,
+                  vnet_hw_interface_t *hi, u32 *from, u32 n_vectors)
+{
+  u32 next_index = VNET_INTERFACE_OUTPUT_NEXT_TX;
+  vnet_hw_if_output_node_runtime_t *r = 0;
+  u32 n_free, n_copy, *to;
+  vnet_hw_if_tx_frame_t *tf;
+  vlib_frame_t *f;
+
+  ASSERT (n_vectors <= VLIB_FRAME_SIZE);
+
+  if (hi->output_node_thread_runtimes)
+    r = vec_elt_at_index (hi->output_node_thread_runtimes, vm->thread_index);
+
+  f = vlib_get_next_frame_internal (vm, node, next_index, 0);
+  tf = vlib_frame_scalar_args (f);
+
+  if (f->n_vectors > 0 && (r == 0 || tf->queue_id == r->frame.queue_id))
+    {
+      /* append current next frame */
+      n_free = VLIB_FRAME_SIZE - f->n_vectors;
+      n_copy = clib_min (n_vectors, n_free);
+      n_vectors -= n_copy;
+      to = vlib_frame_vector_args (f);
+      to += f->n_vectors;
+    }
+  else
+    {
+      if (f->n_vectors > 0)
+       {
+         /* current frame doesn't fit - grab empty one */
+         f = vlib_get_next_frame_internal (vm, node, next_index, 1);
+         tf = vlib_frame_scalar_args (f);
+       }
+
+      /* empty frame - store scalar data */
+      store_tx_frame_scalar_data (r, tf);
+      to = vlib_frame_vector_args (f);
+      n_free = VLIB_FRAME_SIZE;
+      n_copy = n_vectors;
+      n_vectors = 0;
+    }
+
+  vlib_buffer_copy_indices (to, from, n_copy);
+  vlib_put_next_frame (vm, node, next_index, n_free - n_copy);
+
+  if (n_vectors == 0)
+    return;
+
+  /* we have more indices to store, take empty frame */
+  from += n_copy;
+  f = vlib_get_next_frame_internal (vm, node, next_index, 1);
+  store_tx_frame_scalar_data (r, vlib_frame_scalar_args (f));
+  vlib_buffer_copy_indices (vlib_frame_vector_args (f), from, n_vectors);
+  vlib_put_next_frame (vm, node, next_index, VLIB_FRAME_SIZE - n_vectors);
+}
+
  VLIB_NODE_FN (vnet_interface_output_node)
  (vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
  {
@@ -352,8 +439,7 @@ VLIB_NODE_FN (vnet_interface_output_node)
        /* buffer stride */ 1, n_buffers, VNET_INTERFACE_OUTPUT_NEXT_DROP,
        node->node_index, VNET_INTERFACE_OUTPUT_ERROR_INTERFACE_DELETED);
  
-  vnet_interface_pcap_tx_trace (vm, node, frame,
-                               0 /* sw_if_index_from_buffer */ );
+  vnet_interface_pcap_tx_trace (vm, node, frame, 0 /* in_interface_ouput */);
  
    vlib_get_buffers (vm, from, bufs, n_buffers);
  
@@ -389,24 +475,32 @@ VLIB_NODE_FN (vnet_interface_output_node)
  
    ccm = im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_TX;
  
-  if ((hi->caps & VNET_HW_INTERFACE_CAP_SUPPORTS_TX_CKSUM) == 0)
+  /* if not all three flags IP4_,TCP_,UDP_CKSUM set, do compute them
+   * here before sending to the interface */
+  if ((hi->caps & VNET_HW_INTERFACE_CAP_SUPPORTS_TX_CKSUM) !=
+      VNET_HW_INTERFACE_CAP_SUPPORTS_TX_CKSUM)
      do_tx_offloads = 1;
  
    if (do_tx_offloads == 0 && arc_or_subif == 0)
      n_bytes = vnet_interface_output_node_inline (
-      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 0, 0);
-  else if (do_tx_offloads == 0 && arc_or_subif == 1)
-    n_bytes = vnet_interface_output_node_inline (
-      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 0, 1);
+      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 0);
    else if (do_tx_offloads == 1 && arc_or_subif == 0)
      n_bytes = vnet_interface_output_node_inline (
-      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 1, 0);
+      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 1);
    else
      n_bytes = vnet_interface_output_node_inline (
-      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 1, 1);
+      vm, sw_if_index, ccm, bufs, config_index, arc, n_buffers, 2);
  
-  vlib_buffer_enqueue_to_single_next (vm, node, vlib_frame_vector_args (frame),
-                                     next_index, frame->n_vectors);
+  from = vlib_frame_vector_args (frame);
+  if (PREDICT_TRUE (next_index == VNET_INTERFACE_OUTPUT_NEXT_TX))
+    {
+      enqueu_to_tx_node (vm, node, hi, from, frame->n_vectors);
+    }
+  else
+    {
+      vlib_buffer_enqueue_to_single_next (vm, node, from, next_index,
+                                         frame->n_vectors);
+    }
  
    /* Update main interface stats. */
    vlib_increment_combined_counter (ccm, ti, sw_if_index, n_buffers, n_bytes);
@@ -428,8 +522,7 @@ VLIB_NODE_FN (vnet_per_buffer_interface_output_node) (vlib_main_t * vm,
    u32 n_left_to_next, *from, *to_next;
    u32 n_left_from, next_index;
  
-  vnet_interface_pcap_tx_trace (vm, node, frame,
-                               1 /* sw_if_index_from_buffer */ );
+  vnet_interface_pcap_tx_trace (vm, node, frame, 1 /* in_interface_ouput */);
  
    n_left_from = frame->n_vectors;
  
@@ -993,10 +1086,16 @@ VLIB_NODE_FN (vnet_interface_output_arc_end_node)
  {
    vnet_main_t *vnm = vnet_get_main ();
    vnet_interface_main_t *im = &vnm->interface_main;
+  vnet_hw_if_output_node_runtime_t *r = 0;
+  vnet_hw_interface_t *hi;
+  vnet_hw_if_tx_frame_t *tf;
    vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
-  u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
-  u32 *from, n_left;
-  u16 *lt = im->if_out_arc_end_next_index_by_sw_if_index;
+  u32 sw_if_indices[VLIB_FRAME_SIZE], *sw_if_index = sw_if_indices;
+  u64 used_elts[VLIB_FRAME_SIZE / 64] = {};
+  u64 mask[VLIB_FRAME_SIZE / 64] = {};
+  u32 *tmp, *from, n_left, n_free, n_comp, *to, swif, off;
+  u16 next_index;
+  vlib_frame_t *f;
  
    from = vlib_frame_vector_args (frame);
    n_left = frame->n_vectors;
@@ -1008,25 +1107,113 @@ VLIB_NODE_FN (vnet_interface_output_arc_end_node)
        vlib_prefetch_buffer_header (b[5], LOAD);
        vlib_prefetch_buffer_header (b[6], LOAD);
        vlib_prefetch_buffer_header (b[7], LOAD);
-      next[0] = vec_elt (lt, vnet_buffer (b[0])->sw_if_index[VLIB_TX]);
-      next[1] = vec_elt (lt, vnet_buffer (b[1])->sw_if_index[VLIB_TX]);
-      next[2] = vec_elt (lt, vnet_buffer (b[2])->sw_if_index[VLIB_TX]);
-      next[3] = vec_elt (lt, vnet_buffer (b[3])->sw_if_index[VLIB_TX]);
+      sw_if_index[0] = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
+      sw_if_index[1] = vnet_buffer (b[1])->sw_if_index[VLIB_TX];
+      sw_if_index[2] = vnet_buffer (b[2])->sw_if_index[VLIB_TX];
+      sw_if_index[3] = vnet_buffer (b[3])->sw_if_index[VLIB_TX];
  
        b += 4;
-      next += 4;
+      sw_if_index += 4;
        n_left -= 4;
      }
  
    while (n_left)
      {
-      next[0] = vec_elt (lt, vnet_buffer (b[0])->sw_if_index[VLIB_TX]);
+      sw_if_index[0] = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
        b++;
-      next++;
+      sw_if_index++;
        n_left--;
      }
  
-  vlib_buffer_enqueue_to_next (vm, node, from, nexts, frame->n_vectors);
+  n_left = frame->n_vectors;
+  swif = sw_if_indices[0];
+  off = 0;
+
+  /* a bit ugly but it allows us to reuse stack space for temporary store
+   * which may also improve memory latency */
+  tmp = (u32 *) bufs;
+
+more:
+  next_index = vec_elt (im->if_out_arc_end_next_index_by_sw_if_index, swif);
+  hi = vnet_get_sup_hw_interface (vnm, swif);
+  if (hi->output_node_thread_runtimes)
+    r = vec_elt_at_index (hi->output_node_thread_runtimes, vm->thread_index);
+  f = vlib_get_next_frame_internal (vm, node, next_index, 0);
+  tf = vlib_frame_scalar_args (f);
+
+  if (f->n_vectors > 0 && (r == 0 || r->frame.queue_id == tf->queue_id))
+    {
+      /* append frame */
+      n_free = VLIB_FRAME_SIZE - f->n_vectors;
+      if (n_free >= f->n_vectors)
+       to = (u32 *) vlib_frame_vector_args (f) + f->n_vectors;
+      else
+       to = tmp;
+    }
+  else
+    {
+      if (f->n_vectors > 0)
+       {
+         /* current frame doesn't fit - grab empty one */
+         f = vlib_get_next_frame_internal (vm, node, next_index, 1);
+         tf = vlib_frame_scalar_args (f);
+       }
+
+      /* empty frame - store scalar data */
+      store_tx_frame_scalar_data (r, tf);
+      n_free = VLIB_FRAME_SIZE;
+      to = vlib_frame_vector_args (f);
+    }
+
+  /* compare and compress based on comparison mask */
+  clib_mask_compare_u32 (swif, sw_if_indices, mask, frame->n_vectors);
+  n_comp = clib_compress_u32 (to, from, mask, frame->n_vectors);
+
+  if (tmp != to)
+    {
+      /* indices already written to frame, just close it */
+      vlib_put_next_frame (vm, node, next_index, n_free - n_comp);
+    }
+  else if (n_free >= n_comp)
+    {
+      /* enough space in the existing frame */
+      to = (u32 *) vlib_frame_vector_args (f) + f->n_vectors;
+      vlib_buffer_copy_indices (to, tmp, n_comp);
+      vlib_put_next_frame (vm, node, next_index, n_free - n_comp);
+    }
+  else
+    {
+      /* full frame */
+      to = (u32 *) vlib_frame_vector_args (f) + f->n_vectors;
+      vlib_buffer_copy_indices (to, tmp, n_free);
+      vlib_put_next_frame (vm, node, next_index, 0);
+
+      /* second frame */
+      u32 n_frame2 = n_comp - n_free;
+      f = vlib_get_next_frame_internal (vm, node, next_index, 1);
+      to = vlib_frame_vector_args (f);
+      vlib_buffer_copy_indices (to, tmp + n_free, n_frame2);
+      tf = vlib_frame_scalar_args (f);
+      store_tx_frame_scalar_data (r, tf);
+      vlib_put_next_frame (vm, node, next_index, VLIB_FRAME_SIZE - n_frame2);
+    }
+
+  n_left -= n_comp;
+  if (n_left)
+    {
+      /* store comparison mask so we can find next unused element */
+      for (int i = 0; i < ARRAY_LEN (used_elts); i++)
+       used_elts[i] |= mask[i];
+
+      /* fine first unused sw_if_index by scanning trough used_elts bitmap */
+      while (PREDICT_FALSE (used_elts[off] == ~0))
+       off++;
+
+      swif =
+       sw_if_indices[(off << 6) + count_trailing_zeros (~used_elts[off])];
+      goto more;
+    }
+
    return frame->n_vectors;
  }