ipsec: Fix feature ordering
[vpp.git] / src / vnet / ip / ip4_reassembly.c
index f273510..b82bafe 100644 (file)
@@ -132,7 +132,9 @@ typedef struct
   // trace operation counter
   u32 trace_op_counter;
   // next index - used by non-feature node
-  u8 next_index;
+  u32 next_index;
+  // error next index - used by custom apps (~0 if not used)
+  u32 error_next_index;
   // minimum fragment length for this reassembly - used to estimate MTU
   u16 min_fragment_length;
   // number of fragments in this reassembly
@@ -292,12 +294,6 @@ ip4_reass_add_trace (vlib_main_t * vm, vlib_node_runtime_t * node,
 {
   vlib_buffer_t *b = vlib_get_buffer (vm, bi);
   vnet_buffer_opaque_t *vnb = vnet_buffer (b);
-  if (pool_is_free_index (vm->trace_main.trace_buffer_pool, b->trace_index))
-    {
-      // this buffer's trace is gone
-      b->flags &= ~VLIB_BUFFER_IS_TRACED;
-      return;
-    }
   ip4_reass_trace_t *t = vlib_add_trace (vm, node, b, sizeof (t[0]));
   t->reass_id = reass->id;
   t->action = action;
@@ -332,8 +328,8 @@ ip4_reass_free (ip4_reass_main_t * rm, ip4_reass_per_thread_t * rt,
 }
 
 always_inline void
-ip4_reass_on_timeout (vlib_main_t * vm, ip4_reass_main_t * rm,
-                     ip4_reass_t * reass)
+ip4_reass_drop_all (vlib_main_t * vm, vlib_node_runtime_t * node,
+                   ip4_reass_main_t * rm, ip4_reass_t * reass)
 {
   u32 range_bi = reass->first_bi;
   vlib_buffer_t *range_b;
@@ -360,14 +356,45 @@ ip4_reass_on_timeout (vlib_main_t * vm, ip4_reass_main_t * rm,
        }
       range_bi = range_vnb->ip.reass.next_range_bi;
     }
-  vlib_buffer_free (vm, to_free, vec_len (to_free));
-  vec_free (to_free);
+  /* hand buffers to error_next_index if a custom app set one, else free */
+  if (~0 != reass->error_next_index)
+    {
+      u32 n_left_to_next, *to_next;
+      u32 next_index = reass->error_next_index;
+      u32 bi = ~0;
+
+      while (vec_len (to_free) > 0)
+       {
+         vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
+
+         while (vec_len (to_free) > 0 && n_left_to_next > 0)
+           {
+             bi = vec_pop (to_free);
+
+             if (~0 != bi)
+               {
+                 to_next[0] = bi;
+                 to_next += 1;
+                 n_left_to_next -= 1;
+                 vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
+                                                  to_next, n_left_to_next,
+                                                  bi, next_index);
+               }
+           }
+         vlib_put_next_frame (vm, node, next_index, n_left_to_next);
+       }
+    }
+  else
+    {
+      vlib_buffer_free (vm, to_free, vec_len (to_free));
+    }
+  vec_free (to_free);   /* the index vector itself must still be released */
 }
 
 static ip4_reass_t *
-ip4_reass_find_or_create (vlib_main_t * vm, ip4_reass_main_t * rm,
-                         ip4_reass_per_thread_t * rt, ip4_reass_kv_t * kv,
-                         u8 * do_handoff)
+ip4_reass_find_or_create (vlib_main_t * vm, vlib_node_runtime_t * node,
+                         ip4_reass_main_t * rm, ip4_reass_per_thread_t * rt,
+                         ip4_reass_kv_t * kv, u8 * do_handoff)
 {
   ip4_reass_t *reass = NULL;
   f64 now = vlib_time_now (rm->vlib_main);
@@ -384,7 +411,7 @@ ip4_reass_find_or_create (vlib_main_t * vm, ip4_reass_main_t * rm,
 
       if (now > reass->last_heard + rm->timeout)
        {
-         ip4_reass_on_timeout (vm, rm, reass);
+         ip4_reass_drop_all (vm, node, rm, reass);
          ip4_reass_free (rm, rt, reass);
          reass = NULL;
        }
@@ -410,6 +437,8 @@ ip4_reass_find_or_create (vlib_main_t * vm, ip4_reass_main_t * rm,
       reass->first_bi = ~0;
       reass->last_packet_octet = ~0;
       reass->data_len = 0;
+      reass->next_index = ~0;
+      reass->error_next_index = ~0;
       ++rt->reass_n;
     }
 
@@ -432,7 +461,7 @@ always_inline ip4_reass_rc_t
 ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
                    ip4_reass_main_t * rm, ip4_reass_per_thread_t * rt,
                    ip4_reass_t * reass, u32 * bi0, u32 * next0, u32 * error0,
-                   bool is_feature)
+                   bool is_custom_app)
 {
   vlib_buffer_t *first_b = vlib_get_buffer (vm, reass->first_bi);
   vlib_buffer_t *last_b = NULL;
@@ -489,6 +518,7 @@ ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
                    }
                  tmp->flags &= ~VLIB_BUFFER_NEXT_PRESENT;
                  tmp_bi = tmp->next_buffer;
+                 tmp->next_buffer = 0;
                  tmp = vlib_get_buffer (vm, tmp_bi);
                  vlib_buffer_free_one (vm, to_be_freed_bi);
                  continue;
@@ -540,12 +570,15 @@ ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
                }
              if (tmp->flags & VLIB_BUFFER_NEXT_PRESENT)
                {
+                 tmp->flags &= ~VLIB_BUFFER_NEXT_PRESENT;
                  tmp_bi = tmp->next_buffer;
-                 tmp = vlib_get_buffer (vm, tmp->next_buffer);
+                 tmp->next_buffer = 0;
+                 tmp = vlib_get_buffer (vm, tmp_bi);
                  vlib_buffer_free_one (vm, to_be_freed_bi);
                }
              else
                {
+                 tmp->next_buffer = 0;
                  vlib_buffer_free_one (vm, to_be_freed_bi);
                  break;
                }
@@ -562,6 +595,7 @@ ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
       return IP4_REASS_RC_INTERNAL_ERROR;
     }
   last_b->flags &= ~VLIB_BUFFER_NEXT_PRESENT;
+
   if (total_length < first_b->current_length)
     {
       return IP4_REASS_RC_INTERNAL_ERROR;
@@ -577,7 +611,8 @@ ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
     {
       return IP4_REASS_RC_NO_BUF;
     }
-
+  // reset to reconstruct the mbuf linking
+  first_b->flags &= ~VLIB_BUFFER_EXT_HDR_VALID;
   if (PREDICT_FALSE (first_b->flags & VLIB_BUFFER_IS_TRACED))
     {
       ip4_reass_add_trace (vm, node, rm, reass, reass->first_bi, FINALIZE, 0);
@@ -609,7 +644,7 @@ ip4_reass_finalize (vlib_main_t * vm, vlib_node_runtime_t * node,
 #endif
     }
   *bi0 = reass->first_bi;
-  if (is_feature)
+  if (!is_custom_app)
     {
       *next0 = IP4_REASSEMBLY_NEXT_INPUT;
     }
@@ -700,11 +735,13 @@ ip4_reass_remove_range_from_chain (vlib_main_t * vm,
        {
          discard_b->flags &= ~VLIB_BUFFER_NEXT_PRESENT;
          discard_bi = discard_b->next_buffer;
+         discard_b->next_buffer = 0;
          discard_b = vlib_get_buffer (vm, discard_bi);
          vlib_buffer_free_one (vm, to_be_freed_bi);
        }
       else
        {
+         discard_b->next_buffer = 0;
          vlib_buffer_free_one (vm, to_be_freed_bi);
          break;
        }
@@ -716,14 +753,19 @@ always_inline ip4_reass_rc_t
 ip4_reass_update (vlib_main_t * vm, vlib_node_runtime_t * node,
                  ip4_reass_main_t * rm, ip4_reass_per_thread_t * rt,
                  ip4_reass_t * reass, u32 * bi0, u32 * next0, u32 * error0,
-                 bool is_feature)
+                 bool is_custom_app)
 {
   ip4_reass_rc_t rc = IP4_REASS_RC_OK;
   int consumed = 0;
   vlib_buffer_t *fb = vlib_get_buffer (vm, *bi0);
   ip4_header_t *fip = vlib_buffer_get_current (fb);
   vnet_buffer_opaque_t *fvnb = vnet_buffer (fb);
-  reass->next_index = fvnb->ip.reass.next_index;       // store next_index before it's overwritten
+  if (is_custom_app)
+    {
+      // store (error_)next_index before it's overwritten
+      reass->next_index = fvnb->ip.reass.next_index;
+      reass->error_next_index = fvnb->ip.reass.error_next_index;
+    }
   const u32 fragment_first = ip4_get_fragment_offset_bytes (fip);
   const u32 fragment_length =
     clib_net_to_host_u16 (fip->length) - ip4_header_bytes (fip);
@@ -926,7 +968,7 @@ ip4_reass_update (vlib_main_t * vm, vlib_node_runtime_t * node,
       reass->data_len == reass->last_packet_octet + 1)
     {
       return ip4_reass_finalize (vm, node, rm, rt, reass, bi0, next0, error0,
-                                is_feature);
+                                is_custom_app);
     }
   else
     {
@@ -948,9 +990,9 @@ ip4_reass_update (vlib_main_t * vm, vlib_node_runtime_t * node,
 }
 
 always_inline uword
-ip4_reassembly_inline (vlib_main_t * vm,
-                      vlib_node_runtime_t * node,
-                      vlib_frame_t * frame, bool is_feature)
+ip4_reassembly_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
+                      vlib_frame_t * frame, bool is_feature,
+                      bool is_custom_app)
 {
   u32 *from = vlib_frame_vector_args (frame);
   u32 n_left_from, n_left_to_next, *to_next, next_index;
@@ -978,7 +1020,7 @@ ip4_reassembly_inline (vlib_main_t * vm,
          if (!ip4_get_fragment_more (ip0) && !ip4_get_fragment_offset (ip0))
            {
              // this is a whole packet - no fragmentation
-             if (is_feature)
+             if (!is_custom_app)
                {
                  next0 = IP4_REASSEMBLY_NEXT_INPUT;
                }
@@ -1012,7 +1054,8 @@ ip4_reassembly_inline (vlib_main_t * vm,
                    (u64) ip0->fragment_id << 32 | (u64) ip0->protocol << 48;
 
                  ip4_reass_t *reass =
-                   ip4_reass_find_or_create (vm, rm, rt, &kv, &do_handoff);
+                   ip4_reass_find_or_create (vm, node, rm, rt, &kv,
+                                             &do_handoff);
 
                  if (PREDICT_FALSE (do_handoff))
                    {
@@ -1029,7 +1072,7 @@ ip4_reassembly_inline (vlib_main_t * vm,
                    {
                      switch (ip4_reass_update
                              (vm, node, rm, rt, reass, &bi0, &next0,
-                              &error0, is_feature))
+                              &error0, is_custom_app))
                        {
                        case IP4_REASS_RC_OK:
                          /* nothing to do here */
@@ -1038,7 +1081,7 @@ ip4_reassembly_inline (vlib_main_t * vm,
                          vlib_node_increment_counter (vm, node->node_index,
                                                       IP4_ERROR_REASS_FRAGMENT_CHAIN_TOO_LONG,
                                                       1);
-                         ip4_reass_on_timeout (vm, rm, reass);
+                         ip4_reass_drop_all (vm, node, rm, reass);
                          ip4_reass_free (rm, rt, reass);
                          goto next_packet;
                          break;
@@ -1046,15 +1089,16 @@ ip4_reassembly_inline (vlib_main_t * vm,
                          vlib_node_increment_counter (vm, node->node_index,
                                                       IP4_ERROR_REASS_NO_BUF,
                                                       1);
-                         ip4_reass_on_timeout (vm, rm, reass);
+                         ip4_reass_drop_all (vm, node, rm, reass);
                          ip4_reass_free (rm, rt, reass);
                          goto next_packet;
                          break;
                        case IP4_REASS_RC_INTERNAL_ERROR:
+                         /* drop everything and start with a clean slate */
                          vlib_node_increment_counter (vm, node->node_index,
                                                       IP4_ERROR_REASS_INTERNAL_ERROR,
                                                       1);
-                         ip4_reass_on_timeout (vm, rm, reass);
+                         ip4_reass_drop_all (vm, node, rm, reass);
                          ip4_reass_free (rm, rt, reass);
                          goto next_packet;
                          break;
@@ -1107,7 +1151,8 @@ static char *ip4_reassembly_error_strings[] = {
 VLIB_NODE_FN (ip4_reass_node) (vlib_main_t * vm, vlib_node_runtime_t * node,
                               vlib_frame_t * frame)
 {
-  return ip4_reassembly_inline (vm, node, frame, false /* is_feature */ );
+  return ip4_reassembly_inline (vm, node, frame, false /* is_feature */ ,
+                               false /* is_custom_app */ );
 }
 
 /* *INDENT-OFF* */
@@ -1132,7 +1177,8 @@ VLIB_NODE_FN (ip4_reass_node_feature) (vlib_main_t * vm,
                                       vlib_node_runtime_t * node,
                                       vlib_frame_t * frame)
 {
-  return ip4_reassembly_inline (vm, node, frame, true /* is_feature */ );
+  return ip4_reassembly_inline (vm, node, frame, true /* is_feature */ ,
+                               false /* is_custom_app */ );
 }
 
 /* *INDENT-OFF* */
@@ -1156,7 +1202,8 @@ VLIB_REGISTER_NODE (ip4_reass_node_feature) = {
 VNET_FEATURE_INIT (ip4_reassembly_feature, static) = {
     .arc_name = "ip4-unicast",
     .node_name = "ip4-reassembly-feature",
-    .runs_before = VNET_FEATURES ("ip4-lookup"),
+    .runs_before = VNET_FEATURES ("ip4-lookup",
+                                  "ipsec4-input-feature"),
     .runs_after = 0,
 };
 /* *INDENT-ON* */
@@ -1245,6 +1292,7 @@ ip4_reass_set (u32 timeout_ms, u32 max_reassemblies,
          clib_bihash_free_16_8 (&ip4_reass_main.hash);
          clib_memcpy_fast (&ip4_reass_main.hash, &new_hash,
                            sizeof (ip4_reass_main.hash));
+         clib_bihash_copied (&ip4_reass_main.hash, &new_hash);
        }
     }
   return 0;
@@ -1361,7 +1409,7 @@ ip4_reass_walk_expired (vlib_main_t * vm,
           vec_foreach (i, pool_indexes_to_free)
           {
             ip4_reass_t *reass = pool_elt_at_index (rt->pool, i[0]);
-            ip4_reass_on_timeout (vm, rm, reass);
+            ip4_reass_drop_all (vm, node, rm, reass);
             ip4_reass_free (rm, rt, reass);
           }
           /* *INDENT-ON* */