Convert GRE nodes to new buffer APIs and multiarch
[vpp.git] / src / vnet / gre / node.c
index 7223b01..ff74d1b 100644 (file)
@@ -43,9 +43,11 @@ typedef struct
   u32 length;
   ip46_address_t src;
   ip46_address_t dst;
-  u8 is_ipv6;
 } gre_rx_trace_t;
 
+extern u8 *format_gre_rx_trace (u8 * s, va_list * args);
+
+#ifndef CLIB_MARCH_VARIANT
 u8 *
 format_gre_rx_trace (u8 * s, va_list * args)
 {
@@ -59,6 +61,7 @@ format_gre_rx_trace (u8 * s, va_list * args)
              format_ip46_address, &t->dst, IP46_TYPE_ANY);
   return s;
 }
+#endif /* CLIB_MARCH_VARIANT */
 
 typedef struct
 {
@@ -67,500 +70,375 @@ typedef struct
   u16 *next_by_protocol;
 } gre_input_runtime_t;
 
+always_inline void
+gre_trace (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_buffer_t * b,
+          u32 tun_sw_if_index, const ip6_header_t * ip6,
+          const ip4_header_t * ip4, int is_ipv6)
+{
+  gre_rx_trace_t *tr = vlib_add_trace (vm, node,
+                                      b, sizeof (*tr));
+  tr->tunnel_id = tun_sw_if_index;
+  if (is_ipv6)
+    {
+      tr->length = ip6->payload_length;
+      tr->src.ip6.as_u64[0] = ip6->src_address.as_u64[0];
+      tr->src.ip6.as_u64[1] = ip6->src_address.as_u64[1];
+      tr->dst.ip6.as_u64[0] = ip6->dst_address.as_u64[0];
+      tr->dst.ip6.as_u64[1] = ip6->dst_address.as_u64[1];
+    }
+  else
+    {
+      tr->length = ip4->length;
+      tr->src.as_u64[0] = tr->src.as_u64[1] = 0;
+      tr->dst.as_u64[0] = tr->dst.as_u64[1] = 0;
+      tr->src.ip4.as_u32 = ip4->src_address.as_u32;
+      tr->dst.ip4.as_u32 = ip4->dst_address.as_u32;
+    }
+}
+
+always_inline void
+gre_tunnel_get (const gre_main_t * gm, vlib_node_runtime_t * node,
+               vlib_buffer_t * b, u16 * next, const gre_tunnel_key_t * key,
+               gre_tunnel_key_t * cached_key, u32 * tun_sw_if_index,
+               u32 * cached_tun_sw_if_index, int is_ipv6)
+{
+  const uword *p;
+  p = is_ipv6 ? hash_get_mem (gm->tunnel_by_key6, &key->gtk_v6)
+    : hash_get_mem (gm->tunnel_by_key4, &key->gtk_v4);
+  if (PREDICT_FALSE (!p))
+    {
+      *next = GRE_INPUT_NEXT_DROP;
+      b->error = node->errors[GRE_ERROR_NO_SUCH_TUNNEL];
+      *tun_sw_if_index = ~0;
+    }
+  else
+    {
+      const gre_tunnel_t *tun;
+      tun = pool_elt_at_index (gm->tunnels, *p);
+      *cached_tun_sw_if_index = *tun_sw_if_index = tun->sw_if_index;
+      if (is_ipv6)
+       cached_key->gtk_v6 = key->gtk_v6;
+      else
+       cached_key->gtk_v4 = key->gtk_v4;
+    }
+}
+
 always_inline uword
 gre_input (vlib_main_t * vm,
-          vlib_node_runtime_t * node, vlib_frame_t * from_frame, u8 is_ipv6)
+          vlib_node_runtime_t * node, vlib_frame_t * frame,
+          const int is_ipv6)
 {
   gre_main_t *gm = &gre_main;
-  __attribute__ ((unused)) u32 n_left_from, next_index, *from, *to_next;
-  gre_tunnel_key_t cached_tunnel_key;
+  u32 *from, n_left_from;
+  vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
+  u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
+  u16 cached_protocol = ~0;
+  u32 cached_next_index = SPARSE_VEC_INVALID_INDEX;
+  u32 cached_tun_sw_if_index = ~0;
+  gre_tunnel_key_t cached_key;
+
+  from = vlib_frame_vector_args (frame);
+  n_left_from = frame->n_vectors;
+  vlib_get_buffers (vm, from, bufs, n_left_from);
+
+  if (is_ipv6)
+    clib_memset (&cached_key.gtk_v6, 0xff, sizeof (cached_key.gtk_v6));
+  else
+    clib_memset (&cached_key.gtk_v4, 0xff, sizeof (cached_key.gtk_v4));
 
-  u32 cached_tunnel_sw_if_index = ~0, tunnel_sw_if_index = ~0;
+  while (n_left_from >= 2)
+    {
+      const ip6_header_t *ip6[2];
+      const ip4_header_t *ip4[2];
+      const gre_header_t *gre[2];
+      u32 nidx[2];
+      next_info_t ni[2];
+      u8 type[2];
+      u16 version[2];
+      u32 len[2];
+      gre_tunnel_key_t key[2];
+      u8 matched[2];
+      u32 tun_sw_if_index[2];
+
+      if (PREDICT_TRUE (n_left_from >= 6))
+       {
+         vlib_prefetch_buffer_data (b[2], LOAD);
+         vlib_prefetch_buffer_data (b[3], LOAD);
+         vlib_prefetch_buffer_header (b[4], STORE);
+         vlib_prefetch_buffer_header (b[5], STORE);
+       }
 
-  u32 thread_index = vlib_get_thread_index ();
-  u32 len;
-  vnet_interface_main_t *im = &gm->vnet_main->interface_main;
+      if (is_ipv6)
+       {
+         /* ip6_local hands us the ip header, not the gre header */
+         ip6[0] = vlib_buffer_get_current (b[0]);
+         ip6[1] = vlib_buffer_get_current (b[1]);
+         gre[0] = (void *) (ip6[0] + 1);
+         gre[1] = (void *) (ip6[1] + 1);
+         vlib_buffer_advance (b[0], sizeof (*ip6[0]) + sizeof (*gre[0]));
+         vlib_buffer_advance (b[1], sizeof (*ip6[0]) + sizeof (*gre[0]));
+       }
+      else
+       {
+         /* ip4_local hands us the ip header, not the gre header */
+         ip4[0] = vlib_buffer_get_current (b[0]);
+         ip4[1] = vlib_buffer_get_current (b[1]);
+         gre[0] = (void *) (ip4[0] + 1);
+         gre[1] = (void *) (ip4[1] + 1);
+         vlib_buffer_advance (b[0], sizeof (*ip4[0]) + sizeof (*gre[0]));
+         vlib_buffer_advance (b[1], sizeof (*ip4[0]) + sizeof (*gre[0]));
+       }
 
-  if (!is_ipv6)
-    memset (&cached_tunnel_key.gtk_v4, 0xff,
-           sizeof (cached_tunnel_key.gtk_v4));
-  else
-    memset (&cached_tunnel_key.gtk_v6, 0xff,
-           sizeof (cached_tunnel_key.gtk_v6));
+      if (PREDICT_TRUE (cached_protocol == gre[0]->protocol))
+       {
+         nidx[0] = cached_next_index;
+       }
+      else
+       {
+         cached_next_index = nidx[0] =
+           sparse_vec_index (gm->next_by_protocol, gre[0]->protocol);
+         cached_protocol = gre[0]->protocol;
+       }
+      if (PREDICT_TRUE (cached_protocol == gre[1]->protocol))
+       {
+         nidx[1] = cached_next_index;
+       }
+      else
+       {
+         cached_next_index = nidx[1] =
+           sparse_vec_index (gm->next_by_protocol, gre[1]->protocol);
+         cached_protocol = gre[1]->protocol;
+       }
+
+      ni[0] = vec_elt (gm->next_by_protocol, nidx[0]);
+      ni[1] = vec_elt (gm->next_by_protocol, nidx[1]);
+      next[0] = ni[0].next_index;
+      next[1] = ni[1].next_index;
+      type[0] = ni[0].tunnel_type;
+      type[1] = ni[1].tunnel_type;
+
+      b[0]->error = nidx[0] == SPARSE_VEC_INVALID_INDEX
+       ? node->errors[GRE_ERROR_UNKNOWN_PROTOCOL]
+       : node->errors[GRE_ERROR_NONE];
+      b[1]->error = nidx[1] == SPARSE_VEC_INVALID_INDEX
+       ? node->errors[GRE_ERROR_UNKNOWN_PROTOCOL]
+       : node->errors[GRE_ERROR_NONE];
+
+      version[0] = clib_net_to_host_u16 (gre[0]->flags_and_version);
+      version[1] = clib_net_to_host_u16 (gre[1]->flags_and_version);
+      version[0] &= GRE_VERSION_MASK;
+      version[1] &= GRE_VERSION_MASK;
+
+      b[0]->error = version[0]
+       ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION] : b[0]->error;
+      next[0] = version[0] ? GRE_INPUT_NEXT_DROP : next[0];
+      b[1]->error = version[1]
+       ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION] : b[1]->error;
+      next[1] = version[1] ? GRE_INPUT_NEXT_DROP : next[1];
+
+      len[0] = vlib_buffer_length_in_chain (vm, b[0]);
+      len[1] = vlib_buffer_length_in_chain (vm, b[1]);
+
+      if (is_ipv6)
+       {
+         gre_mk_key6 (&ip6[0]->dst_address,
+                      &ip6[0]->src_address,
+                      vnet_buffer (b[0])->ip.fib_index,
+                      type[0], 0, &key[0].gtk_v6);
+         gre_mk_key6 (&ip6[1]->dst_address,
+                      &ip6[1]->src_address,
+                      vnet_buffer (b[1])->ip.fib_index,
+                      type[1], 0, &key[1].gtk_v6);
+         matched[0] = gre_match_key6 (&cached_key.gtk_v6, &key[0].gtk_v6);
+         matched[1] = gre_match_key6 (&cached_key.gtk_v6, &key[1].gtk_v6);
+       }
+      else
+       {
+         gre_mk_key4 (ip4[0]->dst_address,
+                      ip4[0]->src_address,
+                      vnet_buffer (b[0])->ip.fib_index,
+                      type[0], 0, &key[0].gtk_v4);
+         gre_mk_key4 (ip4[1]->dst_address,
+                      ip4[1]->src_address,
+                      vnet_buffer (b[1])->ip.fib_index,
+                      type[1], 0, &key[1].gtk_v4);
+         matched[0] = gre_match_key4 (&cached_key.gtk_v4, &key[0].gtk_v4);
+         matched[1] = gre_match_key4 (&cached_key.gtk_v4, &key[1].gtk_v4);
+       }
+
+      tun_sw_if_index[0] = cached_tun_sw_if_index;
+      tun_sw_if_index[1] = cached_tun_sw_if_index;
+      if (PREDICT_FALSE (!matched[0]))
+       gre_tunnel_get (gm, node, b[0], &next[0], &key[0], &cached_key,
+                       &tun_sw_if_index[0], &cached_tun_sw_if_index,
+                       is_ipv6);
+      if (PREDICT_FALSE (!matched[1]))
+       gre_tunnel_get (gm, node, b[1], &next[1], &key[1], &cached_key,
+                       &tun_sw_if_index[1], &cached_tun_sw_if_index,
+                       is_ipv6);
+
+      if (PREDICT_TRUE (next[0] > GRE_INPUT_NEXT_DROP))
+       {
+         vlib_increment_combined_counter (&gm->vnet_main->
+                                          interface_main.combined_sw_if_counters
+                                          [VNET_INTERFACE_COUNTER_RX],
+                                          vm->thread_index,
+                                          tun_sw_if_index[0],
+                                          1 /* packets */ ,
+                                          len[0] /* bytes */ );
+         vnet_buffer (b[0])->sw_if_index[VLIB_RX] = tun_sw_if_index[0];
+       }
+      if (PREDICT_TRUE (next[1] > GRE_INPUT_NEXT_DROP))
+       {
+         vlib_increment_combined_counter (&gm->vnet_main->
+                                          interface_main.combined_sw_if_counters
+                                          [VNET_INTERFACE_COUNTER_RX],
+                                          vm->thread_index,
+                                          tun_sw_if_index[1],
+                                          1 /* packets */ ,
+                                          len[1] /* bytes */ );
+         vnet_buffer (b[1])->sw_if_index[VLIB_RX] = tun_sw_if_index[1];
+       }
 
-  from = vlib_frame_vector_args (from_frame);
-  n_left_from = from_frame->n_vectors;
+      if (PREDICT_FALSE (b[0]->flags & VLIB_BUFFER_IS_TRACED))
+       gre_trace (vm, node, b[0], tun_sw_if_index[0], ip6[0], ip4[0],
+                  is_ipv6);
+      if (PREDICT_FALSE (b[1]->flags & VLIB_BUFFER_IS_TRACED))
+       gre_trace (vm, node, b[1], tun_sw_if_index[1], ip6[1], ip4[1],
+                  is_ipv6);
 
-  next_index = node->cached_next_index;
+      b += 2;
+      next += 2;
+      n_left_from -= 2;
+    }
 
-  while (n_left_from > 0)
+  while (n_left_from >= 1)
     {
-      u32 n_left_to_next;
+      const ip6_header_t *ip6[1];
+      const ip4_header_t *ip4[1];
+      const gre_header_t *gre[1];
+      u32 nidx[1];
+      next_info_t ni[1];
+      u8 type[1];
+      u16 version[1];
+      u32 len[1];
+      gre_tunnel_key_t key[1];
+      u8 matched[1];
+      u32 tun_sw_if_index[1];
+
+      if (PREDICT_TRUE (n_left_from >= 3))
+       {
+         vlib_prefetch_buffer_data (b[1], LOAD);
+         vlib_prefetch_buffer_header (b[2], STORE);
+       }
 
-      vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
+      if (is_ipv6)
+       {
+         /* ip6_local hands us the ip header, not the gre header */
+         ip6[0] = vlib_buffer_get_current (b[0]);
+         gre[0] = (void *) (ip6[0] + 1);
+         vlib_buffer_advance (b[0], sizeof (*ip6[0]) + sizeof (*gre[0]));
+       }
+      else
+       {
+         /* ip4_local hands us the ip header, not the gre header */
+         ip4[0] = vlib_buffer_get_current (b[0]);
+         gre[0] = (void *) (ip4[0] + 1);
+         vlib_buffer_advance (b[0], sizeof (*ip4[0]) + sizeof (*gre[0]));
+       }
 
-      while (n_left_from >= 4 && n_left_to_next >= 2)
+      if (PREDICT_TRUE (cached_protocol == gre[0]->protocol))
        {
-         u32 bi0, bi1;
-         vlib_buffer_t *b0, *b1;
-         gre_header_t *h0, *h1;
-         u16 version0, version1;
-         int verr0, verr1;
-         u32 i0, i1, next0, next1, protocol0, protocol1;
-         ip4_header_t *ip4_0, *ip4_1;
-         ip6_header_t *ip6_0, *ip6_1;
-         gre_tunnel_key_t key0, key1;
-
-         /* Prefetch next iteration. */
-         {
-           vlib_buffer_t *p2, *p3;
-
-           p2 = vlib_get_buffer (vm, from[2]);
-           p3 = vlib_get_buffer (vm, from[3]);
-
-           vlib_prefetch_buffer_header (p2, LOAD);
-           vlib_prefetch_buffer_header (p3, LOAD);
-
-           CLIB_PREFETCH (p2->data, sizeof (h0[0]), LOAD);
-           CLIB_PREFETCH (p3->data, sizeof (h1[0]), LOAD);
-         }
-
-         bi0 = from[0];
-         bi1 = from[1];
-         to_next[0] = bi0;
-         to_next[1] = bi1;
-         from += 2;
-         to_next += 2;
-         n_left_to_next -= 2;
-         n_left_from -= 2;
-
-         b0 = vlib_get_buffer (vm, bi0);
-         b1 = vlib_get_buffer (vm, bi1);
-
-         if (!is_ipv6)
-           {
-             /* ip4_local hands us the ip header, not the gre header */
-             ip4_0 = vlib_buffer_get_current (b0);
-             ip4_1 = vlib_buffer_get_current (b1);
-
-             vlib_buffer_advance (b0, sizeof (*ip4_0));
-             vlib_buffer_advance (b1, sizeof (*ip4_1));
-           }
-         else
-           {
-             /* ip6_local hands us the ip header, not the gre header */
-             ip6_0 = vlib_buffer_get_current (b0);
-             ip6_1 = vlib_buffer_get_current (b1);
-
-             vlib_buffer_advance (b0, sizeof (*ip6_0));
-             vlib_buffer_advance (b1, sizeof (*ip6_1));
-           }
-
-         h0 = vlib_buffer_get_current (b0);
-         h1 = vlib_buffer_get_current (b1);
-
-         /* Index sparse array with network byte order. */
-         protocol0 = h0->protocol;
-         protocol1 = h1->protocol;
-         sparse_vec_index2 (gm->next_by_protocol, protocol0, protocol1,
-                            &i0, &i1);
-         next0 = vec_elt (gm->next_by_protocol, i0);
-         next1 = vec_elt (gm->next_by_protocol, i1);
-
-         b0->error =
-           node->errors[i0 ==
-                        SPARSE_VEC_INVALID_INDEX ? GRE_ERROR_UNKNOWN_PROTOCOL
-                        : GRE_ERROR_NONE];
-         b1->error =
-           node->errors[i1 ==
-                        SPARSE_VEC_INVALID_INDEX ? GRE_ERROR_UNKNOWN_PROTOCOL
-                        : GRE_ERROR_NONE];
-
-         version0 = clib_net_to_host_u16 (h0->flags_and_version);
-         verr0 = version0 & GRE_VERSION_MASK;
-         version1 = clib_net_to_host_u16 (h1->flags_and_version);
-         verr1 = version1 & GRE_VERSION_MASK;
-
-         b0->error = verr0 ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION]
-           : b0->error;
-         next0 = verr0 ? GRE_INPUT_NEXT_DROP : next0;
-         b1->error = verr1 ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION]
-           : b1->error;
-         next1 = verr1 ? GRE_INPUT_NEXT_DROP : next1;
-
-
-         /* RPF check for ip4/ip6 input */
-         if (PREDICT_TRUE (next0 == GRE_INPUT_NEXT_IP4_INPUT
-                           || next0 == GRE_INPUT_NEXT_IP6_INPUT
-                           || next0 == GRE_INPUT_NEXT_ETHERNET_INPUT
-                           || next0 == GRE_INPUT_NEXT_MPLS_INPUT))
-           {
-             if (is_ipv6)
-               {
-                 gre_mk_key6 (&ip6_0->dst_address,
-                              &ip6_0->src_address,
-                              vnet_buffer (b0)->ip.fib_index, &key0.gtk_v6);
-               }
-             else
-               {
-                 gre_mk_key4 (&ip4_0->dst_address,
-                              &ip4_0->src_address,
-                              vnet_buffer (b0)->ip.fib_index, &key0.gtk_v4);
-               }
-
-             if ((!is_ipv6 && !gre_match_key4 (&cached_tunnel_key.gtk_v4,
-                                               &key0.gtk_v4)) ||
-                 (is_ipv6 && !gre_match_key6 (&cached_tunnel_key.gtk_v6,
-                                              &key0.gtk_v6)))
-               {
-                 gre_tunnel_t *t;
-                 uword *p;
-
-                 if (!is_ipv6)
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key4, &key0.gtk_v4);
-                   }
-                 else
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key6, &key0.gtk_v6);
-                   }
-                 if (!p)
-                   {
-                     next0 = GRE_INPUT_NEXT_DROP;
-                     b0->error = node->errors[GRE_ERROR_NO_SUCH_TUNNEL];
-                     goto drop0;
-                   }
-                 t = pool_elt_at_index (gm->tunnels, p[0]);
-                 tunnel_sw_if_index = t->sw_if_index;
-
-                 cached_tunnel_sw_if_index = tunnel_sw_if_index;
-                 if (!is_ipv6)
-                   {
-                     cached_tunnel_key.gtk_v4 = key0.gtk_v4;
-                   }
-                 else
-                   {
-                     cached_tunnel_key.gtk_v6 = key0.gtk_v6;
-                   }
-               }
-             else
-               {
-                 tunnel_sw_if_index = cached_tunnel_sw_if_index;
-               }
-           }
-         else
-           {
-             next0 = GRE_INPUT_NEXT_DROP;
-             goto drop0;
-           }
-         len = vlib_buffer_length_in_chain (vm, b0);
-         vlib_increment_combined_counter (im->combined_sw_if_counters
-                                          + VNET_INTERFACE_COUNTER_RX,
-                                          thread_index,
-                                          tunnel_sw_if_index,
-                                          1 /* packets */ ,
-                                          len /* bytes */ );
-
-         vnet_buffer (b0)->sw_if_index[VLIB_RX] = tunnel_sw_if_index;
-
-       drop0:
-         if (PREDICT_TRUE (next1 == GRE_INPUT_NEXT_IP4_INPUT
-                           || next1 == GRE_INPUT_NEXT_IP6_INPUT
-                           || next1 == GRE_INPUT_NEXT_ETHERNET_INPUT
-                           || next1 == GRE_INPUT_NEXT_MPLS_INPUT))
-           {
-             if (is_ipv6)
-               {
-                 gre_mk_key6 (&ip6_1->dst_address,
-                              &ip6_1->src_address,
-                              vnet_buffer (b1)->ip.fib_index, &key1.gtk_v6);
-               }
-             else
-               {
-                 gre_mk_key4 (&ip4_1->dst_address,
-                              &ip4_1->src_address,
-                              vnet_buffer (b1)->ip.fib_index, &key1.gtk_v4);
-               }
-
-             if ((!is_ipv6 && !gre_match_key4 (&cached_tunnel_key.gtk_v4,
-                                               &key1.gtk_v4)) ||
-                 (is_ipv6 && !gre_match_key6 (&cached_tunnel_key.gtk_v6,
-                                              &key1.gtk_v6)))
-               {
-                 gre_tunnel_t *t;
-                 uword *p;
-
-                 if (!is_ipv6)
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key4, &key1.gtk_v4);
-                   }
-                 else
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key6, &key1.gtk_v6);
-                   }
-                 if (!p)
-                   {
-                     next1 = GRE_INPUT_NEXT_DROP;
-                     b1->error = node->errors[GRE_ERROR_NO_SUCH_TUNNEL];
-                     goto drop1;
-                   }
-                 t = pool_elt_at_index (gm->tunnels, p[0]);
-                 tunnel_sw_if_index = t->sw_if_index;
-
-                 cached_tunnel_sw_if_index = tunnel_sw_if_index;
-                 if (!is_ipv6)
-                   {
-                     cached_tunnel_key.gtk_v4 = key1.gtk_v4;
-                   }
-                 else
-                   {
-                     cached_tunnel_key.gtk_v6 = key1.gtk_v6;
-                   }
-               }
-             else
-               {
-                 tunnel_sw_if_index = cached_tunnel_sw_if_index;
-               }
-           }
-         else
-           {
-             next1 = GRE_INPUT_NEXT_DROP;
-             goto drop1;
-           }
-         len = vlib_buffer_length_in_chain (vm, b1);
-         vlib_increment_combined_counter (im->combined_sw_if_counters
-                                          + VNET_INTERFACE_COUNTER_RX,
-                                          thread_index,
-                                          tunnel_sw_if_index,
-                                          1 /* packets */ ,
-                                          len /* bytes */ );
-
-         vnet_buffer (b1)->sw_if_index[VLIB_RX] = tunnel_sw_if_index;
-
-       drop1:
-         if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED))
-           {
-             gre_rx_trace_t *tr = vlib_add_trace (vm, node,
-                                                  b0, sizeof (*tr));
-             tr->tunnel_id = tunnel_sw_if_index;
-             if (!is_ipv6)
-               {
-                 tr->length = ip4_0->length;
-                 tr->src.ip4.as_u32 = ip4_0->src_address.as_u32;
-                 tr->dst.ip4.as_u32 = ip4_0->dst_address.as_u32;
-               }
-             else
-               {
-                 tr->length = ip6_0->payload_length;
-                 tr->src.ip6.as_u64[0] = ip6_0->src_address.as_u64[0];
-                 tr->src.ip6.as_u64[1] = ip6_0->src_address.as_u64[1];
-                 tr->dst.ip6.as_u64[0] = ip6_0->dst_address.as_u64[0];
-                 tr->dst.ip6.as_u64[1] = ip6_0->dst_address.as_u64[1];
-               }
-           }
-
-         if (PREDICT_FALSE (b1->flags & VLIB_BUFFER_IS_TRACED))
-           {
-             gre_rx_trace_t *tr = vlib_add_trace (vm, node,
-                                                  b1, sizeof (*tr));
-             tr->tunnel_id = tunnel_sw_if_index;
-             if (!is_ipv6)
-               {
-                 tr->length = ip4_1->length;
-                 tr->src.ip4.as_u32 = ip4_1->src_address.as_u32;
-                 tr->dst.ip4.as_u32 = ip4_1->dst_address.as_u32;
-               }
-             else
-               {
-                 tr->length = ip6_1->payload_length;
-                 tr->src.ip6.as_u64[0] = ip6_1->src_address.as_u64[0];
-                 tr->src.ip6.as_u64[1] = ip6_1->src_address.as_u64[1];
-                 tr->dst.ip6.as_u64[0] = ip6_1->dst_address.as_u64[0];
-                 tr->dst.ip6.as_u64[1] = ip6_1->dst_address.as_u64[1];
-               }
-           }
-
-         vlib_buffer_advance (b0, sizeof (*h0));
-         vlib_buffer_advance (b1, sizeof (*h1));
-
-         vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
-                                          to_next, n_left_to_next,
-                                          bi0, bi1, next0, next1);
+         nidx[0] = cached_next_index;
        }
+      else
+       {
+         cached_next_index = nidx[0] =
+           sparse_vec_index (gm->next_by_protocol, gre[0]->protocol);
+         cached_protocol = gre[0]->protocol;
+       }
+
+      ni[0] = vec_elt (gm->next_by_protocol, nidx[0]);
+      next[0] = ni[0].next_index;
+      type[0] = ni[0].tunnel_type;
+
+      b[0]->error = nidx[0] == SPARSE_VEC_INVALID_INDEX
+       ? node->errors[GRE_ERROR_UNKNOWN_PROTOCOL]
+       : node->errors[GRE_ERROR_NONE];
+
+      version[0] = clib_net_to_host_u16 (gre[0]->flags_and_version);
+      version[0] &= GRE_VERSION_MASK;
+
+      b[0]->error = version[0]
+       ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION] : b[0]->error;
+      next[0] = version[0] ? GRE_INPUT_NEXT_DROP : next[0];
+
+      len[0] = vlib_buffer_length_in_chain (vm, b[0]);
+
+      if (is_ipv6)
+       {
+         gre_mk_key6 (&ip6[0]->dst_address,
+                      &ip6[0]->src_address,
+                      vnet_buffer (b[0])->ip.fib_index,
+                      type[0], 0, &key[0].gtk_v6);
+         matched[0] = gre_match_key6 (&cached_key.gtk_v6, &key[0].gtk_v6);
+       }
+      else
+       {
+         gre_mk_key4 (ip4[0]->dst_address,
+                      ip4[0]->src_address,
+                      vnet_buffer (b[0])->ip.fib_index,
+                      type[0], 0, &key[0].gtk_v4);
+         matched[0] = gre_match_key4 (&cached_key.gtk_v4, &key[0].gtk_v4);
+       }
+
+      tun_sw_if_index[0] = cached_tun_sw_if_index;
+      if (PREDICT_FALSE (!matched[0]))
+       gre_tunnel_get (gm, node, b[0], &next[0], &key[0], &cached_key,
+                       &tun_sw_if_index[0], &cached_tun_sw_if_index,
+                       is_ipv6);
 
-      while (n_left_from > 0 && n_left_to_next > 0)
+      if (PREDICT_TRUE (next[0] > GRE_INPUT_NEXT_DROP))
        {
-         u32 bi0;
-         vlib_buffer_t *b0;
-         gre_header_t *h0;
-         ip4_header_t *ip4_0;
-         ip6_header_t *ip6_0;
-         u16 version0;
-         int verr0;
-         u32 i0, next0;
-         gre_tunnel_key_t key0;
-
-         bi0 = from[0];
-         to_next[0] = bi0;
-         from += 1;
-         to_next += 1;
-         n_left_from -= 1;
-         n_left_to_next -= 1;
-
-         b0 = vlib_get_buffer (vm, bi0);
-         ip4_0 = vlib_buffer_get_current (b0);
-         ip6_0 = (void *) ip4_0;
-
-         if (!is_ipv6)
-           {
-             vlib_buffer_advance (b0, sizeof (*ip4_0));
-           }
-         else
-           {
-             vlib_buffer_advance (b0, sizeof (*ip6_0));
-           }
-
-         h0 = vlib_buffer_get_current (b0);
-
-         i0 = sparse_vec_index (gm->next_by_protocol, h0->protocol);
-         next0 = vec_elt (gm->next_by_protocol, i0);
-
-         b0->error =
-           node->errors[i0 == SPARSE_VEC_INVALID_INDEX
-                        ? GRE_ERROR_UNKNOWN_PROTOCOL : GRE_ERROR_NONE];
-
-         version0 = clib_net_to_host_u16 (h0->flags_and_version);
-         verr0 = version0 & GRE_VERSION_MASK;
-         b0->error = verr0 ? node->errors[GRE_ERROR_UNSUPPORTED_VERSION]
-           : b0->error;
-         next0 = verr0 ? GRE_INPUT_NEXT_DROP : next0;
-
-
-         /* For IP payload we need to find source interface
-            so we can increase counters and help forward node to
-            pick right FIB */
-         /* RPF check for ip4/ip6 input */
-         if (PREDICT_TRUE (next0 == GRE_INPUT_NEXT_IP4_INPUT
-                           || next0 == GRE_INPUT_NEXT_IP6_INPUT
-                           || next0 == GRE_INPUT_NEXT_ETHERNET_INPUT
-                           || next0 == GRE_INPUT_NEXT_MPLS_INPUT))
-           {
-             if (is_ipv6)
-               {
-                 gre_mk_key6 (&ip6_0->dst_address,
-                              &ip6_0->src_address,
-                              vnet_buffer (b0)->ip.fib_index, &key0.gtk_v6);
-               }
-             else
-               {
-                 gre_mk_key4 (&ip4_0->dst_address,
-                              &ip4_0->src_address,
-                              vnet_buffer (b0)->ip.fib_index, &key0.gtk_v4);
-               }
-
-             if ((!is_ipv6 && !gre_match_key4 (&cached_tunnel_key.gtk_v4,
-                                               &key0.gtk_v4)) ||
-                 (is_ipv6 && !gre_match_key6 (&cached_tunnel_key.gtk_v6,
-                                              &key0.gtk_v6)))
-               {
-                 gre_tunnel_t *t;
-                 uword *p;
-
-                 if (!is_ipv6)
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key4, &key0.gtk_v4);
-                   }
-                 else
-                   {
-                     p = hash_get_mem (gm->tunnel_by_key6, &key0.gtk_v6);
-                   }
-                 if (!p)
-                   {
-                     next0 = GRE_INPUT_NEXT_DROP;
-                     b0->error = node->errors[GRE_ERROR_NO_SUCH_TUNNEL];
-                     goto drop;
-                   }
-                 t = pool_elt_at_index (gm->tunnels, p[0]);
-                 tunnel_sw_if_index = t->sw_if_index;
-
-                 cached_tunnel_sw_if_index = tunnel_sw_if_index;
-                 if (!is_ipv6)
-                   {
-                     cached_tunnel_key.gtk_v4 = key0.gtk_v4;
-                   }
-                 else
-                   {
-                     cached_tunnel_key.gtk_v6 = key0.gtk_v6;
-                   }
-               }
-             else
-               {
-                 tunnel_sw_if_index = cached_tunnel_sw_if_index;
-               }
-           }
-         else
-           {
-             next0 = GRE_INPUT_NEXT_DROP;
-             goto drop;
-           }
-         len = vlib_buffer_length_in_chain (vm, b0);
-         vlib_increment_combined_counter (im->combined_sw_if_counters
-                                          + VNET_INTERFACE_COUNTER_RX,
-                                          thread_index,
-                                          tunnel_sw_if_index,
+         vlib_increment_combined_counter (&gm->vnet_main->
+                                          interface_main.combined_sw_if_counters
+                                          [VNET_INTERFACE_COUNTER_RX],
+                                          vm->thread_index,
+                                          tun_sw_if_index[0],
                                           1 /* packets */ ,
-                                          len /* bytes */ );
-
-         vnet_buffer (b0)->sw_if_index[VLIB_RX] = tunnel_sw_if_index;
-
-       drop:
-         if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED))
-           {
-             gre_rx_trace_t *tr = vlib_add_trace (vm, node,
-                                                  b0, sizeof (*tr));
-             tr->tunnel_id = tunnel_sw_if_index;
-             if (!is_ipv6)
-               {
-                 tr->length = ip4_0->length;
-                 tr->src.ip4.as_u32 = ip4_0->src_address.as_u32;
-                 tr->dst.ip4.as_u32 = ip4_0->dst_address.as_u32;
-               }
-             else
-               {
-                 tr->length = ip6_0->payload_length;
-                 tr->src.ip6.as_u64[0] = ip6_0->src_address.as_u64[0];
-                 tr->src.ip6.as_u64[1] = ip6_0->src_address.as_u64[1];
-                 tr->dst.ip6.as_u64[0] = ip6_0->dst_address.as_u64[0];
-                 tr->dst.ip6.as_u64[1] = ip6_0->dst_address.as_u64[1];
-               }
-           }
-
-         vlib_buffer_advance (b0, sizeof (*h0));
-
-         vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
-                                          to_next, n_left_to_next,
-                                          bi0, next0);
+                                          len[0] /* bytes */ );
+         vnet_buffer (b[0])->sw_if_index[VLIB_RX] = tun_sw_if_index[0];
        }
 
-      vlib_put_next_frame (vm, node, next_index, n_left_to_next);
+      if (PREDICT_FALSE (b[0]->flags & VLIB_BUFFER_IS_TRACED))
+       gre_trace (vm, node, b[0], tun_sw_if_index[0], ip6[0], ip4[0],
+                  is_ipv6);
+
+      b += 1;
+      next += 1;
+      n_left_from -= 1;
     }
+
+  vlib_buffer_enqueue_to_next (vm, node, from, nexts, frame->n_vectors);
+
   vlib_node_increment_counter (vm,
-                              !is_ipv6 ? gre4_input_node.index :
-                              gre6_input_node.index, GRE_ERROR_PKTS_DECAP,
-                              from_frame->n_vectors);
-  return from_frame->n_vectors;
+                              is_ipv6 ? gre6_input_node.index :
+                              gre4_input_node.index, GRE_ERROR_PKTS_DECAP,
+                              n_left_from);
+
+  return frame->n_vectors;
 }
 
-static uword
-gre4_input (vlib_main_t * vm,
-           vlib_node_runtime_t * node, vlib_frame_t * from_frame)
+VLIB_NODE_FN (gre4_input_node) (vlib_main_t * vm,
+                               vlib_node_runtime_t * node,
+                               vlib_frame_t * from_frame)
 {
   return gre_input (vm, node, from_frame, /* is_ip6 */ 0);
 }
 
-static uword
-gre6_input (vlib_main_t * vm,
-           vlib_node_runtime_t * node, vlib_frame_t * from_frame)
+VLIB_NODE_FN (gre6_input_node) (vlib_main_t * vm,
+                               vlib_node_runtime_t * node,
+                               vlib_frame_t * from_frame)
 {
   return gre_input (vm, node, from_frame, /* is_ip6 */ 1);
 }
@@ -573,7 +451,6 @@ static char *gre_error_strings[] = {
 
 /* *INDENT-OFF* */
 VLIB_REGISTER_NODE (gre4_input_node) = {
-  .function = gre4_input,
   .name = "gre4-input",
   /* Takes a vector of packets. */
   .vector_size = sizeof (u32),
@@ -592,11 +469,8 @@ VLIB_REGISTER_NODE (gre4_input_node) = {
   .format_trace = format_gre_rx_trace,
   .unformat_buffer = unformat_gre_header,
 };
-/* *INDENT-ON* */
 
-/* *INDENT-OFF* */
 VLIB_REGISTER_NODE (gre6_input_node) = {
-  .function = gre6_input,
   .name = "gre6-input",
   /* Takes a vector of packets. */
   .vector_size = sizeof (u32),
@@ -619,15 +493,15 @@ VLIB_REGISTER_NODE (gre6_input_node) = {
 };
 /* *INDENT-ON* */
 
-VLIB_NODE_FUNCTION_MULTIARCH (gre4_input_node, gre4_input)
-VLIB_NODE_FUNCTION_MULTIARCH (gre6_input_node, gre6_input)
-     void
-       gre_register_input_protocol (vlib_main_t * vm,
-                                   gre_protocol_t protocol, u32 node_index)
+#ifndef CLIB_MARCH_VARIANT
+void
+gre_register_input_protocol (vlib_main_t * vm,
+                            gre_protocol_t protocol, u32 node_index,
+                            gre_tunnel_type_t tunnel_type)
 {
   gre_main_t *em = &gre_main;
   gre_protocol_info_t *pi;
-  u16 *n;
+  next_info_t *n;
   u32 i;
 
   {
@@ -638,6 +512,7 @@ VLIB_NODE_FUNCTION_MULTIARCH (gre6_input_node, gre6_input)
 
   pi = gre_get_protocol_info (em, protocol);
   pi->node_index = node_index;
+  pi->tunnel_type = tunnel_type;
   pi->next_index = vlib_node_add_next (vm, gre4_input_node.index, node_index);
   i = vlib_node_add_next (vm, gre6_input_node.index, node_index);
   ASSERT (i == pi->next_index);
@@ -645,7 +520,8 @@ VLIB_NODE_FUNCTION_MULTIARCH (gre6_input_node, gre6_input)
   /* Setup gre protocol -> next index sparse vector mapping. */
   n = sparse_vec_validate (em->next_by_protocol,
                           clib_host_to_net_u16 (protocol));
-  n[0] = pi->next_index;
+  n->next_index = pi->next_index;
+  n->tunnel_type = tunnel_type;
 }
 
 static void
@@ -689,14 +565,17 @@ gre_input_init (vlib_main_t * vm)
   mpls_unicast_input = vlib_get_node_by_name (vm, (u8 *) "mpls-input");
   ASSERT (mpls_unicast_input);
 
-  gre_register_input_protocol (vm, GRE_PROTOCOL_teb, ethernet_input->index);
+  gre_register_input_protocol (vm, GRE_PROTOCOL_teb,
+                              ethernet_input->index, GRE_TUNNEL_TYPE_TEB);
 
-  gre_register_input_protocol (vm, GRE_PROTOCOL_ip4, ip4_input->index);
+  gre_register_input_protocol (vm, GRE_PROTOCOL_ip4,
+                              ip4_input->index, GRE_TUNNEL_TYPE_L3);
 
-  gre_register_input_protocol (vm, GRE_PROTOCOL_ip6, ip6_input->index);
+  gre_register_input_protocol (vm, GRE_PROTOCOL_ip6,
+                              ip6_input->index, GRE_TUNNEL_TYPE_L3);
 
   gre_register_input_protocol (vm, GRE_PROTOCOL_mpls_unicast,
-                              mpls_unicast_input->index);
+                              mpls_unicast_input->index, GRE_TUNNEL_TYPE_L3);
 
   ip4_register_protocol (IP_PROTOCOL_GRE, gre4_input_node.index);
   ip6_register_protocol (IP_PROTOCOL_GRE, gre6_input_node.index);
@@ -706,6 +585,7 @@ gre_input_init (vlib_main_t * vm)
 
 VLIB_INIT_FUNCTION (gre_input_init);
 
+#endif /* CLIB_MARCH_VARIANT */
 /*
  * fd.io coding-style-patch-verification: ON
  *