LISP GPE: initial CP commit and DP improvements
[vpp.git] / vnet / vnet / lisp-gpe / decap.c
index e10f1f2..356dbf2 100644 (file)
@@ -1,7 +1,5 @@
 /*
- * decap.c: lisp-gpe decap processing
- *
- * Copyright (c) 2014 Cisco and/or its affiliates.
+ * Copyright (c) 2016 Cisco and/or its affiliates.
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at:
 #include <vnet/pg/pg.h>
 #include <vnet/lisp-gpe/lisp_gpe.h>
 
-typedef struct {
+typedef struct
+{ /* Per-packet trace record filled in by lisp_gpe_input for buffers that
+   * have VLIB_BUFFER_IS_TRACED set; format_lisp_gpe_rx_trace reads these
+   * same field names when printing a trace. */
   u32 next_index;	/* next node index chosen for the packet (next0/next1) */
   u32 tunnel_index;	/* formatter prints "no tunnel" when this is ~0.
			 * NOTE(review): the trace sites visible in this diff
			 * do not assign this field - confirm it is
			 * initialized elsewhere */
   u32 error;		/* error code recorded for the packet; the decap loop
			 * only sets b->error when this is non-zero */
   lisp_gpe_header_t h;	/* copy of the packet's lisp-gpe header (iul->lisp) */
 } lisp_gpe_rx_trace_t;
 
-static u8 * format_lisp_gpe_rx_trace (u8 * s, va_list * args)
+static u8 *
+format_lisp_gpe_rx_trace (u8 * s, va_list * args)
 {
   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
@@ -34,27 +34,55 @@ static u8 * format_lisp_gpe_rx_trace (u8 * s, va_list * args)
 
   if (t->tunnel_index != ~0)
     {
-      s = format (s, "NSH-VXLAN: tunnel %d next %d error %d", t->tunnel_index, 
-                  t->next_index, t->error);
+      s = format (s, "LISP-GPE: tunnel %d next %d error %d", t->tunnel_index,
+          t->next_index, t->error);
     }
   else
     {
-      s = format (s, "NSH-VXLAN: no tunnel next %d error %d\n", t->next_index, 
-                  t->error);
+      s = format (s, "LISP-GPE: no tunnel next %d error %d\n", t->next_index,
+          t->error);
     }
-  s = format (s, "\n  %U", format_lisp_gpe_header_with_length, &t->h, 
-              (u32) sizeof (t->h) /* max size */);
+  s = format (s, "\n  %U", format_lisp_gpe_header_with_length, &t->h,
+      (u32) sizeof (t->h) /* max size */);
   return s;
 }
 
+static u32
+next_proto_to_next_index[LISP_GPE_NEXT_PROTOS] ={ /* Lookup table indexed by
+     * the lisp-gpe header's next_protocol value; consulted by
+     * next_protocol_to_next_index once it has checked that the value is
+     * below LISP_GPE_NEXT_PROTOS. */
+    LISP_GPE_INPUT_NEXT_DROP,		/* 0 */
+    LISP_GPE_INPUT_NEXT_IP4_INPUT,	/* 1 */
+    LISP_GPE_INPUT_NEXT_IP6_INPUT,	/* 2 */
+    LISP_GPE_INPUT_NEXT_DROP,		/* 3: presumably Ethernet, not decapsulated here - TODO confirm */
+    LISP_GPE_INPUT_NEXT_DROP		/* 4: presumably NSH, not decapsulated here - TODO confirm */
+};
+
+static u32
+next_protocol_to_next_index (lisp_gpe_header_t * lgh, u8 * next_header)
+{
+  /* Choose the LISP_GPE_INPUT_NEXT_* index for a decapsulated packet.
+   * lgh is the packet's lisp-gpe header; next_header points at the data
+   * that follows it (the callers in this file pass
+   * vlib_buffer_get_current() after popping ip, udp and lisp-gpe).
+   * NOTE(review): nothing here checks that the buffer actually holds an
+   * inner header before it is read - confirm callers guarantee that.
+   *
+   * legacy lisp router: the P flag is clear, so next_protocol is not
+   * consulted. The payload is classified from the version nibble read
+   * through ip4_header_t's ip_version_and_header_length field:
+   * 0x4 -> ip4 input, 0x6 -> ip6 input, anything else -> drop. */
+  if (PREDICT_FALSE((lgh->flags & LISP_GPE_FLAGS_P) == 0))
+    {
+      ip4_header_t * iph = (ip4_header_t *) next_header;
+      if ((iph->ip_version_and_header_length & 0xF0) == 0x40)
+        return LISP_GPE_INPUT_NEXT_IP4_INPUT;
+      else if ((iph->ip_version_and_header_length & 0xF0) == 0x60)
+        return LISP_GPE_INPUT_NEXT_IP6_INPUT;
+      else
+        return LISP_GPE_INPUT_NEXT_DROP;
+    }
+  /* lisp-gpe router: the P flag is set, so next_protocol is translated
+   * through the next_proto_to_next_index table. Values at or above
+   * LISP_GPE_NEXT_PROTOS fall through to the final drop. */
+  else if ((lgh->flags & LISP_GPE_FLAGS_P)
+      && lgh->next_protocol < LISP_GPE_NEXT_PROTOS)
+    return next_proto_to_next_index[lgh->next_protocol];
+  else
+    return LISP_GPE_INPUT_NEXT_DROP;
+}
+
 static uword
-lisp_gpe_input (vlib_main_t * vm,
-                     vlib_node_runtime_t * node,
-                     vlib_frame_t * from_frame)
+lisp_gpe_input (vlib_main_t * vm, vlib_node_runtime_t * node,
+                vlib_frame_t * from_frame)
 {
   u32 n_left_from, next_index, * from, * to_next;
-  lisp_gpe_main_t * ngm = &lisp_gpe_main;
-  u32 last_tunnel_index = ~0;
   lisp_gpe_tunnel_key_t last_key;
   u32 pkts_decapsulated = 0;
 
@@ -69,182 +97,143 @@ lisp_gpe_input (vlib_main_t * vm,
     {
       u32 n_left_to_next;
 
-      vlib_get_next_frame (vm, node, next_index,
-                          to_next, n_left_to_next);
+      vlib_get_next_frame(vm, node, next_index, to_next, n_left_to_next);
 
-#if 0
       while (n_left_from >= 4 && n_left_to_next >= 2)
-       {
-         u32 bi0, bi1;
-         vlib_buffer_t * b0, * b1;
-         nsh_unicast_header_t * h0, * h1;
-          u32 label0, label1;
-         u32 next0, next1;
-         uword * p0, * p1;
-
-         /* Prefetch next iteration. */
-         {
-           vlib_buffer_t * p2, * p3;
-
-           p2 = vlib_get_buffer (vm, from[2]);
-           p3 = vlib_get_buffer (vm, from[3]);
-
-           vlib_prefetch_buffer_header (p2, LOAD);
-           vlib_prefetch_buffer_header (p3, LOAD);
-
-           CLIB_PREFETCH (p2->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
-           CLIB_PREFETCH (p3->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
-         }
-
-         bi0 = from[0];
-         bi1 = from[1];
-         to_next[0] = bi0;
-         to_next[1] = bi1;
-         from += 2;
-         to_next += 2;
-         n_left_to_next -= 2;
-         n_left_from -= 2;
-
-         b0 = vlib_get_buffer (vm, bi0);
-         b1 = vlib_get_buffer (vm, bi1);
-
-          h0 = vlib_buffer_get_current (b0);
-          h1 = vlib_buffer_get_current (b1);
-          
+        {
+          u32 bi0, bi1;
+          vlib_buffer_t * b0, * b1;
+          ip4_udp_lisp_gpe_header_t * iul0, * iul1;
+          u32 error0, error1;
+          u32 next0, next1;
+
           next0 = next1 = LISP_GPE_INPUT_NEXT_IP4_INPUT;
 
-          label0 = clib_net_to_host_u32 (h0->label_exp_s_ttl);
-          label1 = clib_net_to_host_u32 (h1->label_exp_s_ttl);
+          /* Prefetch next iteration. */
+          {
+            vlib_buffer_t * p2, * p3;
 
-         /* 
-          * Translate label contents into a fib index.
-          * This is a decent sanity check, and guarantees
-          * a sane FIB for the downstream lookup
-          */
-          label0 = vnet_nsh_uc_get_label (label0);
-          label1 = vnet_nsh_uc_get_label (label1);
+            p2 = vlib_get_buffer (vm, from[2]);
+            p3 = vlib_get_buffer (vm, from[3]);
 
-          /* If 2xlabels match, and match the 1-wide cache, use it */
-          if (label0 == label1 && rt->last_label == label0)
-            {
-              vnet_buffer(b0)->sw_if_index[VLIB_TX] = rt->last_fib_index;
-              vnet_buffer(b1)->sw_if_index[VLIB_TX] = rt->last_fib_index;
-            }
-          else
-            {
-              p0 = hash_get (rt->mm->fib_index_by_nsh_label, label0);
-              if (PREDICT_FALSE (p0 == 0))
-                {
-                  next0 = LISP_GPE_INPUT_NEXT_DROP;
-                  b0->error = node->errors[NSH_ERROR_BAD_LABEL];
-                }
-              else
-                vnet_buffer(b0)->sw_if_index[VLIB_TX] = p0[0];
-              
-              p1 = hash_get (rt->mm->fib_index_by_nsh_label, label1);
-              if (PREDICT_FALSE (p1 == 0))
-                {
-                  next1 = LISP_GPE_INPUT_NEXT_DROP;
-                  b1->error = node->errors[NSH_ERROR_BAD_LABEL];
-                }
-              else
-                {
-                  vnet_buffer(b1)->sw_if_index[VLIB_TX] = p1[0];
-                  rt->last_fib_index = p1[0];
-                  rt->last_label = label1;
-                }
-            }
+            vlib_prefetch_buffer_header (p2, LOAD);
+            vlib_prefetch_buffer_header (p3, LOAD);
 
-          if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) 
+            CLIB_PREFETCH (p2->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
+            CLIB_PREFETCH (p3->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
+          }
+
+          bi0 = from[0];
+          bi1 = from[1];
+          to_next[0] = bi0;
+          to_next[1] = bi1;
+          from += 2;
+          to_next += 2;
+          n_left_to_next -= 2;
+          n_left_from -= 2;
+
+          b0 = vlib_get_buffer (vm, bi0);
+          b1 = vlib_get_buffer (vm, bi1);
+
+          /* udp leaves current_data pointing at the lisp header */
+          vlib_buffer_advance (b0, - IP_UDP_HDR_LEN);
+          vlib_buffer_advance (b1, - IP_UDP_HDR_LEN);
+
+          iul0 = vlib_buffer_get_current (b0);
+          iul1 = vlib_buffer_get_current (b1);
+
+          /* pop (ip, udp, lisp-gpe) */
+          vlib_buffer_advance (b0, sizeof (*iul0));
+          vlib_buffer_advance (b1, sizeof (*iul1));
+
+          /* determine next_index from lisp-gpe header */
+          next0 = next_protocol_to_next_index (&iul0->lisp,
+                                               vlib_buffer_get_current (b0));
+          next1 = next_protocol_to_next_index (&iul1->lisp,
+                                               vlib_buffer_get_current (b1));
+
+          /* Required to make the l2 tag push / pop code work on l2 subifs */
+          vnet_update_l2_len (b0);
+          vnet_update_l2_len (b1);
+
+          /* TODO hash to map iid to fib */
+          vnet_buffer(b0)->sw_if_index[VLIB_TX] = iul0->lisp.iid;
+          vnet_buffer(b1)->sw_if_index[VLIB_TX] = iul1->lisp.iid;
+
+          pkts_decapsulated += 2;
+
+          /* TODO error handling if security is implemented */
+          error0 = error1 = 0;
+          b0->error = error0 ? node->errors[error0] : 0;
+          b1->error = error1 ? node->errors[error1] : 0;
+
+          if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED))
             {
-              nsh_rx_trace_t *tr = vlib_add_trace (vm, node, 
-                                                   b0, sizeof (*tr));
-              tr->label_exp_s_ttl = label0;
+              lisp_gpe_rx_trace_t *tr = vlib_add_trace (vm, node, b0,
+                                                        sizeof(*tr));
+              tr->next_index = next0;
+              tr->error = error0;
+              tr->h = iul0->lisp;
             }
-          if (PREDICT_FALSE(b1->flags & VLIB_BUFFER_IS_TRACED)) 
+
+          if (PREDICT_FALSE(b1->flags & VLIB_BUFFER_IS_TRACED))
             {
-              nsh_rx_trace_t *tr = vlib_add_trace (vm, node, 
-                                                   b1, sizeof (*tr));
-              tr->label_exp_s_ttl = label1;
+              lisp_gpe_rx_trace_t *tr = vlib_add_trace (vm, node, b1,
+                                                        sizeof(*tr));
+              tr->next_index = next1;
+              tr->error = error1;
+              tr->h = iul1->lisp;
             }
 
-          vlib_buffer_advance (b0, sizeof (*h0));
-          vlib_buffer_advance (b1, sizeof (*h1));
-
-         vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
-                                          to_next, n_left_to_next,
-                                          bi0, bi1, next0, next1);
-       }
-#endif 
+          vlib_validate_buffer_enqueue_x2(vm, node, next_index, to_next,
+                                          n_left_to_next, bi0, bi1, next0,
+                                          next1);
+        }
     
       while (n_left_from > 0 && n_left_to_next > 0)
-       {
-         u32 bi0;
-         vlib_buffer_t * b0;
-         u32 next0;
+        {
+          u32 bi0;
+          vlib_buffer_t * b0;
+          u32 next0;
           ip4_udp_lisp_gpe_header_t * iul0;
-         uword * p0;
-          u32 tunnel_index0;
-          lisp_gpe_tunnel_t * t0;
-          lisp_gpe_tunnel_key_t key0;
           u32 error0;
 
-         bi0 = from[0];
-         to_next[0] = bi0;
-         from += 1;
-         to_next += 1;
-         n_left_from -= 1;
-         n_left_to_next -= 1;
+          bi0 = from[0];
+          to_next[0] = bi0;
+          from += 1;
+          to_next += 1;
+          n_left_from -= 1;
+          n_left_to_next -= 1;
 
-         b0 = vlib_get_buffer (vm, bi0);
+          b0 = vlib_get_buffer (vm, bi0);
 
           /* udp leaves current_data pointing at the lisp header */
-          vlib_buffer_advance 
-            (b0, -(word)(sizeof(udp_header_t)+sizeof(ip4_header_t)));
+          vlib_buffer_advance (b0, - IP_UDP_HDR_LEN);
 
           iul0 = vlib_buffer_get_current (b0);
 
           /* pop (ip, udp, lisp-gpe) */
           vlib_buffer_advance (b0, sizeof (*iul0));
 
-          tunnel_index0 = ~0;
-          error0 = 0;
-          next0 = LISP_GPE_INPUT_NEXT_DROP;
-
-          key0.src = iul0->ip4.src_address.as_u32;
-          key0.iid = iul0->lisp.iid;
-
-          if (PREDICT_FALSE ((key0.as_u64[0] != last_key.as_u64[0])))
-            {
-              p0 = hash_get_mem (ngm->lisp_gpe_tunnel_by_key, &key0);
-
-              if (p0 == 0)
-                {
-                  error0 = LISP_GPE_ERROR_NO_SUCH_TUNNEL;
-                  goto trace0;
-                }
-
-              last_key.as_u64[0] = key0.as_u64[0];
-              tunnel_index0 = last_tunnel_index = p0[0];
-            }
-          else
-            tunnel_index0 = last_tunnel_index;
-
-          t0 = pool_elt_at_index (ngm->tunnels, tunnel_index0);
+          /* TODO if security is to be implemented, something similar to RPF,
+           * probably we'd like to check that the peer is allowed to send us
+           * packets. For this, we should use the tunnel table OR check that
+           * we have a mapping for the source eid and that the outer source of
+           * the packet is one of its locators */
 
-          next0 = t0->decap_next_index;
+          /* determine next_index from lisp-gpe header */
+          next0 = next_protocol_to_next_index (&iul0->lisp,
+                                               vlib_buffer_get_current (b0));
 
           /* Required to make the l2 tag push / pop code work on l2 subifs */
           vnet_update_l2_len (b0);
 
-          /* 
-           * ip[46] lookup in the configured FIB
-           * lisp-gpe-encap, here's the encap tunnel sw_if_index
-           */
-          vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
+          /* TODO hash to map iid to fib */
+          vnet_buffer(b0)->sw_if_index[VLIB_TX] = iul0->lisp.iid;
           pkts_decapsulated ++;
 
-        trace0:
+          /* TODO error handling if security is implemented */
+          error0 = 0;
           b0->error = error0 ? node->errors[error0] : 0;
 
           if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) 
@@ -253,13 +242,12 @@ lisp_gpe_input (vlib_main_t * vm,
                 = vlib_add_trace (vm, node, b0, sizeof (*tr));
               tr->next_index = next0;
               tr->error = error0;
-              tr->tunnel_index = tunnel_index0;
               tr->h = iul0->lisp;
             }
-         vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
-                                          to_next, n_left_to_next,
-                                          bi0, next0);
-       }
+
+          vlib_validate_buffer_enqueue_x1(vm, node, next_index, to_next,
+                                          n_left_to_next, bi0, next0);
+        }
 
       vlib_put_next_frame (vm, node, next_index, n_left_to_next);
     }