SFF NSH support VXLAN GPE
[vpp.git] / vnet / vnet / nsh-vxlan-gpe / decap.c
1 /*
 * decap.c: nsh-vxlan-gpe packet decapsulation
3  *
4  * Copyright (c) 2013 Cisco and/or its affiliates.
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at:
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17
18 #include <vlib/vlib.h>
19 #include <vnet/pg/pg.h>
20 #include <vnet/nsh-vxlan-gpe/nsh_vxlan_gpe.h>
21
/* Registration object for the "nsh-vxlan-gpe-input" graph node; it is
 * filled in by the VLIB_REGISTER_NODE block in this file and its index is
 * used when bumping the node's counters. */
vlib_node_registration_t nsh_vxlan_gpe_input_node;

/* From nsh-gre: formatter for an NSH header plus a maximum length.
 * Declared here because it is used both for trace output and as the
 * node's buffer formatter. */
u8 * format_nsh_header_with_length (u8 * s, va_list * args);
26
/* Per-packet trace record written by the input node for traced buffers
 * and rendered by format_nsh_vxlan_gpe_rx_trace. */
typedef struct {
  u32 next_index;    /* next-node index selected for the packet */
  u32 tunnel_index;  /* index of the matched tunnel, ~0 if none was found */
  u32 error;         /* node error code for the packet, 0 if none */
  nsh_header_t h;    /* copy of the NSH header taken from the packet */
} nsh_vxlan_gpe_rx_trace_t;
33
34 static u8 * format_nsh_vxlan_gpe_rx_trace (u8 * s, va_list * args)
35 {
36   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
37   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
38   nsh_vxlan_gpe_rx_trace_t * t = va_arg (*args, nsh_vxlan_gpe_rx_trace_t *);
39
40   if (t->tunnel_index != ~0)
41     {
42       s = format (s, "NSH-VXLAN: tunnel %d next %d error %d", t->tunnel_index, 
43                   t->next_index, t->error);
44     }
45   else
46     {
47       s = format (s, "NSH-VXLAN: no tunnel next %d error %d\n", t->next_index, 
48                   t->error);
49     }
50   s = format (s, "\n  %U", format_nsh_header_with_length, &t->h, 
51               (u32) sizeof (t->h) /* max size */);
52   return s;
53 }
54
55 static uword
56 nsh_vxlan_gpe_input (vlib_main_t * vm,
57                      vlib_node_runtime_t * node,
58                      vlib_frame_t * from_frame)
59 {
60   u32 n_left_from, next_index, * from, * to_next;
61   nsh_vxlan_gpe_main_t * ngm = &nsh_vxlan_gpe_main;
62   u32 last_tunnel_index = ~0;
63   nsh_vxlan_gpe_tunnel_key_t last_key;
64   u32 pkts_decapsulated = 0;
65
66   memset (&last_key, 0xff, sizeof (last_key));
67
68   from = vlib_frame_vector_args (from_frame);
69   n_left_from = from_frame->n_vectors;
70
71   next_index = node->cached_next_index;
72
73   while (n_left_from > 0)
74     {
75       u32 n_left_to_next;
76
77       vlib_get_next_frame (vm, node, next_index,
78                            to_next, n_left_to_next);
79
80       while (n_left_from >= 4 && n_left_to_next >= 2)
81         {
82           u32 bi0, bi1;
83           vlib_buffer_t * b0, * b1;
84           u32 next0, next1;
85           ip4_vxlan_gpe_and_nsh_header_t * iuvn0, * iuvn1;
86           uword * p0, * p1;
87           u32 tunnel_index0, tunnel_index1;
88           nsh_vxlan_gpe_tunnel_t * t0, * t1;
89           nsh_vxlan_gpe_tunnel_key_t key0, key1;
90           u32 error0, error1;
91
92           /* Prefetch next iteration. */
93           {
94             vlib_buffer_t * p2, * p3;
95
96             p2 = vlib_get_buffer (vm, from[2]);
97             p3 = vlib_get_buffer (vm, from[3]);
98
99             vlib_prefetch_buffer_header (p2, LOAD);
100             vlib_prefetch_buffer_header (p3, LOAD);
101
102             CLIB_PREFETCH (p2->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
103             CLIB_PREFETCH (p3->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
104           }
105
106           bi0 = from[0];
107           bi1 = from[1];
108           to_next[0] = bi0;
109           to_next[1] = bi1;
110           from += 2;
111           to_next += 2;
112           n_left_to_next -= 2;
113           n_left_from -= 2;
114
115           b0 = vlib_get_buffer (vm, bi0);
116           b1 = vlib_get_buffer (vm, bi1);
117
118           /* udp leaves current_data pointing at the vxlan header */
119           vlib_buffer_advance 
120             (b0, -(word)(sizeof(udp_header_t)+sizeof(ip4_header_t)));
121           vlib_buffer_advance 
122             (b1, -(word)(sizeof(udp_header_t)+sizeof(ip4_header_t)));
123
124           iuvn0 = vlib_buffer_get_current (b0);
125           iuvn1 = vlib_buffer_get_current (b1);
126
127           /* pop (ip, udp, vxlan, nsh) */
128           vlib_buffer_advance (b0, sizeof (*iuvn0));
129           vlib_buffer_advance (b1, sizeof (*iuvn1));
130
131           tunnel_index0 = ~0;
132           error0 = 0;
133           next0 = NSH_VXLAN_GPE_INPUT_NEXT_DROP;
134
135           tunnel_index1 = ~0;
136           error1 = 0;
137           next1 = NSH_VXLAN_GPE_INPUT_NEXT_DROP;
138
139           key0.src = iuvn0->ip4.src_address.as_u32;
140           key0.vni = iuvn0->vxlan.vni_res;
141           key0.spi_si = iuvn0->nsh.spi_si;
142           key0.pad = 0;
143
144           if (PREDICT_FALSE ((key0.as_u64[0] != last_key.as_u64[0])
145                              || (key0.as_u64[1] != last_key.as_u64[1])))
146             {
147               p0 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &key0);
148
149               if (p0 == 0)
150                 {
151                   error0 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
152                   goto trace0;
153                 }
154
155               last_key.as_u64[0] = key0.as_u64[0];
156               last_key.as_u64[1] = key0.as_u64[1];
157               tunnel_index0 = last_tunnel_index = p0[0];
158             }
159           else
160             tunnel_index0 = last_tunnel_index;
161
162           t0 = pool_elt_at_index (ngm->tunnels, tunnel_index0);
163
164           next0 = t0->decap_next_index;
165
166           /* Required to make the l2 tag push / pop code work on l2 subifs */
167           vnet_update_l2_len (b0);
168
169           if (next0 == NSH_VXLAN_GPE_INPUT_NEXT_NSH_VXLAN_GPE_ENCAP)
170             {
171               /*
172                * Functioning as SFF (ie "half NSH tunnel mode")
173                * If ingress (we are in decap.c) with NSH header, and 'decap next nsh-vxlan-gpe' then "NSH switch"
174                * 1. Take DST, remap to SRC, remap other keys in place
175                * 2. Look up new t0 as per above
176                * 3. Set sw_if_index[VLIB_TX] to be t0->sw_if_index
177                */
178               uword * next_p0;
179               nsh_vxlan_gpe_tunnel_t  * next_t0;
180               nsh_vxlan_gpe_tunnel_key_t next_key0;
181
182               next_key0.src = iuvn0->ip4.dst_address.as_u32;
183               next_key0.vni = iuvn0->vxlan.vni_res;
184               next_key0.spi_si = iuvn0->nsh.spi_si;
185               next_key0.pad = 0;
186
187               next_p0 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &next_key0);
188
189               if (next_p0 == 0)
190                 {
191                   error0 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
192                   goto trace0;
193                 }
194               next_t0 = pool_elt_at_index (ngm->tunnels, next_p0[0]);
195               vnet_buffer(b0)->sw_if_index[VLIB_TX] = next_t0->sw_if_index;
196
197             }
198           else
199             {
200               /*
201                * ip[46] lookup in the configured FIB
202                * nsh-vxlan-gpe-encap, here's the encap tunnel sw_if_index
203                */
204               vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
205             }
206
207
208         trace0:
209           b0->error = error0 ? node->errors[error0] : 0;
210
211           if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) 
212             {
213               nsh_vxlan_gpe_rx_trace_t *tr 
214                 = vlib_add_trace (vm, node, b0, sizeof (*tr));
215               tr->next_index = next0;
216               tr->error = error0;
217               tr->tunnel_index = tunnel_index0;
218               tr->h = iuvn0->nsh;
219             }
220
221           key1.src = iuvn1->ip4.src_address.as_u32;
222           key1.vni = iuvn1->vxlan.vni_res;
223           key1.spi_si = iuvn1->nsh.spi_si;
224           key1.pad = 0;
225
226           if (PREDICT_FALSE ((key1.as_u64[0] != last_key.as_u64[0])
227                              || (key1.as_u64[1] != last_key.as_u64[1])))
228             {
229               p1 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &key1);
230
231               if (p1 == 0)
232                 {
233                   error1 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
234                   goto trace1;
235                 }
236
237               last_key.as_u64[0] = key1.as_u64[0];
238               last_key.as_u64[1] = key1.as_u64[1];
239               tunnel_index1 = last_tunnel_index = p1[0];
240             }
241           else
242             tunnel_index1 = last_tunnel_index;
243
244           t1 = pool_elt_at_index (ngm->tunnels, tunnel_index1);
245
246           next1 = t1->decap_next_index;
247
248           /* Required to make the l2 tag push / pop code work on l2 subifs */
249           vnet_update_l2_len (b1);
250
251           if (next1 == NSH_VXLAN_GPE_INPUT_NEXT_NSH_VXLAN_GPE_ENCAP)
252             {
253               /*
254                * Functioning as SFF (ie "half NSH tunnel mode")
255                * If ingress (we are in decap.c) with NSH header, and 'decap next nsh-vxlan-gpe' then "NSH switch"
256                * 1. Take DST, remap to SRC, remap other keys in place
257                * 2. Look up new t0 as per above
258                * 3. Set sw_if_index[VLIB_TX] to be t0->sw_if_index
259                */
260               uword * next_p1;
261               nsh_vxlan_gpe_tunnel_t  * next_t1;
262               nsh_vxlan_gpe_tunnel_key_t next_key1;
263
264               next_key1.src = iuvn0->ip4.dst_address.as_u32;
265               next_key1.vni = iuvn0->vxlan.vni_res;
266               next_key1.spi_si = iuvn0->nsh.spi_si;
267               next_key1.pad = 0;
268
269               next_p1 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &next_key1);
270
271               if (next_p1 == 0)
272                 {
273                   error1 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
274                   goto trace1;
275                 }
276               next_t1 = pool_elt_at_index (ngm->tunnels, next_p1[0]);
277               vnet_buffer(b1)->sw_if_index[VLIB_TX] = next_t1->sw_if_index;
278
279             }
280           else
281             {
282               /*
283                * ip[46] lookup in the configured FIB
284                * nsh-vxlan-gpe-encap, here's the encap tunnel sw_if_index
285                */
286               vnet_buffer(b1)->sw_if_index[VLIB_TX] = t1->decap_fib_index;
287             }
288
289           vnet_buffer(b1)->sw_if_index[VLIB_TX] = t1->decap_fib_index;
290           pkts_decapsulated += 2;
291
292         trace1:
293           b1->error = error1 ? node->errors[error1] : 0;
294
295           if (PREDICT_FALSE(b1->flags & VLIB_BUFFER_IS_TRACED)) 
296             {
297               nsh_vxlan_gpe_rx_trace_t *tr 
298                 = vlib_add_trace (vm, node, b1, sizeof (*tr));
299               tr->next_index = next1;
300               tr->error = error1;
301               tr->tunnel_index = tunnel_index1;
302               tr->h = iuvn1->nsh;
303             }
304
305           vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
306                                            to_next, n_left_to_next,
307                                            bi0, bi1, next0, next1);
308         }
309     
310       while (n_left_from > 0 && n_left_to_next > 0)
311         {
312           u32 bi0;
313           vlib_buffer_t * b0;
314           u32 next0;
315           ip4_vxlan_gpe_and_nsh_header_t * iuvn0;
316           uword * p0;
317           u32 tunnel_index0;
318           nsh_vxlan_gpe_tunnel_t * t0;
319           nsh_vxlan_gpe_tunnel_key_t key0;
320           u32 error0;
321
322           bi0 = from[0];
323           to_next[0] = bi0;
324           from += 1;
325           to_next += 1;
326           n_left_from -= 1;
327           n_left_to_next -= 1;
328
329           b0 = vlib_get_buffer (vm, bi0);
330
331           /* udp leaves current_data pointing at the vxlan header */
332           vlib_buffer_advance 
333             (b0, -(word)(sizeof(udp_header_t)+sizeof(ip4_header_t)));
334
335           iuvn0 = vlib_buffer_get_current (b0);
336
337           /* pop (ip, udp, vxlan, nsh) */
338           vlib_buffer_advance (b0, sizeof (*iuvn0));
339
340           tunnel_index0 = ~0;
341           error0 = 0;
342           next0 = NSH_VXLAN_GPE_INPUT_NEXT_DROP;
343
344           key0.src = iuvn0->ip4.src_address.as_u32;
345           key0.vni = iuvn0->vxlan.vni_res;
346           key0.spi_si = iuvn0->nsh.spi_si;
347           key0.pad = 0;
348
349           if (PREDICT_FALSE ((key0.as_u64[0] != last_key.as_u64[0])
350                              || (key0.as_u64[1] != last_key.as_u64[1])))
351             {
352               p0 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &key0);
353           
354               if (p0 == 0)
355                 {
356                   error0 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
357                   goto trace00;
358                 }
359
360               last_key.as_u64[0] = key0.as_u64[0];
361               last_key.as_u64[1] = key0.as_u64[1];
362               tunnel_index0 = last_tunnel_index = p0[0];
363             }
364           else
365             tunnel_index0 = last_tunnel_index;
366
367           t0 = pool_elt_at_index (ngm->tunnels, tunnel_index0);
368
369           next0 = t0->decap_next_index;
370
371           /* Required to make the l2 tag push / pop code work on l2 subifs */
372           vnet_update_l2_len (b0);
373
374           if (next0 == NSH_VXLAN_GPE_INPUT_NEXT_NSH_VXLAN_GPE_ENCAP)
375             {
376               /* 
377                * Functioning as SFF (ie "half NSH tunnel mode")
378                * If ingress (we are in decap.c) with NSH header, and 'decap next nsh-vxlan-gpe' then "NSH switch"
379                * 1. Take DST, remap to SRC, remap other keys in place
380                * 2. Look up new t0 as per above
381                * 3. Set sw_if_index[VLIB_TX] to be t0->sw_if_index
382                */
383               uword * next_p0;
384               nsh_vxlan_gpe_tunnel_t  * next_t0;
385               nsh_vxlan_gpe_tunnel_key_t next_key0;
386
387               next_key0.src = iuvn0->ip4.dst_address.as_u32;
388               next_key0.vni = iuvn0->vxlan.vni_res;
389               next_key0.spi_si = iuvn0->nsh.spi_si;
390               next_key0.pad = 0;
391
392               next_p0 = hash_get_mem (ngm->nsh_vxlan_gpe_tunnel_by_key, &next_key0);
393
394               if (next_p0 == 0)
395                 {
396                   error0 = NSH_VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
397                   goto trace00;
398                 }
399               next_t0 = pool_elt_at_index (ngm->tunnels, next_p0[0]);
400               vnet_buffer(b0)->sw_if_index[VLIB_TX] = next_t0->sw_if_index;
401               
402             } 
403           else 
404             {
405               /* 
406                * ip[46] lookup in the configured FIB
407                * nsh-vxlan-gpe-encap, here's the encap tunnel sw_if_index
408                */
409               vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
410             }
411
412           pkts_decapsulated ++;
413
414         trace00:
415           b0->error = error0 ? node->errors[error0] : 0;
416
417           if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) 
418             {
419               nsh_vxlan_gpe_rx_trace_t *tr 
420                 = vlib_add_trace (vm, node, b0, sizeof (*tr));
421               tr->next_index = next0;
422               tr->error = error0;
423               tr->tunnel_index = tunnel_index0;
424               tr->h = iuvn0->nsh;
425             }
426           vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
427                                            to_next, n_left_to_next,
428                                            bi0, next0);
429         }
430
431       vlib_put_next_frame (vm, node, next_index, n_left_to_next);
432     }
433   vlib_node_increment_counter (vm, nsh_vxlan_gpe_input_node.index,
434                                NSH_VXLAN_GPE_ERROR_DECAPSULATED, 
435                                pkts_decapsulated);
436   return from_frame->n_vectors;
437 }
438
/* Error/counter strings handed to the node registration.  The table is
 * generated by re-including nsh_vxlan_gpe_error.def with the
 * nsh_vxlan_gpe_error(n,s) X-macro defined to emit only the string s.
 * NOTE(review): presumably the NSH_VXLAN_GPE_ERROR_* codes are generated
 * from the same .def so indices line up -- confirm against the header. */
static char * nsh_vxlan_gpe_error_strings[] = {
#define nsh_vxlan_gpe_error(n,s) s,
#include <vnet/nsh-vxlan-gpe/nsh_vxlan_gpe_error.def>
#undef nsh_vxlan_gpe_error
/* NOTE(review): this block never defines `_`; the #undef below looks like
 * a leftover -- confirm before removing. */
#undef _
};
445
/* Graph-node registration for "nsh-vxlan-gpe-input": binds the dispatch
 * function, the error strings, the next-node table and the trace/buffer
 * formatters defined or declared in this file. */
VLIB_REGISTER_NODE (nsh_vxlan_gpe_input_node) = {
  .function = nsh_vxlan_gpe_input,
  .name = "nsh-vxlan-gpe-input",
  /* Takes a vector of packets. */
  .vector_size = sizeof (u32),

  .n_errors = NSH_VXLAN_GPE_N_ERROR,
  .error_strings = nsh_vxlan_gpe_error_strings,

  .n_next_nodes = NSH_VXLAN_GPE_INPUT_N_NEXT,
  /* Each (s,n) pair of foreach_nsh_vxlan_gpe_input_next becomes a
     designated initializer: slot NSH_VXLAN_GPE_INPUT_NEXT_<s> = n. */
  .next_nodes = {
#define _(s,n) [NSH_VXLAN_GPE_INPUT_NEXT_##s] = n,
    foreach_nsh_vxlan_gpe_input_next
#undef _
  },

  .format_buffer = format_nsh_header_with_length,
  .format_trace = format_nsh_vxlan_gpe_rx_trace,
  // $$$$ .unformat_buffer = unformat_nsh_vxlan_gpe_header,
};