2 * decap.c - decapsulate VXLAN GPE
4 * Copyright (c) 2013 Cisco and/or its affiliates.
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
9 * http://www.apache.org/licenses/LICENSE-2.0
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
19 * @brief Functions for decapsulating VXLAN GPE tunnels
23 #include <vlib/vlib.h>
24 #include <vnet/pg/pg.h>
25 #include <vnet/vxlan-gpe/vxlan_gpe.h>
/* Node registration object whose .index vxlan_gpe_input passes to
   vlib_node_increment_counter when reporting VXLAN_GPE_ERROR_DECAPSULATED. */
27 vlib_node_registration_t vxlan_gpe_input_node;
30 * @brief Struct for VXLAN GPE decap packet tracing
/* Members used elsewhere in this file: vxlan_gpe_input stores next_index and
   tunnel_index; format_vxlan_gpe_rx_trace prints tunnel_index, next_index
   and error. */
37 } vxlan_gpe_rx_trace_t;
40 * @brief Tracing function for VXLAN GPE packet decapsulation
/*
 * Format one vxlan_gpe_rx_trace_t record, appending to s via format().
 * args supplies, in order, a vlib_main_t *, a vlib_node_t * (both read but
 * unused) and the vxlan_gpe_rx_trace_t * to print.
 * Registered as .format_trace for the vxlan4/vxlan6 GPE input nodes.
 */
48 static u8 * format_vxlan_gpe_rx_trace (u8 * s, va_list * args)
50 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
51 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
52 vxlan_gpe_rx_trace_t * t = va_arg (*args, vxlan_gpe_rx_trace_t *);
/* tunnel_index == ~0 presumably marks a record without a matched tunnel
   (see the "no tunnel" message below). */
54 if (t->tunnel_index != ~0)
56 s = format (s, "VXLAN-GPE: tunnel %d next %d error %d", t->tunnel_index,
57 t->next_index, t->error);
/* NOTE(review): this message ends with a newline while the tunnel message
   above does not -- confirm the difference is intended. */
61 s = format (s, "VXLAN-GPE: no tunnel next %d error %d\n", t->next_index,
68 * @brief Buffer formatting function for VXLAN GPE packets, including length
/*
 * Formatter registered as .format_buffer for both VXLAN GPE input nodes.
 * It pulls the vlib_main_t * and vlib_node_t * arguments off args and marks
 * both as unused.
 */
76 static u8 * format_vxlan_gpe_with_length (u8 * s, va_list * args)
78 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
79 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
86 * @brief Common processing for IPv4 and IPv6 VXLAN GPE decap dispatch functions
88 * It is worth noting that other than trivial UDP forwarding (transit), VXLAN GPE
89 * tunnels are "terminate local". This means that there is no "TX" interface for this
90 * decap case, so that field in the buffer_metadata can be "used for something else".
91 * The something else in this case is, for the IPv4/IPv6 inner-packet type case, the
92 * FIB index used to look up the inner-packet's adjacency.
94 * vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
101 * @return from_frame->n_vectors
/*
 * Common decapsulation worker behind vxlan4_gpe_input and vxlan6_gpe_input,
 * which call it with is_ip4 set to 1 and 0 respectively.
 *
 * For every buffer in from_frame it steps back to the outer IP header, pops
 * the outer IP/UDP/VXLAN GPE headers, builds a tunnel key from the outer
 * destination/source addresses and the VNI, resolves the tunnel through the
 * per-family hash (with a one-entry cache of the last key), stores the
 * tunnel's decap_fib_index in sw_if_index[VLIB_TX], and enqueues the buffer.
 * RX interface counters are accumulated per sw_if_index and flushed in
 * batches. Returns from_frame->n_vectors.
 */
105 vxlan_gpe_input (vlib_main_t * vm,
106 vlib_node_runtime_t * node,
107 vlib_frame_t * from_frame,
110 u32 n_left_from, next_index, *from, *to_next;
111 vxlan_gpe_main_t * ngm = &vxlan_gpe_main;
112 vnet_main_t * vnm = ngm->vnet_main;
113 vnet_interface_main_t * im = &vnm->interface_main;
/* One-entry lookup cache: the last matched key for each address family and
   the tunnel index it resolved to. */
114 u32 last_tunnel_index = ~0;
115 vxlan4_gpe_tunnel_key_t last_key4;
116 vxlan6_gpe_tunnel_key_t last_key6;
117 u32 pkts_decapsulated = 0;
118 u32 cpu_index = os_get_cpu_number ();
/* Interface-counter batch: interface being accumulated and its running
   packet/byte totals. */
119 u32 stats_sw_if_index, stats_n_packets, stats_n_bytes;
/* Start with all-0xff cached keys. */
122 memset (&last_key4, 0xff, sizeof(last_key4));
124 memset (&last_key6, 0xff, sizeof(last_key6));
126 from = vlib_frame_vector_args (from_frame);
127 n_left_from = from_frame->n_vectors;
129 next_index = node->cached_next_index;
/* Continue the counter batch for the sw_if_index that the previous call
   saved in runtime_data[0] (written back at the end of this function). */
130 stats_sw_if_index = node->runtime_data[0];
131 stats_n_packets = stats_n_bytes = 0;
133 while (n_left_from > 0)
137 vlib_get_next_frame(vm, node, next_index, to_next, n_left_to_next);
/* Dual-packet loop: two buffers are handled per pass while from[2] and
   from[3] are prefetched, hence the n_left_from >= 4 bound. */
139 while (n_left_from >= 4 && n_left_to_next >= 2)
142 vlib_buffer_t * b0, *b1;
144 ip4_vxlan_gpe_header_t * iuvn4_0, *iuvn4_1;
145 ip6_vxlan_gpe_header_t * iuvn6_0, *iuvn6_1;
147 u32 tunnel_index0, tunnel_index1;
148 vxlan_gpe_tunnel_t * t0, *t1;
149 vxlan4_gpe_tunnel_key_t key4_0, key4_1;
150 vxlan6_gpe_tunnel_key_t key6_0, key6_1;
152 u32 sw_if_index0, sw_if_index1, len0, len1;
154 /* Prefetch next iteration. */
156 vlib_buffer_t * p2, *p3;
158 p2 = vlib_get_buffer (vm, from[2]);
159 p3 = vlib_get_buffer (vm, from[3]);
161 vlib_prefetch_buffer_header(p2, LOAD);
162 vlib_prefetch_buffer_header(p3, LOAD);
164 CLIB_PREFETCH(p2->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
165 CLIB_PREFETCH(p3->data, 2*CLIB_CACHE_LINE_BYTES, LOAD);
177 b0 = vlib_get_buffer (vm, bi0);
178 b1 = vlib_get_buffer (vm, bi1);
/* IPv4 outer header: step back over UDP + IPv4 so the combined
   ip4/udp/vxlan-gpe header can be read, then skip past all of it. */
182 /* udp leaves current_data pointing at the vxlan-gpe header */
183 vlib_buffer_advance (b0, -(word) (sizeof(udp_header_t) + sizeof(ip4_header_t)));
184 vlib_buffer_advance (b1, -(word) (sizeof(udp_header_t) + sizeof(ip4_header_t)));
186 iuvn4_0 = vlib_buffer_get_current (b0);
187 iuvn4_1 = vlib_buffer_get_current (b1);
189 /* pop (ip, udp, vxlan) */
190 vlib_buffer_advance (b0, sizeof(*iuvn4_0));
191 vlib_buffer_advance (b1, sizeof(*iuvn4_1));
/* IPv6 outer header: same rewind-and-pop using the IPv6 header sizes. */
195 /* udp leaves current_data pointing at the vxlan-gpe header */
196 vlib_buffer_advance (b0, -(word) (sizeof(udp_header_t) + sizeof(ip6_header_t)));
197 vlib_buffer_advance (b1, -(word) (sizeof(udp_header_t) + sizeof(ip6_header_t)));
199 iuvn6_0 = vlib_buffer_get_current (b0);
200 iuvn6_1 = vlib_buffer_get_current (b1);
202 /* pop (ip, udp, vxlan) */
203 vlib_buffer_advance (b0, sizeof(*iuvn6_0));
204 vlib_buffer_advance (b1, sizeof(*iuvn6_1));
/* IPv4: use the GPE protocol field as the next index when it is below
   n_next_nodes, otherwise drop; then fill the lookup keys
   (local = outer destination, remote = outer source, vni). */
214 next0 = (iuvn4_0->vxlan.protocol < node->n_next_nodes) ?
215 iuvn4_0->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
216 next1 = (iuvn4_1->vxlan.protocol < node->n_next_nodes) ?
217 iuvn4_1->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
219 key4_0.local = iuvn4_0->ip4.dst_address.as_u32;
220 key4_1.local = iuvn4_1->ip4.dst_address.as_u32;
222 key4_0.remote = iuvn4_0->ip4.src_address.as_u32;
223 key4_1.remote = iuvn4_1->ip4.src_address.as_u32;
225 key4_0.vni = iuvn4_0->vxlan.vni_res;
226 key4_1.vni = iuvn4_1->vxlan.vni_res;
/* IPv6: same next-index selection and key construction, copying the
   128-bit addresses as two u64 halves. */
233 next0 = (iuvn6_0->vxlan.protocol < node->n_next_nodes) ?
234 iuvn6_0->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
235 next1 = (iuvn6_1->vxlan.protocol < node->n_next_nodes) ?
236 iuvn6_1->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
238 key6_0.local.as_u64[0] = iuvn6_0->ip6.dst_address.as_u64[0];
239 key6_0.local.as_u64[1] = iuvn6_0->ip6.dst_address.as_u64[1];
240 key6_1.local.as_u64[0] = iuvn6_1->ip6.dst_address.as_u64[0];
241 key6_1.local.as_u64[1] = iuvn6_1->ip6.dst_address.as_u64[1];
243 key6_0.remote.as_u64[0] = iuvn6_0->ip6.src_address.as_u64[0];
244 key6_0.remote.as_u64[1] = iuvn6_0->ip6.src_address.as_u64[1];
245 key6_1.remote.as_u64[0] = iuvn6_1->ip6.src_address.as_u64[0];
246 key6_1.remote.as_u64[1] = iuvn6_1->ip6.src_address.as_u64[1];
248 key6_0.vni = iuvn6_0->vxlan.vni_res;
249 key6_1.vni = iuvn6_1->vxlan.vni_res;
252 /* Processing packet 0*/
255 /* Processing for key4_0 */
/* Only consult the hash when the key differs from the cached one. */
256 if (PREDICT_FALSE((key4_0.as_u64[0] != last_key4.as_u64[0])
257 || (key4_0.as_u64[1] != last_key4.as_u64[1])))
259 p0 = hash_get_mem(ngm->vxlan4_gpe_tunnel_by_key, &key4_0);
263 error0 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
/* Remember this key and the tunnel index the hash returned for it. */
267 last_key4.as_u64[0] = key4_0.as_u64[0];
268 last_key4.as_u64[1] = key4_0.as_u64[1];
269 tunnel_index0 = last_tunnel_index = p0[0];
/* Reuse the cached tunnel index. */
272 tunnel_index0 = last_tunnel_index;
276 /* Processing for key6_0 */
277 if (PREDICT_FALSE(memcmp (&key6_0, &last_key6, sizeof(last_key6)) != 0))
279 p0 = hash_get_mem(ngm->vxlan6_gpe_tunnel_by_key, &key6_0);
283 error0 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
287 memcpy (&last_key6, &key6_0, sizeof(key6_0));
288 tunnel_index0 = last_tunnel_index = p0[0];
291 tunnel_index0 = last_tunnel_index;
294 t0 = pool_elt_at_index(ngm->tunnels, tunnel_index0);
/* NOTE(review): next0 was already derived from the header protocol field
   above and is assigned again here from the tunnel -- confirm which value
   is meant to win. */
296 next0 = t0->protocol;
298 sw_if_index0 = t0->sw_if_index;
299 len0 = vlib_buffer_length_in_chain (vm, b0);
301 /* Required to make the l2 tag push / pop code work on l2 subifs */
302 vnet_update_l2_len (b0);
305 * ip[46] lookup in the configured FIB
307 vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
/* Counter batching: count the packet into the current batch first; if it
   belongs to a different interface, take it back out, flush the batch to
   the old interface's combined RX counter, and start a new batch for
   sw_if_index0 with this packet's length. */
310 stats_n_packets += 1;
311 stats_n_bytes += len0;
313 if (PREDICT_FALSE(sw_if_index0 != stats_sw_if_index))
315 stats_n_packets -= 1;
316 stats_n_bytes -= len0;
318 vlib_increment_combined_counter (
319 im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX,
320 cpu_index, stats_sw_if_index, stats_n_packets, stats_n_bytes);
322 stats_n_bytes = len0;
323 stats_sw_if_index = sw_if_index0;
/* Set the buffer error to node->errors[error0], or to 0 when error0 is 0. */
326 trace0: b0->error = error0 ? node->errors[error0] : 0;
/* Record a trace entry only for buffers flagged as traced. */
328 if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED))
330 vxlan_gpe_rx_trace_t *tr = vlib_add_trace (vm, node, b0, sizeof(*tr));
331 tr->next_index = next0;
333 tr->tunnel_index = tunnel_index0;
336 /* Process packet 1 */
339 /* Processing for key4_1 */
341 (key4_1.as_u64[0] != last_key4.as_u64[0])
342 || (key4_1.as_u64[1] != last_key4.as_u64[1])))
344 p1 = hash_get_mem(ngm->vxlan4_gpe_tunnel_by_key, &key4_1);
348 error1 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
352 last_key4.as_u64[0] = key4_1.as_u64[0];
353 last_key4.as_u64[1] = key4_1.as_u64[1];
354 tunnel_index1 = last_tunnel_index = p1[0];
357 tunnel_index1 = last_tunnel_index;
361 /* Processing for key6_1 */
362 if (PREDICT_FALSE(memcmp (&key6_1, &last_key6, sizeof(last_key6)) != 0))
364 p1 = hash_get_mem(ngm->vxlan6_gpe_tunnel_by_key, &key6_1);
368 error1 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
372 memcpy (&last_key6, &key6_1, sizeof(key6_1));
373 tunnel_index1 = last_tunnel_index = p1[0];
376 tunnel_index1 = last_tunnel_index;
379 t1 = pool_elt_at_index(ngm->tunnels, tunnel_index1);
/* NOTE(review): as for packet 0, next1 is assigned a second time here. */
381 next1 = t1->protocol;
382 sw_if_index1 = t1->sw_if_index;
383 len1 = vlib_buffer_length_in_chain (vm, b1);
385 /* Required to make the l2 tag push / pop code work on l2 subifs */
386 vnet_update_l2_len (b1);
389 * ip[46] lookup in the configured FIB
391 vnet_buffer(b1)->sw_if_index[VLIB_TX] = t1->decap_fib_index;
394 stats_n_packets += 1;
395 stats_n_bytes += len1;
397 /* Batch stats increment on the same vxlan tunnel so counter
398 is not incremented per packet */
399 if (PREDICT_FALSE(sw_if_index1 != stats_sw_if_index))
401 stats_n_packets -= 1;
402 stats_n_bytes -= len1;
404 vlib_increment_combined_counter (
405 im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX,
406 cpu_index, stats_sw_if_index, stats_n_packets, stats_n_bytes);
408 stats_n_bytes = len1;
409 stats_sw_if_index = sw_if_index1;
/* NOTE(review): repeats the sw_if_index[VLIB_TX] store already made for b1
   above; looks redundant -- confirm before removing. */
411 vnet_buffer(b1)->sw_if_index[VLIB_TX] = t1->decap_fib_index;
413 trace1: b1->error = error1 ? node->errors[error1] : 0;
415 if (PREDICT_FALSE(b1->flags & VLIB_BUFFER_IS_TRACED))
417 vxlan_gpe_rx_trace_t *tr = vlib_add_trace (vm, node, b1, sizeof(*tr));
418 tr->next_index = next1;
420 tr->tunnel_index = tunnel_index1;
/* Enqueue both buffers towards next0 and next1. */
423 vlib_validate_buffer_enqueue_x2(vm, node, next_index, to_next,
424 n_left_to_next, bi0, bi1, next0, next1);
/* Single-packet loop: same steps as above for the buffers the dual loop
   did not consume. */
427 while (n_left_from > 0 && n_left_to_next > 0)
432 ip4_vxlan_gpe_header_t * iuvn4_0;
433 ip6_vxlan_gpe_header_t * iuvn6_0;
436 vxlan_gpe_tunnel_t * t0;
437 vxlan4_gpe_tunnel_key_t key4_0;
438 vxlan6_gpe_tunnel_key_t key6_0;
440 u32 sw_if_index0, len0;
449 b0 = vlib_get_buffer (vm, bi0);
453 /* udp leaves current_data pointing at the vxlan-gpe header */
454 vlib_buffer_advance (
455 b0, -(word) (sizeof(udp_header_t) + sizeof(ip4_header_t)));
457 iuvn4_0 = vlib_buffer_get_current (b0);
459 /* pop (ip, udp, vxlan) */
460 vlib_buffer_advance (b0, sizeof(*iuvn4_0));
464 /* udp leaves current_data pointing at the vxlan-gpe header */
465 vlib_buffer_advance (
466 b0, -(word) (sizeof(udp_header_t) + sizeof(ip6_header_t)));
468 iuvn6_0 = vlib_buffer_get_current (b0);
470 /* pop (ip, udp, vxlan) */
471 vlib_buffer_advance (b0, sizeof(*iuvn6_0));
480 (iuvn4_0->vxlan.protocol < node->n_next_nodes) ?
481 iuvn4_0->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
483 key4_0.local = iuvn4_0->ip4.dst_address.as_u32;
484 key4_0.remote = iuvn4_0->ip4.src_address.as_u32;
485 key4_0.vni = iuvn4_0->vxlan.vni_res;
488 /* Processing for key4_0 */
490 (key4_0.as_u64[0] != last_key4.as_u64[0])
491 || (key4_0.as_u64[1] != last_key4.as_u64[1])))
493 p0 = hash_get_mem(ngm->vxlan4_gpe_tunnel_by_key, &key4_0);
497 error0 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
501 last_key4.as_u64[0] = key4_0.as_u64[0];
502 last_key4.as_u64[1] = key4_0.as_u64[1];
503 tunnel_index0 = last_tunnel_index = p0[0];
506 tunnel_index0 = last_tunnel_index;
510 next0 = (iuvn6_0->vxlan.protocol < node->n_next_nodes) ?
511 iuvn6_0->vxlan.protocol : VXLAN_GPE_INPUT_NEXT_DROP;
513 key6_0.local.as_u64[0] = iuvn6_0->ip6.dst_address.as_u64[0];
514 key6_0.local.as_u64[1] = iuvn6_0->ip6.dst_address.as_u64[1];
515 key6_0.remote.as_u64[0] = iuvn6_0->ip6.src_address.as_u64[0];
516 key6_0.remote.as_u64[1] = iuvn6_0->ip6.src_address.as_u64[1];
517 key6_0.vni = iuvn6_0->vxlan.vni_res;
519 /* Processing for key6_0 */
520 if (PREDICT_FALSE(memcmp (&key6_0, &last_key6, sizeof(last_key6)) != 0))
522 p0 = hash_get_mem(ngm->vxlan6_gpe_tunnel_by_key, &key6_0);
526 error0 = VXLAN_GPE_ERROR_NO_SUCH_TUNNEL;
530 memcpy (&last_key6, &key6_0, sizeof(key6_0));
531 tunnel_index0 = last_tunnel_index = p0[0];
534 tunnel_index0 = last_tunnel_index;
537 t0 = pool_elt_at_index(ngm->tunnels, tunnel_index0);
/* NOTE(review): second assignment to next0, as in the dual loop. */
539 next0 = t0->protocol;
541 sw_if_index0 = t0->sw_if_index;
542 len0 = vlib_buffer_length_in_chain (vm, b0);
544 /* Required to make the l2 tag push / pop code work on l2 subifs */
545 vnet_update_l2_len (b0);
548 * ip[46] lookup in the configured FIB
550 vnet_buffer(b0)->sw_if_index[VLIB_TX] = t0->decap_fib_index;
553 stats_n_packets += 1;
554 stats_n_bytes += len0;
556 /* Batch stats increment on the same vxlan-gpe tunnel so counter
557 is not incremented per packet */
558 if (PREDICT_FALSE(sw_if_index0 != stats_sw_if_index))
560 stats_n_packets -= 1;
561 stats_n_bytes -= len0;
563 vlib_increment_combined_counter (
564 im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX,
565 cpu_index, stats_sw_if_index, stats_n_packets, stats_n_bytes);
567 stats_n_bytes = len0;
568 stats_sw_if_index = sw_if_index0;
571 trace00: b0->error = error0 ? node->errors[error0] : 0;
573 if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED))
575 vxlan_gpe_rx_trace_t *tr = vlib_add_trace (vm, node, b0, sizeof(*tr));
576 tr->next_index = next0;
578 tr->tunnel_index = tunnel_index0;
580 vlib_validate_buffer_enqueue_x1(vm, node, next_index, to_next,
581 n_left_to_next, bi0, next0);
/* Hand the current next frame back together with n_left_to_next. */
584 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
/* NOTE(review): the decapsulated count is charged to vxlan_gpe_input_node,
   while the nodes registered in this file are vxlan4_gpe_input_node and
   vxlan6_gpe_input_node -- confirm this is the intended node index. */
586 vlib_node_increment_counter (vm, vxlan_gpe_input_node.index,
587 VXLAN_GPE_ERROR_DECAPSULATED, pkts_decapsulated);
588 /* Increment any remaining batch stats */
591 vlib_increment_combined_counter (
592 im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, cpu_index,
593 stats_sw_if_index, stats_n_packets, stats_n_bytes);
/* Save the batch interface so the next call can resume from it (it is read
   back from runtime_data[0] at entry). */
594 node->runtime_data[0] = stats_sw_if_index;
596 return from_frame->n_vectors;
600 * @brief Graph processing dispatch function for IPv4 VXLAN GPE
602 * @node vxlan4-gpe-input
607 * @return from_frame->n_vectors
/* Node function for "vxlan4-gpe-input": forwards vm, node and from_frame to
   vxlan_gpe_input with is_ip4 = 1 and returns its result. */
611 vxlan4_gpe_input (vlib_main_t * vm, vlib_node_runtime_t * node,
612 vlib_frame_t * from_frame)
614 return vxlan_gpe_input (vm, node, from_frame, /* is_ip4 */1);
618 * @brief Graph processing dispatch function for IPv6 VXLAN GPE
620 * @node vxlan6-gpe-input
625 * @return from_frame->n_vectors - uword
/* Node function for "vxlan6-gpe-input": forwards vm, node and from_frame to
   vxlan_gpe_input with is_ip4 = 0 and returns its result. */
629 vxlan6_gpe_input (vlib_main_t * vm, vlib_node_runtime_t * node,
630 vlib_frame_t * from_frame)
632 return vxlan_gpe_input (vm, node, from_frame, /* is_ip4 */0);
636 * @brief VXLAN GPE error strings
/* Error-string table used as .error_strings by both input nodes. Each
   vxlan_gpe_error(n,s) entry in vxlan_gpe_error.def expands to just its
   string s, so the table holds one string per entry in that file. */
638 static char * vxlan_gpe_error_strings[] = {
639 #define vxlan_gpe_error(n,s) s,
640 #include <vnet/vxlan-gpe/vxlan_gpe_error.def>
641 #undef vxlan_gpe_error
/* Registration of the IPv4 VXLAN GPE decap node ("vxlan4-gpe-input"), an
   internal node whose function is vxlan4_gpe_input. */
645 VLIB_REGISTER_NODE (vxlan4_gpe_input_node) = {
646 .function = vxlan4_gpe_input,
647 .name = "vxlan4-gpe-input",
648 /* Takes a vector of packets. */
649 .vector_size = sizeof (u32),
650 .type = VLIB_NODE_TYPE_INTERNAL,
/* Error counters are sized from, and named by, vxlan_gpe_error_strings. */
651 .n_errors = ARRAY_LEN(vxlan_gpe_error_strings),
652 .error_strings = vxlan_gpe_error_strings,
654 .n_next_nodes = VXLAN_GPE_INPUT_N_NEXT,
/* Each (s,n) pair listed by foreach_vxlan_gpe_input_next becomes the
   designated initializer [VXLAN_GPE_INPUT_NEXT_s] = n. */
656 #define _(s,n) [VXLAN_GPE_INPUT_NEXT_##s] = n,
657 foreach_vxlan_gpe_input_next
661 .format_buffer = format_vxlan_gpe_with_length,
662 .format_trace = format_vxlan_gpe_rx_trace,
663 // $$$$ .unformat_buffer = unformat_vxlan_gpe_header,
/* NOTE(review): presumably sets up per-CPU-architecture variants of the node
   function -- confirm against the macro definition. */
666 VLIB_NODE_FUNCTION_MULTIARCH (vxlan4_gpe_input_node, vxlan4_gpe_input);
/* Registration of the IPv6 VXLAN GPE decap node ("vxlan6-gpe-input"), an
   internal node whose function is vxlan6_gpe_input. It uses the same error
   strings, next-node list and formatters as the IPv4 node. */
668 VLIB_REGISTER_NODE (vxlan6_gpe_input_node) = {
669 .function = vxlan6_gpe_input,
670 .name = "vxlan6-gpe-input",
671 /* Takes a vector of packets. */
672 .vector_size = sizeof (u32),
673 .type = VLIB_NODE_TYPE_INTERNAL,
674 .n_errors = ARRAY_LEN(vxlan_gpe_error_strings),
675 .error_strings = vxlan_gpe_error_strings,
677 .n_next_nodes = VXLAN_GPE_INPUT_N_NEXT,
/* Each (s,n) pair listed by foreach_vxlan_gpe_input_next becomes the
   designated initializer [VXLAN_GPE_INPUT_NEXT_s] = n. */
679 #define _(s,n) [VXLAN_GPE_INPUT_NEXT_##s] = n,
680 foreach_vxlan_gpe_input_next
684 .format_buffer = format_vxlan_gpe_with_length,
685 .format_trace = format_vxlan_gpe_rx_trace,
686 // $$$$ .unformat_buffer = unformat_vxlan_gpe_header,
/* NOTE(review): presumably sets up per-CPU-architecture variants of the node
   function -- confirm against the macro definition. */
689 VLIB_NODE_FUNCTION_MULTIARCH (vxlan6_gpe_input_node, vxlan6_gpe_input);