2 * gre_interface.c: gre interfaces
4 * Copyright (c) 2012 Cisco and/or its affiliates.
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
9 * http://www.apache.org/licenses/LICENSE-2.0
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
18 #include <vnet/vnet.h>
19 #include <vnet/pg/pg.h>
20 #include <vnet/gre/gre.h>
21 #include <vnet/ip/format.h>
22 #include <vnet/fib/ip4_fib.h>
23 #include <vnet/fib/ip6_fib.h>
24 #include <vnet/adj/adj_midchain.h>
25 #include <vnet/adj/adj_nbr.h>
26 #include <vnet/mpls/mpls.h>
28 static const char *gre_tunnel_type_names[] = GRE_TUNNEL_TYPE_NAMES;
31 format_gre_tunnel (u8 * s, va_list * args)
33 gre_tunnel_t *t = va_arg (*args, gre_tunnel_t *);
35 s = format (s, "[%d] instance %d src %U dst %U fib-idx %d sw-if-idx %d ",
36 t->dev_instance, t->user_instance,
37 format_ip46_address, &t->tunnel_src, IP46_TYPE_ANY,
38 format_ip46_address, &t->tunnel_dst.fp_addr, IP46_TYPE_ANY,
39 t->outer_fib_index, t->sw_if_index);
41 s = format (s, "payload %s ", gre_tunnel_type_names[t->type]);
43 if (t->type == GRE_TUNNEL_TYPE_ERSPAN)
44 s = format (s, "session %d ", t->session_id);
46 if (t->type != GRE_TUNNEL_TYPE_L3)
47 s = format (s, "l2-adj-idx %d ", t->l2_adj_index);
53 gre_tunnel_db_find (const vnet_gre_add_del_tunnel_args_t * a,
54 u32 outer_fib_index, gre_tunnel_key_t * key)
56 gre_main_t *gm = &gre_main;
61 gre_mk_key4 (a->src.ip4, a->dst.ip4, outer_fib_index,
62 a->tunnel_type, a->session_id, &key->gtk_v4);
63 p = hash_get_mem (gm->tunnel_by_key4, &key->gtk_v4);
67 gre_mk_key6 (&a->src.ip6, &a->dst.ip6, outer_fib_index,
68 a->tunnel_type, a->session_id, &key->gtk_v6);
69 p = hash_get_mem (gm->tunnel_by_key6, &key->gtk_v6);
75 return (pool_elt_at_index (gm->tunnels, p[0]));
79 gre_tunnel_db_add (gre_tunnel_t * t, gre_tunnel_key_t * key)
81 gre_main_t *gm = &gre_main;
83 t->key = clib_mem_alloc (sizeof (*t->key));
84 clib_memcpy (t->key, key, sizeof (*key));
86 if (t->tunnel_dst.fp_proto == FIB_PROTOCOL_IP6)
88 hash_set_mem (gm->tunnel_by_key6, &t->key->gtk_v6, t->dev_instance);
92 hash_set_mem (gm->tunnel_by_key4, &t->key->gtk_v4, t->dev_instance);
97 gre_tunnel_db_remove (gre_tunnel_t * t)
99 gre_main_t *gm = &gre_main;
101 if (t->tunnel_dst.fp_proto == FIB_PROTOCOL_IP6)
103 hash_unset_mem (gm->tunnel_by_key6, &t->key->gtk_v6);
107 hash_unset_mem (gm->tunnel_by_key4, &t->key->gtk_v4);
110 clib_mem_free (t->key);
114 static gre_tunnel_t *
115 gre_tunnel_from_fib_node (fib_node_t * node)
117 ASSERT (FIB_NODE_TYPE_GRE_TUNNEL == node->fn_type);
118 return ((gre_tunnel_t *) (((char *) node) -
119 STRUCT_OFFSET_OF (gre_tunnel_t, node)));
125 * 'stack' (resolve the recursion for) the tunnel's midchain adjacency
128 gre_tunnel_stack (adj_index_t ai)
130 gre_main_t *gm = &gre_main;
136 sw_if_index = adj->rewrite_header.sw_if_index;
138 if ((vec_len (gm->tunnel_index_by_sw_if_index) < sw_if_index) ||
139 (~0 == gm->tunnel_index_by_sw_if_index[sw_if_index]))
142 gt = pool_elt_at_index (gm->tunnels,
143 gm->tunnel_index_by_sw_if_index[sw_if_index]);
145 if ((vnet_hw_interface_get_flags (vnet_get_main (), gt->hw_if_index) &
146 VNET_HW_INTERFACE_FLAG_LINK_UP) == 0)
148 adj_nbr_midchain_unstack (ai);
152 dpo_id_t tmp = DPO_INVALID;
153 fib_forward_chain_type_t fib_fwd = (FIB_PROTOCOL_IP6 == adj->ia_nh_proto) ?
154 FIB_FORW_CHAIN_TYPE_UNICAST_IP6 : FIB_FORW_CHAIN_TYPE_UNICAST_IP4;
156 fib_entry_contribute_forwarding (gt->fib_entry_index, fib_fwd, &tmp);
157 if (DPO_LOAD_BALANCE == tmp.dpoi_type)
160 * post GRE rewrite we will load-balance. However, the GRE encap
161 * is always the same for this adjacency/tunnel and hence the IP/GRE
162 * src,dst hash is always the same result too. So we do that hash now and
163 * stack on the choice.
164 * If the choice is an incomplete adj then we will need a poke when
165 * it becomes complete. This happens since the adj update walk propagates
166 * as far a recursive paths.
168 const dpo_id_t *choice;
172 lb = load_balance_get (tmp.dpoi_index);
174 if (fib_fwd == FIB_FORW_CHAIN_TYPE_UNICAST_IP4)
175 hash = ip4_compute_flow_hash ((ip4_header_t *) adj_get_rewrite (ai),
178 hash = ip6_compute_flow_hash ((ip6_header_t *) adj_get_rewrite (ai),
181 load_balance_get_bucket_i (lb, hash & lb->lb_n_buckets_minus_1);
182 dpo_copy (&tmp, choice);
185 adj_nbr_midchain_stack (ai, &tmp);
190 * @brief Call back when restacking all adjacencies on a GRE interface
193 gre_adj_walk_cb (adj_index_t ai, void *ctx)
195 gre_tunnel_stack (ai);
197 return (ADJ_WALK_RC_CONTINUE);
201 gre_tunnel_restack (gre_tunnel_t * gt)
203 fib_protocol_t proto;
206 * walk all the adjacencies on th GRE interface and restack them
208 FOR_EACH_FIB_IP_PROTOCOL (proto)
210 adj_nbr_walk (gt->sw_if_index, proto, gre_adj_walk_cb, NULL);
215 * Function definition to backwalk a FIB node
217 static fib_node_back_walk_rc_t
218 gre_tunnel_back_walk (fib_node_t * node, fib_node_back_walk_ctx_t * ctx)
220 gre_tunnel_restack (gre_tunnel_from_fib_node (node));
222 return (FIB_NODE_BACK_WALK_CONTINUE);
226 * Function definition to get a FIB node from its index
229 gre_tunnel_fib_node_get (fib_node_index_t index)
235 gt = pool_elt_at_index (gm->tunnels, index);
241 * Function definition to inform the FIB node that its last lock has gone.
244 gre_tunnel_last_lock_gone (fib_node_t * node)
247 * The MPLS GRE tunnel is a root of the graph. As such
248 * it never has children and thus is never locked.
254 * Virtual function table registered by MPLS GRE tunnels
255 * for participation in the FIB object graph.
257 const static fib_node_vft_t gre_vft = {
258 .fnv_get = gre_tunnel_fib_node_get,
259 .fnv_last_lock = gre_tunnel_last_lock_gone,
260 .fnv_back_walk = gre_tunnel_back_walk,
264 vnet_gre_tunnel_add (vnet_gre_add_del_tunnel_args_t * a,
265 u32 outer_fib_index, u32 * sw_if_indexp)
267 gre_main_t *gm = &gre_main;
268 vnet_main_t *vnm = gm->vnet_main;
269 ip4_main_t *im4 = &ip4_main;
270 ip6_main_t *im6 = &ip6_main;
272 vnet_hw_interface_t *hi;
273 u32 hw_if_index, sw_if_index;
275 u8 is_ipv6 = a->is_ipv6;
276 gre_tunnel_key_t key;
278 t = gre_tunnel_db_find (a, outer_fib_index, &key);
280 return VNET_API_ERROR_IF_ALREADY_EXISTS;
282 pool_get_aligned (gm->tunnels, t, CLIB_CACHE_LINE_BYTES);
283 memset (t, 0, sizeof (*t));
285 /* Reconcile the real dev_instance and a possible requested instance */
286 u32 t_idx = t - gm->tunnels; /* tunnel index (or instance) */
287 u32 u_idx = a->instance; /* user specified instance */
290 if (hash_get (gm->instance_used, u_idx))
292 pool_put (gm->tunnels, t);
293 return VNET_API_ERROR_INSTANCE_IN_USE;
295 hash_set (gm->instance_used, u_idx, 1);
297 t->dev_instance = t_idx; /* actual */
298 t->user_instance = u_idx; /* name */
299 fib_node_init (&t->node, FIB_NODE_TYPE_GRE_TUNNEL);
301 t->type = a->tunnel_type;
302 if (t->type == GRE_TUNNEL_TYPE_ERSPAN)
303 t->session_id = a->session_id;
305 if (t->type == GRE_TUNNEL_TYPE_L3)
306 hw_if_index = vnet_register_interface (vnm, gre_device_class.index, t_idx,
307 gre_hw_interface_class.index,
311 /* Default MAC address (d00b:eed0:0000 + sw_if_index) */
313 { 0xd0, 0x0b, 0xee, 0xd0, (u8) (t_idx >> 8), (u8) t_idx };
315 ethernet_register_interface (vnm, gre_device_class.index, t_idx,
316 address, &hw_if_index, 0);
319 clib_error_report (error);
320 return VNET_API_ERROR_INVALID_REGISTRATION;
324 /* Set GRE tunnel interface output node (not used for L3 payload) */
325 vnet_set_interface_output_node (vnm, hw_if_index, gre_encap_node.index);
327 hi = vnet_get_hw_interface (vnm, hw_if_index);
328 sw_if_index = hi->sw_if_index;
330 t->hw_if_index = hw_if_index;
331 t->outer_fib_index = outer_fib_index;
332 t->sw_if_index = sw_if_index;
333 t->l2_adj_index = ADJ_INDEX_INVALID;
335 vec_validate_init_empty (gm->tunnel_index_by_sw_if_index, sw_if_index, ~0);
336 gm->tunnel_index_by_sw_if_index[sw_if_index] = t_idx;
340 vec_validate (im4->fib_index_by_sw_if_index, sw_if_index);
341 hi->min_packet_bytes =
342 64 + sizeof (gre_header_t) + sizeof (ip4_header_t);
346 vec_validate (im6->fib_index_by_sw_if_index, sw_if_index);
347 hi->min_packet_bytes =
348 64 + sizeof (gre_header_t) + sizeof (ip6_header_t);
351 hi->per_packet_overhead_bytes =
352 /* preamble */ 8 + /* inter frame gap */ 12;
354 /* Standard default gre MTU. */
355 hi->max_l3_packet_bytes[VLIB_RX] = hi->max_l3_packet_bytes[VLIB_TX] = 9000;
358 * source the FIB entry for the tunnel's destination
359 * and become a child thereof. The tunnel will then get poked
360 * when the forwarding for the entry updates, and the tunnel can
361 * re-stack accordingly
364 clib_memcpy (&t->tunnel_src, &a->src, sizeof (t->tunnel_src));
365 t->tunnel_dst.fp_len = !is_ipv6 ? 32 : 128;
366 t->tunnel_dst.fp_proto = !is_ipv6 ? FIB_PROTOCOL_IP4 : FIB_PROTOCOL_IP6;
367 t->tunnel_dst.fp_addr = a->dst;
369 gre_tunnel_db_add (t, &key);
370 if (t->type == GRE_TUNNEL_TYPE_ERSPAN)
375 gre_mk_sn_key (t, &skey);
376 gre_sn = (gre_sn_t *) hash_get_mem (gm->seq_num_by_key, &skey);
384 gre_sn = clib_mem_alloc (sizeof (gre_sn_t));
386 gre_sn->ref_count = 1;
388 hash_set_mem_alloc (&gm->seq_num_by_key, &skey, (uword) gre_sn);
392 t->fib_entry_index = fib_table_entry_special_add
393 (outer_fib_index, &t->tunnel_dst, FIB_SOURCE_RR, FIB_ENTRY_FLAG_NONE);
394 t->sibling_index = fib_entry_child_add
395 (t->fib_entry_index, FIB_NODE_TYPE_GRE_TUNNEL, t_idx);
397 if (t->type != GRE_TUNNEL_TYPE_L3)
399 t->l2_adj_index = adj_nbr_add_or_lock
400 (t->tunnel_dst.fp_proto, VNET_LINK_ETHERNET, &zero_addr, sw_if_index);
401 gre_update_adj (vnm, t->sw_if_index, t->l2_adj_index);
405 *sw_if_indexp = sw_if_index;
411 vnet_gre_tunnel_delete (vnet_gre_add_del_tunnel_args_t * a,
412 u32 outer_fib_index, u32 * sw_if_indexp)
414 gre_main_t *gm = &gre_main;
415 vnet_main_t *vnm = gm->vnet_main;
417 gre_tunnel_key_t key;
420 t = gre_tunnel_db_find (a, outer_fib_index, &key);
422 return VNET_API_ERROR_NO_SUCH_ENTRY;
424 sw_if_index = t->sw_if_index;
425 vnet_sw_interface_set_flags (vnm, sw_if_index, 0 /* down */ );
427 /* make sure tunnel is removed from l2 bd or xconnect */
428 set_int_l2_mode (gm->vlib_main, vnm, MODE_L3, sw_if_index, 0, 0, 0, 0);
429 gm->tunnel_index_by_sw_if_index[sw_if_index] = ~0;
431 if (t->type == GRE_TUNNEL_TYPE_L3)
432 vnet_delete_hw_interface (vnm, t->hw_if_index);
434 ethernet_delete_interface (vnm, t->hw_if_index);
436 if (t->l2_adj_index != ADJ_INDEX_INVALID)
437 adj_unlock (t->l2_adj_index);
439 fib_entry_child_remove (t->fib_entry_index, t->sibling_index);
440 fib_table_entry_delete_index (t->fib_entry_index, FIB_SOURCE_RR);
442 ASSERT ((t->type != GRE_TUNNEL_TYPE_ERSPAN) || (t->gre_sn != NULL));
443 if ((t->type == GRE_TUNNEL_TYPE_ERSPAN) && (t->gre_sn->ref_count-- == 1))
446 gre_mk_sn_key (t, &skey);
447 hash_unset_mem_free (&gm->seq_num_by_key, &skey);
448 clib_mem_free (t->gre_sn);
451 hash_unset (gm->instance_used, t->user_instance);
452 gre_tunnel_db_remove (t);
453 fib_node_deinit (&t->node);
454 pool_put (gm->tunnels, t);
457 *sw_if_indexp = sw_if_index;
463 vnet_gre_add_del_tunnel (vnet_gre_add_del_tunnel_args_t * a,
469 outer_fib_index = ip4_fib_index_from_table_id (a->outer_fib_id);
471 outer_fib_index = ip6_fib_index_from_table_id (a->outer_fib_id);
473 if (~0 == outer_fib_index)
474 return VNET_API_ERROR_NO_SUCH_FIB;
476 if (a->session_id > GTK_SESSION_ID_MAX)
477 return VNET_API_ERROR_INVALID_SESSION_ID;
480 return (vnet_gre_tunnel_add (a, outer_fib_index, sw_if_indexp));
482 return (vnet_gre_tunnel_delete (a, outer_fib_index, sw_if_indexp));
486 gre_interface_admin_up_down (vnet_main_t * vnm, u32 hw_if_index, u32 flags)
488 gre_main_t *gm = &gre_main;
489 vnet_hw_interface_t *hi;
493 hi = vnet_get_hw_interface (vnm, hw_if_index);
495 if (NULL == gm->tunnel_index_by_sw_if_index ||
496 hi->sw_if_index >= vec_len (gm->tunnel_index_by_sw_if_index))
499 ti = gm->tunnel_index_by_sw_if_index[hi->sw_if_index];
502 /* not one of ours */
505 t = pool_elt_at_index (gm->tunnels, ti);
507 if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
508 vnet_hw_interface_set_flags (vnm, hw_if_index,
509 VNET_HW_INTERFACE_FLAG_LINK_UP);
511 vnet_hw_interface_set_flags (vnm, hw_if_index, 0 /* down */ );
513 gre_tunnel_restack (t);
515 return /* no error */ 0;
518 static clib_error_t *
519 create_gre_tunnel_command_fn (vlib_main_t * vm,
520 unformat_input_t * input,
521 vlib_cli_command_t * cmd)
523 unformat_input_t _line_input, *line_input = &_line_input;
524 vnet_gre_add_del_tunnel_args_t _a, *a = &_a;
525 ip46_address_t src, dst;
527 u32 outer_fib_id = 0;
528 gre_tunnel_type_t t_type = GRE_TUNNEL_TYPE_L3;
534 clib_error_t *error = NULL;
538 /* Get a line of input. */
539 if (!unformat_user (input, unformat_line_input, line_input))
542 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
544 if (unformat (line_input, "del"))
546 else if (unformat (line_input, "instance %d", &instance))
549 if (unformat (line_input, "src %U", unformat_ip4_address, &src.ip4))
555 if (unformat (line_input, "dst %U", unformat_ip4_address, &dst.ip4))
561 if (unformat (line_input, "src %U", unformat_ip6_address, &src.ip6))
567 if (unformat (line_input, "dst %U", unformat_ip6_address, &dst.ip6))
572 else if (unformat (line_input, "outer-fib-id %d", &outer_fib_id))
574 else if (unformat (line_input, "teb"))
575 t_type = GRE_TUNNEL_TYPE_TEB;
576 else if (unformat (line_input, "erspan %d", &session_id))
577 t_type = GRE_TUNNEL_TYPE_ERSPAN;
580 error = clib_error_return (0, "unknown input `%U'",
581 format_unformat_error, line_input);
588 error = clib_error_return (0, "mandatory argument(s) missing");
592 if ((ipv4_set && memcmp (&src.ip4, &dst.ip4, sizeof (src.ip4)) == 0) ||
593 (ipv6_set && memcmp (&src.ip6, &dst.ip6, sizeof (src.ip6)) == 0))
595 error = clib_error_return (0, "src and dst are identical");
599 if (ipv4_set && ipv6_set)
600 return clib_error_return (0, "both IPv4 and IPv6 addresses specified");
602 if ((ipv4_set && memcmp (&dst.ip4, &zero_addr.ip4, sizeof (dst.ip4)) == 0)
604 && memcmp (&dst.ip6, &zero_addr.ip6, sizeof (dst.ip6)) == 0))
606 error = clib_error_return (0, "dst address cannot be zero");
610 memset (a, 0, sizeof (*a));
612 a->outer_fib_id = outer_fib_id;
613 a->tunnel_type = t_type;
614 a->session_id = session_id;
615 a->is_ipv6 = ipv6_set;
616 a->instance = instance;
619 clib_memcpy (&a->src.ip4, &src.ip4, sizeof (src.ip4));
620 clib_memcpy (&a->dst.ip4, &dst.ip4, sizeof (dst.ip4));
624 clib_memcpy (&a->src.ip6, &src.ip6, sizeof (src.ip6));
625 clib_memcpy (&a->dst.ip6, &dst.ip6, sizeof (dst.ip6));
628 rv = vnet_gre_add_del_tunnel (a, &sw_if_index);
633 vlib_cli_output (vm, "%U\n", format_vnet_sw_if_index_name,
634 vnet_get_main (), sw_if_index);
636 case VNET_API_ERROR_IF_ALREADY_EXISTS:
637 error = clib_error_return (0, "GRE tunnel already exists...");
639 case VNET_API_ERROR_NO_SUCH_FIB:
640 error = clib_error_return (0, "outer fib ID %d doesn't exist\n",
643 case VNET_API_ERROR_NO_SUCH_ENTRY:
644 error = clib_error_return (0, "GRE tunnel doesn't exist");
646 case VNET_API_ERROR_INVALID_SESSION_ID:
647 error = clib_error_return (0, "session ID %d out of range\n",
650 case VNET_API_ERROR_INSTANCE_IN_USE:
651 error = clib_error_return (0, "Instance is in use");
655 clib_error_return (0, "vnet_gre_add_del_tunnel returned %d", rv);
660 unformat_free (line_input);
666 VLIB_CLI_COMMAND (create_gre_tunnel_command, static) = {
667 .path = "create gre tunnel",
668 .short_help = "create gre tunnel src <addr> dst <addr> [instance <n>] "
669 "[outer-fib-id <fib>] [teb | erspan <session-id>] [del]",
670 .function = create_gre_tunnel_command_fn,
674 static clib_error_t *
675 show_gre_tunnel_command_fn (vlib_main_t * vm,
676 unformat_input_t * input,
677 vlib_cli_command_t * cmd)
679 gre_main_t *gm = &gre_main;
683 if (pool_elts (gm->tunnels) == 0)
684 vlib_cli_output (vm, "No GRE tunnels configured...");
686 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
688 if (unformat (input, "%d", &ti))
697 pool_foreach (t, gm->tunnels,
699 vlib_cli_output (vm, "%U", format_gre_tunnel, t);
705 t = pool_elt_at_index (gm->tunnels, ti);
707 vlib_cli_output (vm, "%U", format_gre_tunnel, t);
714 VLIB_CLI_COMMAND (show_gre_tunnel_command, static) = {
715 .path = "show gre tunnel",
716 .function = show_gre_tunnel_command_fn,
720 /* force inclusion from application's main.c */
722 gre_interface_init (vlib_main_t * vm)
724 fib_node_register_type (FIB_NODE_TYPE_GRE_TUNNEL, &gre_vft);
729 VLIB_INIT_FUNCTION (gre_interface_init);
732 * fd.io coding-style-patch-verification: ON
735 * eval: (c-set-style "gnu")