2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vnet/mfib/ip6_mfib.h>
18 #include <vnet/mfib/mfib_table.h>
19 #include <vnet/mfib/mfib_entry.h>
20 #include <vnet/fib/ip6_fib.h>
/*
 * The one table instance used by every IPv6 mfib in this file. The code below
 * reads and writes its ip6_mhash bihash, dst_address_length_refcounts[],
 * non_empty_dst_address_length_bitmap and prefix_lengths_in_search_order.
 */
22 ip6_mfib_table_instance_t ip6_mfib_table;
25 * Key/value pair type used for the mfib bihash (40 byte key, 8 byte value)
27 typedef clib_bihash_kv_40_8_t ip6_mfib_key_t;
/*
 * Constant IPv6 mfib prefix. ip6_mfib_table_destroy() looks it up by exact
 * match and hands the result to mfib_table_entry_delete_index() together with
 * MFIB_SOURCE_DEFAULT_ROUTE.
 * NOTE(review): going by the name, the address and length fields are
 * presumably all zero - confirm against the full initialiser.
 */
29 static const mfib_prefix_t all_zeros = {
38 .fp_proto = FIB_PROTOCOL_IP6,
/*
 * Kind of special group, stored in ip6_mfib_special_t.ims_type.
 * FOR_EACH_IP6_SPECIAL tests for IP6_MFIB_SPECIAL_TYPE_SOLICITED and, for
 * those entries, builds the group with
 * ip6_set_solicited_node_multicast_address(); other entries presumably go
 * through ip6_set_reserved_multicast_address() - confirm in the macro.
 */
41 typedef enum ip6_mfib_special_type_t_ {
42 IP6_MFIB_SPECIAL_TYPE_NONE,
43 IP6_MFIB_SPECIAL_TYPE_SOLICITED,
44 } ip6_mfib_special_type_t;
/*
 * Element type of ip6_mfib_specials[]. FOR_EACH_IP6_SPECIAL reads ims_type to
 * choose how the group address is built and copies ims_len into the prefix
 * length; the table initialisers also set ims_scope and ims_byte.
 */
46 typedef struct ip6_mfib_special_t_ {
48 * @brief solicited or not
50 ip6_mfib_special_type_t ims_type;
53 * @brief the Prefix length
58 * @brief The last byte of the mcast address
62 * @brief The scope of the address
/*
 * Table of the special multicast groups handled by this file. It is only
 * consumed through FOR_EACH_IP6_SPECIAL, which table create/destroy and
 * interface enable/disable use to update or remove a path on each group.
 */
67 static const ip6_mfib_special_t ip6_mfib_specials[] =
71 * Add ff02::1:ff00:0/104 via local route for all tables.
72 * This is required for neighbor discovery to work.
74 .ims_type = IP6_MFIB_SPECIAL_TYPE_SOLICITED,
79 * all-routers multicast address
81 .ims_type = IP6_MFIB_SPECIAL_TYPE_NONE,
82 .ims_scope = IP6_MULTICAST_SCOPE_link_local,
83 .ims_byte = IP6_MULTICAST_GROUP_ID_all_routers,
88 * all-nodes multicast address
90 .ims_type = IP6_MFIB_SPECIAL_TYPE_NONE,
91 .ims_scope = IP6_MULTICAST_SCOPE_link_local,
92 .ims_byte = IP6_MULTICAST_GROUP_ID_all_hosts,
97 * Add all-mldv2 multicast address via local route for all tables
99 .ims_type = IP6_MFIB_SPECIAL_TYPE_NONE,
101 .ims_scope = IP6_MULTICAST_SCOPE_link_local,
102 .ims_byte = IP6_MULTICAST_GROUP_ID_mldv2_routers,
/*
 * Run _body once for every element of ip6_mfib_specials[].
 *
 * _pfx must point to a writable mfib_prefix_t. Before each execution of _body
 * the macro fills (_pfx)->fp_grp_addr.ip6 from the current element (via
 * ip6_set_solicited_node_multicast_address() for SOLICITED entries, via
 * ip6_set_reserved_multicast_address() otherwise) and sets (_pfx)->fp_len to
 * the element's ims_len. _body is wrapped in do { } while (0).
 */
106 #define FOR_EACH_IP6_SPECIAL(_pfx, _body) \
108 const ip6_mfib_special_t *_spec; \
111 _ii < ARRAY_LEN(ip6_mfib_specials); \
114 _spec = &ip6_mfib_specials[_ii]; \
115 if (IP6_MFIB_SPECIAL_TYPE_SOLICITED == _spec->ims_type) \
117 ip6_set_solicited_node_multicast_address( \
118 &(_pfx)->fp_grp_addr.ip6, 0); \
122 ip6_set_reserved_multicast_address ( \
123 &(_pfx)->fp_grp_addr.ip6, \
127 (_pfx)->fp_len = _spec->ims_len; \
128 do { _body; } while (0); \
/*
 * Create a new IPv6 mfib table.
 *
 * Takes a cache-line aligned element from the ip6_main.mfibs pool, zeroes it,
 * records its pool position as both mft_index and v6.index, enters that index
 * in ip6_main.mfib_index_by_table_id and locks the table on behalf of src.
 * It then installs an MFIB_SOURCE_DEFAULT_ROUTE entry flagged
 * MFIB_ENTRY_FLAG_DROP and calls mfib_table_entry_path_update() for every
 * group produced by FOR_EACH_IP6_SPECIAL (presumably with path_for_us, the
 * FIB_ROUTE_PATH_LOCAL / MFIB_ITF_FLAG_FORWARD path declared below).
 *
 * Returns the index of the new table.
 */
134 ip6_create_mfib_with_table_id (u32 table_id,
137 mfib_table_t *mfib_table;
138 mfib_prefix_t pfx = {
139 .fp_proto = FIB_PROTOCOL_IP6,
141 const fib_route_path_t path_for_us = {
142 .frp_proto = DPO_PROTO_IP6,
143 .frp_addr = zero_addr,
144 .frp_sw_if_index = 0xffffffff,
147 .frp_flags = FIB_ROUTE_PATH_LOCAL,
148 .frp_mitf_flags = MFIB_ITF_FLAG_FORWARD,
151 pool_get_aligned(ip6_main.mfibs, mfib_table, CLIB_CACHE_LINE_BYTES);
152 clib_memset(mfib_table, 0, sizeof(*mfib_table));
154 mfib_table->mft_proto = FIB_PROTOCOL_IP6;
155 mfib_table->mft_index =
156 mfib_table->v6.index =
157 (mfib_table - ip6_main.mfibs);
/* make the new table reachable through the table-id hash */
159 hash_set (ip6_main.mfib_index_by_table_id,
161 mfib_table->mft_index);
163 mfib_table->mft_table_id =
164 mfib_table->v6.table_id =
167 mfib_table_lock(mfib_table->mft_index, FIB_PROTOCOL_IP6, src);
170 * add the special entries into the new FIB
172 mfib_table_entry_update(mfib_table->mft_index,
174 MFIB_SOURCE_DEFAULT_ROUTE,
176 MFIB_ENTRY_FLAG_DROP);
179 * Add each of the specials
181 FOR_EACH_IP6_SPECIAL(&pfx,
183 mfib_table_entry_path_update(mfib_table->mft_index,
189 return (mfib_table->mft_index);
/*
 * Tear down an IPv6 mfib table; mfib is cast directly to mfib_table_t *.
 *
 * Mirrors table creation: calls mfib_table_entry_path_remove() for every
 * group produced by FOR_EACH_IP6_SPECIAL, then looks up all_zeros by exact
 * match and deletes its MFIB_SOURCE_DEFAULT_ROUTE source. After that the
 * table is asserted to hold no routes and to have a table id other than ~0,
 * is removed from ip6_main.mfib_index_by_table_id and is returned to the
 * ip6_main.mfibs pool.
 */
193 ip6_mfib_table_destroy (ip6_mfib_t *mfib)
195 mfib_table_t *mfib_table = (mfib_table_t*)mfib;
196 fib_node_index_t mfei;
197 mfib_prefix_t pfx = {
198 .fp_proto = FIB_PROTOCOL_IP6,
200 const fib_route_path_t path_for_us = {
201 .frp_proto = DPO_PROTO_IP6,
202 .frp_addr = zero_addr,
203 .frp_sw_if_index = 0xffffffff,
206 .frp_flags = FIB_ROUTE_PATH_LOCAL,
210 * remove all the specials we added when the table was created.
212 FOR_EACH_IP6_SPECIAL(&pfx,
214 mfib_table_entry_path_remove(mfib_table->mft_index,
220 mfei = mfib_table_lookup_exact_match(mfib_table->mft_index, &all_zeros);
221 mfib_table_entry_delete_index(mfei, MFIB_SOURCE_DEFAULT_ROUTE);
224 * validate no more routes.
226 ASSERT(0 == mfib_table->mft_total_route_counts);
227 ASSERT(~0 != mfib_table->mft_table_id);
/* unregister the table id, then hand the table back to the pool */
229 hash_unset (ip6_main.mfib_index_by_table_id, mfib_table->mft_table_id);
230 pool_put(ip6_main.mfibs, mfib_table);
/*
 * Update or remove a path via sw_if_index on every special group of the
 * mfib that ip6_mfib_table_get_index_for_sw_if_index() returns for the
 * interface. The path is built with MFIB_ITF_FLAG_ACCEPT.
 *
 * Two FOR_EACH_IP6_SPECIAL passes exist: one calling
 * mfib_table_entry_path_update() and one calling
 * mfib_table_entry_path_remove().
 * NOTE(review): presumably is_enable != 0 selects the update pass and
 * is_enable == 0 the remove pass - confirm against the branch condition.
 */
234 ip6_mfib_interface_enable_disable (u32 sw_if_index, int is_enable)
236 const fib_route_path_t path = {
237 .frp_proto = DPO_PROTO_IP6,
238 .frp_addr = zero_addr,
239 .frp_sw_if_index = sw_if_index,
242 .frp_mitf_flags = MFIB_ITF_FLAG_ACCEPT,
244 mfib_prefix_t pfx = {
245 .fp_proto = FIB_PROTOCOL_IP6,
249 mfib_index = ip6_mfib_table_get_index_for_sw_if_index(sw_if_index);
253 FOR_EACH_IP6_SPECIAL(&pfx,
255 mfib_table_entry_path_update(mfib_index,
263 FOR_EACH_IP6_SPECIAL(&pfx,
265 mfib_table_entry_path_remove(mfib_index,
/*
 * Resolve table_id to an mfib index via ip6_mfib_index_from_table_id().
 * One path creates the table with ip6_create_mfib_with_table_id(), which
 * takes the lock for src itself; the other path locks the existing table
 * for src with mfib_table_lock().
 * NOTE(review): presumably the create path is taken when the lookup finds
 * no table, and the locked index is returned otherwise - confirm.
 */
274 ip6_mfib_table_find_or_create_and_lock (u32 table_id,
279 index = ip6_mfib_index_from_table_id(table_id);
281 return ip6_create_mfib_with_table_id(table_id, src);
282 mfib_table_lock(index, FIB_PROTOCOL_IP6, src);
/*
 * Return the mfib index stored for sw_if_index in
 * ip6_main.mfib_index_by_sw_if_index. Values of sw_if_index at or beyond the
 * length of that vector take a separate early path, described by the
 * comment below as interfaces that are not yet mapped.
 */
288 ip6_mfib_table_get_index_for_sw_if_index (u32 sw_if_index)
290 if (sw_if_index >= vec_len(ip6_main.mfib_index_by_sw_if_index))
293 * This is the case for interfaces that are not yet mapped to
298 return (ip6_main.mfib_index_by_sw_if_index[sw_if_index]);
/*
 * Clamp a length to at most 128; used by IP6_MFIB_MK_KEY to index
 * ip6_main.fib_masks[].
 * NOTE(review): _len is not parenthesised and is evaluated twice, so pass a
 * plain variable or constant, not an expression with side effects.
 */
301 #define IPV6_MFIB_GRP_LEN(_len) \
302 (_len > 128 ? 128 : _len)
/*
 * Fill _key (an ip6_mfib_key_t) for a lookup, insert or delete:
 *   key[0..1]  the two u64 words of _grp ANDed with
 *              ip6_main.fib_masks[IPV6_MFIB_GRP_LEN(_len)]
 *   key[2..3]  the two u64 words of _src (confirm under which condition
 *              these assignments run before relying on this)
 *   key[4]     _mfib->index in the upper 32 bits, the length in the lower 32
 *
 * NOTE(review): the final assignment ORs in `len`, not the macro parameter
 * `_len`. It therefore only compiles and behaves as intended when the
 * caller's length variable is literally named `len`, which holds for every
 * use in this file. Arguments are also not parenthesised.
 */
304 #define IP6_MFIB_MK_KEY(_mfib, _grp, _src, _len, _key) \
306 _key.key[0] = (_grp->as_u64[0] & \
307 ip6_main.fib_masks[IPV6_MFIB_GRP_LEN(_len)].as_u64[0]); \
308 _key.key[1] = (_grp->as_u64[1] & \
309 ip6_main.fib_masks[IPV6_MFIB_GRP_LEN(_len)].as_u64[1]); \
311 _key.key[2] = _src->as_u64[0]; \
312 _key.key[3] = _src->as_u64[1]; \
317 _key.key[4] = _mfib->index; \
318 _key.key[4] = (_key.key[4] << 32) | len; \
322 * ip6_mfib_table_lookup_exact_match
324 * Exact match prefix lookup
/*
 * Look up the entry stored for exactly (mfib, grp, src, len).
 *
 * Builds the key with IP6_MFIB_MK_KEY and probes ip6_mfib_table.ip6_mhash
 * once; no other lengths are tried. Falls through to
 * FIB_NODE_INDEX_INVALID.
 * NOTE(review): presumably the stored value is returned when the search
 * succeeds - confirm.
 */
327 ip6_mfib_table_lookup_exact_match (const ip6_mfib_t *mfib,
328 const ip6_address_t *grp,
329 const ip6_address_t *src,
332 ip6_mfib_key_t key, value;
335 IP6_MFIB_MK_KEY(mfib, grp, src, len, key);
337 rv = clib_bihash_search_inline_2_40_8(&ip6_mfib_table.ip6_mhash,
342 return (FIB_NODE_INDEX_INVALID);
346 * ip6_mfib_table_fwd_lookup
348 * Longest prefix match for the forwarding plane (no mask given)
/*
 * Lookup used when no mask length is supplied.
 *
 * Walks table->prefix_lengths_in_search_order from the first element; for
 * each length it builds a key for (mfib, grp, src) with IP6_MFIB_MK_KEY and
 * probes the bihash. Every length is asserted to lie in [0, 256]. Falls
 * through to FIB_NODE_INDEX_INVALID once the loop is exhausted.
 * NOTE(review): presumably the first successful probe returns the stored
 * value - confirm.
 */
351 ip6_mfib_table_fwd_lookup (const ip6_mfib_t *mfib,
352 const ip6_address_t *src,
353 const ip6_address_t *grp)
355 ip6_mfib_table_instance_t *table;
356 ip6_mfib_key_t key, value;
360 table = &ip6_mfib_table;
361 n = vec_len (table->prefix_lengths_in_search_order);
363 for (i = 0; i < n; i++)
365 len = table->prefix_lengths_in_search_order[i];
367 ASSERT(len >= 0 && len <= 256);
368 IP6_MFIB_MK_KEY(mfib, grp, src, len, key);
369 rv = clib_bihash_search_inline_2_40_8(&table->ip6_mhash, &key, &value);
374 return (FIB_NODE_INDEX_INVALID);
/*
 * Find the covering (less specific) entry for (src, grp).
 *
 * Returns the result of ip6_mfib_table_lookup() called with a mask length
 * (mask_len) computed in this function. Per the notes below, the idea is to
 * run a longest-prefix match with a shorter mask instead of walking a tree.
 */
379 ip6_mfib_table_get_less_specific (const ip6_mfib_t *mfib,
380 const ip6_address_t *src,
381 const ip6_address_t *grp,
387 * in the absence of a tree structure for the table that allows for an O(1)
388 * parent get, a cheeky way to find the cover is to LPM for the prefix with
390 * there should always be a cover, though it may be the default route. the
391 * default route's cover is the default route.
395 /* go from (S,G) to (*,G*) */
407 return (ip6_mfib_table_lookup(mfib, src, grp, mask_len));
411 * ip6_mfib_table_lookup
413 * Longest prefix match
/*
 * Longest-prefix match that never matches an entry longer than the length
 * passed in.
 *
 * First skips the leading elements of prefix_lengths_in_search_order that
 * are greater than len, then takes lengths from that vector, builds a key
 * for (mfib, grp, src) at each one and probes the bihash. Falls through to
 * FIB_NODE_INDEX_INVALID.
 * NOTE(review): presumably the first successful probe returns the stored
 * value - confirm.
 */
416 ip6_mfib_table_lookup (const ip6_mfib_t *mfib,
417 const ip6_address_t *src,
418 const ip6_address_t *grp,
421 ip6_mfib_table_instance_t *table;
422 ip6_mfib_key_t key, value;
425 table = &ip6_mfib_table;
426 n = vec_len (table->prefix_lengths_in_search_order);
429 * start search from a mask length same length or shorter.
430 * we don't want matches longer than the mask passed
433 while (i < n && table->prefix_lengths_in_search_order[i] > len)
440 len = table->prefix_lengths_in_search_order[i];
443 IP6_MFIB_MK_KEY(mfib, grp, src, len, key);
445 rv = clib_bihash_search_inline_2_40_8(&table->ip6_mhash, &key, &value);
450 return (FIB_NODE_INDEX_INVALID);
/*
 * Rebuild table->prefix_lengths_in_search_order from
 * table->non_empty_dst_address_length_bitmap.
 *
 * The vector is emptied, then one element (256 - i) is appended for every
 * set bit i visited by clib_bitmap_foreach. Called by the insert and remove
 * routines whenever a length's refcount moves between zero and non-zero.
 */
454 compute_prefix_lengths_in_search_order (ip6_mfib_table_instance_t *table)
457 vec_reset_length (table->prefix_lengths_in_search_order);
458 /* Note: bitmap reversed so this is in fact a longest prefix match */
459 clib_bitmap_foreach (i, table->non_empty_dst_address_length_bitmap)
461 vec_add1(table->prefix_lengths_in_search_order, (256 - i));
/*
 * Store mfib_entry_index in the shared bihash under the key built from
 * (mfib, grp, src, len).
 *
 * Also maintains the per-length bookkeeping: the refcount for len is
 * incremented and, if it was zero beforehand, the bitmap of non-empty
 * lengths is updated and the search order is recomputed.
 */
466 ip6_mfib_table_entry_insert (ip6_mfib_t *mfib,
467 const ip6_address_t *grp,
468 const ip6_address_t *src,
470 fib_node_index_t mfib_entry_index)
472 ip6_mfib_table_instance_t *table;
475 table = &ip6_mfib_table;
476 IP6_MFIB_MK_KEY(mfib, grp, src, len, key);
477 key.value = mfib_entry_index;
/* final argument 1 => add */
479 clib_bihash_add_del_40_8(&table->ip6_mhash, &key, 1);
/* post-increment: the test sees the refcount as it was before this insert */
481 if (0 == table->dst_address_length_refcounts[len]++)
483 table->non_empty_dst_address_length_bitmap =
484 clib_bitmap_set (table->non_empty_dst_address_length_bitmap,
486 compute_prefix_lengths_in_search_order (table);
/*
 * Delete the bihash entry keyed by (mfib, grp, src, len).
 *
 * Counterpart of ip6_mfib_table_entry_insert(): the refcount for len is
 * asserted to be positive and then decremented; when it reaches zero the
 * bitmap of non-empty lengths is updated and the search order is
 * recomputed.
 */
491 ip6_mfib_table_entry_remove (ip6_mfib_t *mfib,
492 const ip6_address_t *grp,
493 const ip6_address_t *src,
496 ip6_mfib_table_instance_t *table;
499 IP6_MFIB_MK_KEY(mfib, grp, src, len, key);
501 table = &ip6_mfib_table;
/* final argument 0 => delete */
502 clib_bihash_add_del_40_8(&table->ip6_mhash, &key, 0);
504 ASSERT (table->dst_address_length_refcounts[len] > 0);
505 if (--table->dst_address_length_refcounts[len] == 0)
507 table->non_empty_dst_address_length_bitmap =
508 clib_bitmap_set (table->non_empty_dst_address_length_bitmap,
510 compute_prefix_lengths_in_search_order (table);
/*
 * Module init hook, registered through VLIB_INIT_FUNCTION below.
 * NOTE(review): document here what the body sets up once confirmed.
 */
514 static clib_error_t *
515 ip6_mfib_module_init (vlib_main_t * vm)
520 VLIB_INIT_FUNCTION(ip6_mfib_module_init);
/*
 * format() helper producing one line of memory statistics for the IPv6
 * mfib. bytes_inuse is read with alloc_arena_next() on the shared bihash,
 * and the number of tables comes from pool_elts(ip6_main.mfibs). The line
 * uses the "%=30s %=6d %=12ld\n" layout.
 */
523 format_ip6_mfib_table_memory (u8 * s, va_list * args)
527 bytes_inuse = alloc_arena_next(&(ip6_mfib_table.ip6_mhash));
529 s = format(s, "%=30s %=6d %=12ld\n",
531 pool_elts(ip6_main.mfibs),
/*
 * CLI helper: print a single entry of mfib in MFIB_ENTRY_FORMAT_DETAIL.
 *
 * One branch prints the result of ip6_mfib_table_get_less_specific(), the
 * other the result of ip6_mfib_table_lookup(), both for
 * (src, grp, mask_len).
 * NOTE(review): the branch is presumably selected by the caller's "cover"
 * flag - confirm.
 */
538 ip6_mfib_table_show_one (ip6_mfib_t *mfib,
547 vlib_cli_output(vm, "%U",
549 ip6_mfib_table_get_less_specific(mfib, src, grp, mask_len),
550 MFIB_ENTRY_FORMAT_DETAIL);
554 vlib_cli_output(vm, "%U",
556 ip6_mfib_table_lookup(mfib, src, grp, mask_len),
557 MFIB_ENTRY_FORMAT_DETAIL);
/*
 * Walk context used by ip6_mfib_table_show_all(): entries is a vector that
 * ip6_mfib_table_collect_entries() appends one entry index to per callback.
 */
561 typedef struct ip6_mfib_show_ctx_t_ {
562 fib_node_index_t *entries;
563 } ip6_mfib_show_ctx_t;
/*
 * Table-walk callback: arg is an ip6_mfib_show_ctx_t; mfei is appended to
 * its entries vector. Always returns WALK_CONTINUE.
 */
567 ip6_mfib_table_collect_entries (fib_node_index_t mfei, void *arg)
569 ip6_mfib_show_ctx_t *ctx = arg;
571 vec_add1(ctx->entries, mfei);
573 return (WALK_CONTINUE);
/*
 * CLI helper: print every entry of mfib in MFIB_ENTRY_FORMAT_BRIEF.
 *
 * The entry indices are first gathered with ip6_mfib_table_walk() and
 * ip6_mfib_table_collect_entries(), then sorted with
 * mfib_entry_cmp_for_sort, printed one by one, and the temporary vector is
 * freed at the end.
 */
577 ip6_mfib_table_show_all (ip6_mfib_t *mfib,
580 fib_node_index_t *mfib_entry_index;
581 ip6_mfib_show_ctx_t ctx = {
585 ip6_mfib_table_walk(mfib,
586 ip6_mfib_table_collect_entries,
589 vec_sort_with_function(ctx.entries, mfib_entry_cmp_for_sort);
591 vec_foreach(mfib_entry_index, ctx.entries)
593 vlib_cli_output(vm, "%U",
596 MFIB_ENTRY_FORMAT_BRIEF);
599 vec_free(ctx.entries);
603 * @brief Context when walking the IPv6 table. Since all VRFs are in the
604 * same hash table, we need to filter only those we need as we walk
/*
 * Field usage, as seen in ip6_mfib_walk_cb(): i6w_mfib_index is compared
 * with the table index held in the upper 32 bits of key[4]; on a match
 * i6w_fn is called with the stored value and i6w_ctx.
 */
606 typedef struct ip6_mfib_walk_ctx_t_
609 mfib_table_walk_fn_t i6w_fn;
611 } ip6_mfib_walk_ctx_t;
/*
 * Per key/value callback for the bihash walk; arg is an
 * ip6_mfib_walk_ctx_t.
 *
 * Only pairs whose table index (upper 32 bits of key[4]) equals
 * ctx->i6w_mfib_index are passed to the user's function. The value that
 * function returns is not used here, and the bihash walk always continues.
 */
614 ip6_mfib_walk_cb (clib_bihash_kv_40_8_t * kvp,
617 ip6_mfib_walk_ctx_t *ctx = arg;
/* the hash is shared by all tables: filter on the index packed into the key */
619 if ((kvp->key[4] >> 32) == ctx->i6w_mfib_index)
621 ctx->i6w_fn(kvp->value, ctx->i6w_ctx);
623 return (BIHASH_WALK_CONTINUE);
/*
 * Call fn for the entries that belong to mfib.
 *
 * Builds an ip6_mfib_walk_ctx_t carrying mfib->index and iterates over the
 * whole of ip6_mfib_table.ip6_mhash with
 * clib_bihash_foreach_key_value_pair_40_8(), so the cost depends on the
 * total number of entries in all tables, not only this one.
 * NOTE(review): the per-pair callback is presumably ip6_mfib_walk_cb -
 * confirm.
 */
627 ip6_mfib_table_walk (ip6_mfib_t *mfib,
628 mfib_table_walk_fn_t fn,
631 ip6_mfib_walk_ctx_t ctx = {
632 .i6w_mfib_index = mfib->index,
637 clib_bihash_foreach_key_value_pair_40_8(
638 &ip6_mfib_table.ip6_mhash,
/*
 * CLI handler registered for "show ip6 mfib".
 *
 * Accepted input tokens, tried in this order on each pass of the parse loop:
 *   brief | summary | sum
 *   <src-addr> <grp-addr>
 *   <grp-addr>/<mask>        (src is zeroed)
 *   <grp-addr>               (src is zeroed)
 *   table <table-id>
 *   index <fib-index>
 *   cover
 *
 * After parsing, every table in ip6_main.mfibs is visited. A table is
 * filtered on table_id when table_id >= 0 and on fib_index when
 * fib_index != ~0. For each remaining table a header line is printed,
 * followed by either ip6_mfib_table_show_all() or
 * ip6_mfib_table_show_one() with the parsed src, grp, mask and cover.
 */
643 static clib_error_t *
644 ip6_show_mfib (vlib_main_t * vm,
645 unformat_input_t * input,
646 vlib_cli_command_t * cmd)
648 ip6_main_t * im6 = &ip6_main;
649 mfib_table_t *mfib_table;
650 int verbose, matching;
651 ip6_address_t grp, src = {{0}};
652 u32 mask = 128, cover;
653 int table_id = -1, fib_index = ~0;
659 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
661 if (unformat (input, "brief") || unformat (input, "summary")
662 || unformat (input, "sum"))
665 else if (unformat (input, "%U %U",
666 unformat_ip6_address, &src,
667 unformat_ip6_address, &grp))
672 else if (unformat (input, "%U/%d", unformat_ip6_address, &grp, &mask))
674 clib_memset(&src, 0, sizeof(src));
677 else if (unformat (input, "%U", unformat_ip6_address, &grp))
679 clib_memset(&src, 0, sizeof(src));
683 else if (unformat (input, "table %d", &table_id))
685 else if (unformat (input, "index %d", &fib_index))
687 else if (unformat (input, "cover"))
693 pool_foreach (mfib_table, im6->mfibs)
695 ip6_mfib_t *mfib = &mfib_table->v6;
697 if (table_id >= 0 && table_id != (int)mfib->table_id)
699 if (fib_index != ~0 && fib_index != (int)mfib->index)
702 vlib_cli_output (vm, "%U, fib_index %d",
703 format_mfib_table_name, mfib->index, FIB_PROTOCOL_IP6,
709 /* vlib_cli_output (vm, "%=20s%=16s", "Prefix length", "Count"); */
710 /* for (i = 0; i < ARRAY_LEN (mfib->fib_entry_by_dst_address); i++) */
712 /* uword * hash = mfib->fib_entry_by_dst_address[i]; */
713 /* uword n_elts = hash_elts (hash); */
714 /* if (n_elts > 0) */
715 /* vlib_cli_output (vm, "%20d%16d", i, n_elts); */
722 ip6_mfib_table_show_all(mfib, vm);
726 ip6_mfib_table_show_one(mfib, vm, &src, &grp, mask, cover);
733 /* clang-format off */
735 * This command displays the IPv6 Multicast FIB Tables (VRF Tables) and
736 * the route entries for each table.
738 * @note This command will run for a long time when the FIB tables are
739 * comprised of millions of entries. For those scenarios, consider displaying
740 * a single table or summary mode.
743 * Example of how to display all the IPv6 Multicast FIB tables:
744 * @cliexstart{show ip6 mfib}
745 * ipv6-VRF:0, fib_index 0
746 * (*, 0.0.0.0/0): flags:D,
748 * multicast-ip6-chain
752 * test-eth1: Forward,
753 * test-eth2: Forward,
755 * multicast-ip6-chain
756 * [@2]: dpo-replicate: [index:1 buckets:2 to:[0:0]]
757 * [0] [@1]: ipv6-mcast: test-eth1: IP6: d0:d1:d2:d3:d4:01 -> 01:00:05:00:00:00
758 * [1] [@1]: ipv6-mcast: test-eth2: IP6: d0:d1:d2:d3:d4:02 -> 01:00:05:00:00:00
761 * Example of how to display a summary of all IPv6 Multicast FIB tables:
762 * @cliexstart{show ip6 mfib summary}
763 * ipv6-VRF:0, fib_index 0, flow hash: src dst sport dport proto
764 * Prefix length Count
768 * ipv6-VRF:7, fib_index 1, flow hash: src dst sport dport proto
769 * Prefix length Count
776 /* clang-format on */
/*
 * Registers ip6_show_mfib() as the handler for the "show ip6 mfib" CLI path.
 * NOTE(review): short_help starts with "show ip mfib" while the registered
 * path is "show ip6 mfib"; the help text looks like it is missing the "6".
 */
777 VLIB_CLI_COMMAND (ip6_show_fib_command, static) = {
778 .path = "show ip6 mfib",
779 .short_help = "show ip mfib [summary] [table <table-id>] [index <fib-id>] [<grp-addr>[/<mask>]] [<grp-addr>] [<src-addr> <grp-addr>]",
780 .function = ip6_show_mfib,
/*
 * Init function that sets up the shared bihash (ip6_mfib_table.ip6_mhash)
 * with IP6_MFIB_DEFAULT_HASH_NUM_BUCKETS buckets and
 * IP6_MFIB_DEFAULT_HASH_MEMORY_SIZE bytes of memory. The registration below
 * orders it before "ip6_lookup_init".
 */
783 static clib_error_t *
784 ip6_mfib_init (vlib_main_t * vm)
786 clib_bihash_init_40_8 (&ip6_mfib_table.ip6_mhash,
788 IP6_MFIB_DEFAULT_HASH_NUM_BUCKETS,
789 IP6_MFIB_DEFAULT_HASH_MEMORY_SIZE);
794 VLIB_INIT_FUNCTION (ip6_mfib_init) =
796 .runs_before = VLIB_INITS("ip6_lookup_init"),