2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vnet/fib/fib_table.h>
17 #include <vnet/fib/fib_entry.h>
18 #include <vnet/fib/ip4_fib.h>
21 * A table of prefixes to be added to tables and the sources for them
23 typedef struct ip4_fib_table_special_prefix_t_ {
/* Prefix of the special entry. Users of the table copy it and convert the
 * IPv4 address with clib_host_to_net_u32() before passing it to the FIB. */
24 fib_prefix_t ift_prefix;
/* Source passed to fib_table_entry_special_add() when the entry is added
 * and to fib_table_entry_special_remove() when it is removed. */
25 fib_source_t ift_source;
/* Entry flag passed to fib_table_entry_special_add(). */
26 fib_entry_flag_t ift_flag;
27 } ip4_fib_table_special_prefix_t;
29 static const ip4_fib_table_special_prefix_t ip4_specials[] = {
37 .fp_proto = FIB_PROTOCOL_IP4,
39 .ift_source = FIB_SOURCE_DEFAULT_ROUTE,
40 .ift_flag = FIB_ENTRY_FLAG_DROP,
49 .fp_proto = FIB_PROTOCOL_IP4,
51 .ift_source = FIB_SOURCE_DEFAULT_ROUTE,
52 .ift_flag = FIB_ENTRY_FLAG_DROP,
61 .ip4.data_u32 = 0xf0000000,
64 .fp_proto = FIB_PROTOCOL_IP4,
66 .ift_source = FIB_SOURCE_SPECIAL,
67 .ift_flag = FIB_ENTRY_FLAG_DROP,
77 .ip4.data_u32 = 0xe0000000,
80 .fp_proto = FIB_PROTOCOL_IP4,
82 .ift_source = FIB_SOURCE_SPECIAL,
83 .ift_flag = FIB_ENTRY_FLAG_DROP,
88 * drop, but we'll allow it to be usurped by the likes of DHCP
92 .ip4.data_u32 = 0xffffffff,
95 .fp_proto = FIB_PROTOCOL_IP4,
97 .ift_source = FIB_SOURCE_DEFAULT_ROUTE,
98 .ift_flag = FIB_ENTRY_FLAG_DROP,
104 ip4_create_fib_with_table_id (u32 table_id,
107 fib_table_t *fib_table;
111 pool_get(ip4_main.fibs, fib_table);
112 clib_memset(fib_table, 0, sizeof(*fib_table));
114 old_heap = clib_mem_set_heap (ip4_main.mtrie_mheap);
115 pool_get_aligned(ip4_main.v4_fibs, v4_fib, CLIB_CACHE_LINE_BYTES);
116 clib_mem_set_heap (old_heap);
118 ASSERT((fib_table - ip4_main.fibs) ==
119 (v4_fib - ip4_main.v4_fibs));
121 fib_table->ft_proto = FIB_PROTOCOL_IP4;
122 fib_table->ft_index =
124 (fib_table - ip4_main.fibs);
126 hash_set (ip4_main.fib_index_by_table_id, table_id, fib_table->ft_index);
128 fib_table->ft_table_id =
131 fib_table->ft_flow_hash_config = IP_FLOW_HASH_DEFAULT;
133 fib_table_lock(fib_table->ft_index, FIB_PROTOCOL_IP4, src);
135 ip4_mtrie_init(&v4_fib->mtrie);
138 * add the special entries into the new FIB
142 for (ii = 0; ii < ARRAY_LEN(ip4_specials); ii++)
144 fib_prefix_t prefix = ip4_specials[ii].ift_prefix;
146 prefix.fp_addr.ip4.data_u32 =
147 clib_host_to_net_u32(prefix.fp_addr.ip4.data_u32);
149 fib_table_entry_special_add(fib_table->ft_index,
151 ip4_specials[ii].ift_source,
152 ip4_specials[ii].ift_flag);
155 return (fib_table->ft_index);
159 ip4_fib_table_destroy (u32 fib_index)
161 fib_table_t *fib_table = pool_elt_at_index(ip4_main.fibs, fib_index);
162 ip4_fib_t *v4_fib = pool_elt_at_index(ip4_main.v4_fibs, fib_index);
167 * remove all the specials we added when the table was created.
168 * In reverse order so the default route is last.
170 for (ii = ARRAY_LEN(ip4_specials) - 1; ii >= 0; ii--)
172 fib_prefix_t prefix = ip4_specials[ii].ift_prefix;
174 prefix.fp_addr.ip4.data_u32 =
175 clib_host_to_net_u32(prefix.fp_addr.ip4.data_u32);
177 fib_table_entry_special_remove(fib_table->ft_index,
179 ip4_specials[ii].ift_source);
183 * validate no more routes.
185 ASSERT(0 == fib_table->ft_total_route_counts);
187 vec_foreach(n_locks, fib_table->ft_src_route_counts)
189 ASSERT(0 == *n_locks);
192 if (~0 != fib_table->ft_table_id)
194 hash_unset (ip4_main.fib_index_by_table_id, fib_table->ft_table_id);
197 vec_free(fib_table->ft_src_route_counts);
198 ip4_mtrie_free(&v4_fib->mtrie);
200 pool_put(ip4_main.v4_fibs, v4_fib);
201 pool_put(ip4_main.fibs, fib_table);
206 ip4_fib_table_find_or_create_and_lock (u32 table_id,
211 index = ip4_fib_index_from_table_id(table_id);
213 return ip4_create_fib_with_table_id(table_id, src);
215 fib_table_lock(index, FIB_PROTOCOL_IP4, src);
221 ip4_fib_table_create_and_lock (fib_source_t src)
223 return (ip4_create_fib_with_table_id(~0, src));
227 ip4_fib_table_get_index_for_sw_if_index (u32 sw_if_index)
229 if (sw_if_index >= vec_len(ip4_main.fib_index_by_sw_if_index))
232 * This is the case for interfaces that are not yet mapped to
237 return (ip4_main.fib_index_by_sw_if_index[sw_if_index]);
241 * ip4_fib_table_lookup_exact_match
243 * Exact match prefix lookup
246 ip4_fib_table_lookup_exact_match (const ip4_fib_t *fib,
247 const ip4_address_t *addr,
250 uword * hash, * result;
253 hash = fib->fib_entry_by_dst_address[len];
254 key = (addr->data_u32 & ip4_main.fib_masks[len]);
256 result = hash_get(hash, key);
258 if (NULL != result) {
261 return (FIB_NODE_INDEX_INVALID);
265 * ip4_fib_table_lookup_lb
267 * Longest prefix match
270 ip4_fib_table_lookup_lb (ip4_fib_t *fib,
271 const ip4_address_t *addr)
273 fib_node_index_t fei;
275 fei = ip4_fib_table_lookup(fib, addr, 32);
277 if (FIB_NODE_INDEX_INVALID != fei)
281 dpo = fib_entry_contribute_ip_forwarding(fei);
283 return (dpo->dpoi_index);
285 return (INDEX_INVALID);
289 * ip4_fib_table_lookup
291 * Longest prefix match
294 ip4_fib_table_lookup (const ip4_fib_t *fib,
295 const ip4_address_t *addr,
298 uword * hash, * result;
302 for (mask_len = len; mask_len >= 0; mask_len--)
304 hash = fib->fib_entry_by_dst_address[mask_len];
305 key = (addr->data_u32 & ip4_main.fib_masks[mask_len]);
307 result = hash_get (hash, key);
309 if (NULL != result) {
313 return (FIB_NODE_INDEX_INVALID);
317 ip4_fib_table_entry_insert (ip4_fib_t *fib,
318 const ip4_address_t *addr,
320 fib_node_index_t fib_entry_index)
322 uword * hash, * result;
325 key = (addr->data_u32 & ip4_main.fib_masks[len]);
326 hash = fib->fib_entry_by_dst_address[len];
327 result = hash_get (hash, key);
329 if (NULL == result) {
334 old_heap = clib_mem_set_heap (ip4_main.mtrie_mheap);
337 hash = hash_create (32 /* elts */, sizeof (uword));
338 hash_set_flags (hash, HASH_FLAG_NO_AUTO_SHRINK);
341 hash = hash_set(hash, key, fib_entry_index);
342 fib->fib_entry_by_dst_address[len] = hash;
343 clib_mem_set_heap (old_heap);
352 ip4_fib_table_entry_remove (ip4_fib_t *fib,
353 const ip4_address_t *addr,
356 uword * hash, * result;
359 key = (addr->data_u32 & ip4_main.fib_masks[len]);
360 hash = fib->fib_entry_by_dst_address[len];
361 result = hash_get (hash, key);
366 * removing a non-existent entry. i'll allow it.
373 old_heap = clib_mem_set_heap (ip4_main.mtrie_mheap);
374 hash_unset(hash, key);
375 clib_mem_set_heap (old_heap);
378 fib->fib_entry_by_dst_address[len] = hash;
382 ip4_fib_table_fwding_dpo_update (ip4_fib_t *fib,
383 const ip4_address_t *addr,
387 ip4_fib_mtrie_route_add(&fib->mtrie, addr, len, dpo->dpoi_index);
391 ip4_fib_table_fwding_dpo_remove (ip4_fib_t *fib,
392 const ip4_address_t *addr,
397 const fib_prefix_t *cover_prefix;
398 const dpo_id_t *cover_dpo;
401 * We need to pass the MTRIE the LB index and address length of the
402 * covering prefix, so it can fill the plys with the correct replacement
403 * for the entry being removed
405 cover_prefix = fib_entry_get_prefix(cover_index);
406 cover_dpo = fib_entry_contribute_ip_forwarding(cover_index);
408 ip4_fib_mtrie_route_del(&fib->mtrie,
409 addr, len, dpo->dpoi_index,
410 cover_prefix->fp_len,
411 cover_dpo->dpoi_index);
415 ip4_fib_table_walk (ip4_fib_t *fib,
416 fib_table_walk_fn_t fn,
419 fib_prefix_t root = {
420 .fp_proto = FIB_PROTOCOL_IP4,
421 // address and length default to all 0
425 * A full tree walk is the degenerate case of a sub-tree from
428 return (ip4_fib_table_sub_tree_walk(fib, &root, fn, ctx));
432 ip4_fib_table_sub_tree_walk (ip4_fib_t *fib,
433 const fib_prefix_t *root,
434 fib_table_walk_fn_t fn,
437 fib_prefix_t *sub_trees = NULL;
441 * There is no efficient way to walk this array of hash tables,
442 * so we walk each table with a mask length greater than or equal to
443 * the required root and check it is covered by the root.
445 for (i = root->fp_len;
446 i < ARRAY_LEN (fib->fib_entry_by_dst_address);
449 uword * hash = fib->fib_entry_by_dst_address[i];
456 hash_foreach_pair (p, hash,
459 if (ip4_destination_matches_route(&ip4_main,
464 const fib_prefix_t *sub_tree;
468 * exclude sub-trees the walk does not want to explore
470 vec_foreach(sub_tree, sub_trees)
472 if (ip4_destination_matches_route(&ip4_main,
474 &sub_tree->fp_addr.ip4,
484 switch (fn(p->value[0], ctx))
486 case FIB_TABLE_WALK_CONTINUE:
488 case FIB_TABLE_WALK_SUB_TREE_STOP: {
490 .fp_proto = FIB_PROTOCOL_IP4,
494 vec_add1(sub_trees, pfx);
497 case FIB_TABLE_WALK_STOP:
513 typedef struct ip4_fib_show_walk_ctx_t_
515 fib_node_index_t *ifsw_indicies;
516 } ip4_fib_show_walk_ctx_t;
518 static fib_table_walk_rc_t
519 ip4_fib_show_walk_cb (fib_node_index_t fib_entry_index,
522 ip4_fib_show_walk_ctx_t *ctx = arg;
524 vec_add1(ctx->ifsw_indicies, fib_entry_index);
526 return (FIB_TABLE_WALK_CONTINUE);
530 ip4_fib_table_show_all (ip4_fib_t *fib,
533 ip4_fib_show_walk_ctx_t ctx = {
534 .ifsw_indicies = NULL,
536 fib_node_index_t *fib_entry_index;
538 ip4_fib_table_walk(fib, ip4_fib_show_walk_cb, &ctx);
539 vec_sort_with_function(ctx.ifsw_indicies,
540 fib_entry_cmp_for_sort);
542 vec_foreach(fib_entry_index, ctx.ifsw_indicies)
544 vlib_cli_output(vm, "%U",
547 FIB_ENTRY_FORMAT_BRIEF);
550 vec_free(ctx.ifsw_indicies);
554 ip4_fib_table_show_one (ip4_fib_t *fib,
556 ip4_address_t *address,
560 vlib_cli_output(vm, "%U",
562 ip4_fib_table_lookup(fib, address, mask_len),
564 FIB_ENTRY_FORMAT_DETAIL2 :
565 FIB_ENTRY_FORMAT_DETAIL));
569 format_ip4_fib_table_memory (u8 * s, va_list * args)
571 #if USE_DLMALLOC == 0
572 s = format(s, "%=30s %=6d %=12ld\n",
574 pool_elts(ip4_main.fibs),
575 mheap_bytes(ip4_main.mtrie_mheap));
577 s = format(s, "%=30s %=6d %=12ld\n",
579 pool_elts(ip4_main.fibs),
580 mspace_footprint(ip4_main.mtrie_mheap));
587 static clib_error_t *
588 ip4_show_fib (vlib_main_t * vm,
589 unformat_input_t * input,
590 vlib_cli_command_t * cmd)
592 ip4_main_t * im4 = &ip4_main;
593 fib_table_t * fib_table;
594 u64 total_mtrie_memory, total_hash_memory;
595 int verbose, matching, mtrie, memory;
596 ip4_address_t matching_address;
597 u32 matching_mask = 32;
598 int i, table_id = -1, fib_index = ~0;
602 matching = mtrie = memory = 0;
603 total_hash_memory = total_mtrie_memory = 0;
605 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
607 if (unformat (input, "brief") || unformat (input, "summary")
608 || unformat (input, "sum"))
611 else if (unformat (input, "detail") || unformat (input, "det"))
614 else if (unformat (input, "mtrie"))
617 else if (unformat (input, "mem") ||
618 unformat (input, "memory"))
621 else if (unformat (input, "%U/%d",
622 unformat_ip4_address, &matching_address, &matching_mask))
625 else if (unformat (input, "%U", unformat_ip4_address, &matching_address))
628 else if (unformat (input, "table %d", &table_id))
630 else if (unformat (input, "index %d", &fib_index))
636 pool_foreach (fib_table, im4->fibs,
638 ip4_fib_t *fib = pool_elt_at_index(im4->v4_fibs, fib_table->ft_index);
642 if (table_id >= 0 && table_id != (int)fib->table_id)
644 if (fib_index != ~0 && fib_index != (int)fib->index)
649 uword mtrie_size, hash_size, *old_heap;
652 mtrie_size = ip4_fib_mtrie_memory_usage(&fib->mtrie);
655 old_heap = clib_mem_set_heap (ip4_main.mtrie_mheap);
656 for (i = 0; i < ARRAY_LEN (fib->fib_entry_by_dst_address); i++)
658 uword * hash = fib->fib_entry_by_dst_address[i];
661 hash_size += hash_bytes(hash);
664 clib_mem_set_heap (old_heap);
667 vlib_cli_output (vm, "%U mtrie:%d hash:%d",
668 format_fib_table_name, fib->index,
672 total_mtrie_memory += mtrie_size;
673 total_hash_memory += hash_size;
677 s = format(s, "%U, fib_index:%d, flow hash:[%U] epoch:%d flags:%U locks:[",
678 format_fib_table_name, fib->index,
681 format_ip_flow_hash_config,
682 fib_table->ft_flow_hash_config,
684 format_fib_table_flags, fib_table->ft_flags);
685 vec_foreach_index(source, fib_table->ft_locks)
687 if (0 != fib_table->ft_locks[source])
689 s = format(s, "%U:%d, ",
690 format_fib_source, source,
691 fib_table->ft_locks[source]);
695 vlib_cli_output (vm, "%v", s);
701 vlib_cli_output (vm, "%U", format_ip4_fib_mtrie, &fib->mtrie, verbose);
706 vlib_cli_output (vm, "%=20s%=16s", "Prefix length", "Count");
707 for (i = 0; i < ARRAY_LEN (fib->fib_entry_by_dst_address); i++)
709 uword * hash = fib->fib_entry_by_dst_address[i];
710 uword n_elts = hash_elts (hash);
712 vlib_cli_output (vm, "%20d%16d", i, n_elts);
719 ip4_fib_table_show_all(fib, vm);
723 ip4_fib_table_show_one(fib, vm, &matching_address,
724 matching_mask, detail);
730 vlib_cli_output (vm, "totals: mtrie:%ld hash:%ld all:%ld",
733 total_mtrie_memory + total_hash_memory);
734 vlib_cli_output (vm, "\nMtrie Mheap Usage: %U\n",
735 format_mheap, ip4_main.mtrie_mheap, 1);
741 * This command displays the IPv4 FIB Tables (VRF Tables) and the route
742 * entries for each table.
744 * @note This command will run for a long time when the FIB tables are
745 * comprised of millions of entries. For those scenarios, consider displaying
746 * a single table or summary mode.
749 * Example of how to display all the IPv4 FIB tables:
750 * @cliexstart{show ip fib}
751 * ipv4-VRF:0, fib_index 0, flow hash: src dst sport dport proto
754 * [@0]: dpo-load-balance: [index:0 buckets:1 uRPF:0 to:[0:0]]
755 * [0] [@0]: dpo-drop ip6
758 * [@0]: dpo-load-balance: [index:1 buckets:1 uRPF:1 to:[0:0]]
759 * [0] [@0]: dpo-drop ip6
762 * [@0]: dpo-load-balance: [index:30 buckets:1 uRPF:29 to:[0:0]]
763 * [0] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
766 * [@0]: dpo-load-balance: [index:31 buckets:4 uRPF:30 to:[0:0]]
767 * [0] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
768 * [1] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
769 * [2] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
770 * [3] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
773 * [@0]: dpo-load-balance: [index:3 buckets:1 uRPF:3 to:[0:0]]
774 * [0] [@0]: dpo-drop ip6
777 * [@0]: dpo-load-balance: [index:2 buckets:1 uRPF:2 to:[0:0]]
778 * [0] [@0]: dpo-drop ip6
781 * [@0]: dpo-load-balance: [index:4 buckets:1 uRPF:4 to:[0:0]]
782 * [0] [@0]: dpo-drop ip6
783 * ipv4-VRF:7, fib_index 1, flow hash: src dst sport dport proto
786 * [@0]: dpo-load-balance: [index:12 buckets:1 uRPF:11 to:[0:0]]
787 * [0] [@0]: dpo-drop ip6
790 * [@0]: dpo-load-balance: [index:13 buckets:1 uRPF:12 to:[0:0]]
791 * [0] [@0]: dpo-drop ip6
794 * [@0]: dpo-load-balance: [index:17 buckets:1 uRPF:16 to:[0:0]]
795 * [0] [@4]: ipv4-glean: af_packet0
798 * [@0]: dpo-load-balance: [index:18 buckets:1 uRPF:17 to:[1:84]]
799 * [0] [@2]: dpo-receive: 172.16.1.1 on af_packet0
802 * [@0]: dpo-load-balance: [index:21 buckets:1 uRPF:20 to:[0:0]]
803 * [0] [@5]: ipv4 via 172.16.1.2 af_packet0: IP4: 02:fe:9e:70:7a:2b -> 26:a5:f6:9c:3a:36
806 * [@0]: dpo-load-balance: [index:19 buckets:1 uRPF:18 to:[0:0]]
807 * [0] [@4]: ipv4-glean: af_packet1
810 * [@0]: dpo-load-balance: [index:20 buckets:1 uRPF:19 to:[0:0]]
811 * [0] [@2]: dpo-receive: 172.16.2.1 on af_packet1
814 * [@0]: dpo-load-balance: [index:15 buckets:1 uRPF:14 to:[0:0]]
815 * [0] [@0]: dpo-drop ip6
818 * [@0]: dpo-load-balance: [index:14 buckets:1 uRPF:13 to:[0:0]]
819 * [0] [@0]: dpo-drop ip6
822 * [@0]: dpo-load-balance: [index:16 buckets:1 uRPF:15 to:[0:0]]
823 * [0] [@0]: dpo-drop ip6
825 * Example of how to display a single IPv4 FIB table:
826 * @cliexstart{show ip fib table 7}
827 * ipv4-VRF:7, fib_index 1, flow hash: src dst sport dport proto
830 * [@0]: dpo-load-balance: [index:12 buckets:1 uRPF:11 to:[0:0]]
831 * [0] [@0]: dpo-drop ip6
834 * [@0]: dpo-load-balance: [index:13 buckets:1 uRPF:12 to:[0:0]]
835 * [0] [@0]: dpo-drop ip6
838 * [@0]: dpo-load-balance: [index:17 buckets:1 uRPF:16 to:[0:0]]
839 * [0] [@4]: ipv4-glean: af_packet0
842 * [@0]: dpo-load-balance: [index:18 buckets:1 uRPF:17 to:[1:84]]
843 * [0] [@2]: dpo-receive: 172.16.1.1 on af_packet0
846 * [@0]: dpo-load-balance: [index:21 buckets:1 uRPF:20 to:[0:0]]
847 * [0] [@5]: ipv4 via 172.16.1.2 af_packet0: IP4: 02:fe:9e:70:7a:2b -> 26:a5:f6:9c:3a:36
850 * [@0]: dpo-load-balance: [index:19 buckets:1 uRPF:18 to:[0:0]]
851 * [0] [@4]: ipv4-glean: af_packet1
854 * [@0]: dpo-load-balance: [index:20 buckets:1 uRPF:19 to:[0:0]]
855 * [0] [@2]: dpo-receive: 172.16.2.1 on af_packet1
858 * [@0]: dpo-load-balance: [index:15 buckets:1 uRPF:14 to:[0:0]]
859 * [0] [@0]: dpo-drop ip6
862 * [@0]: dpo-load-balance: [index:14 buckets:1 uRPF:13 to:[0:0]]
863 * [0] [@0]: dpo-drop ip6
866 * [@0]: dpo-load-balance: [index:16 buckets:1 uRPF:15 to:[0:0]]
867 * [0] [@0]: dpo-drop ip6
869 * Example of how to display a summary of all IPv4 FIB tables:
870 * @cliexstart{show ip fib summary}
871 * ipv4-VRF:0, fib_index 0, flow hash: src dst sport dport proto
872 * Prefix length Count
876 * ipv4-VRF:7, fib_index 1, flow hash: src dst sport dport proto
877 * Prefix length Count
885 VLIB_CLI_COMMAND (ip4_show_fib_command, static) = {
886 .path = "show ip fib",
887 .short_help = "show ip fib [summary] [table <table-id>] [index <fib-id>] [<ip4-addr>[/<mask>]] [mtrie] [detail]",
888 .function = ip4_show_fib,