2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vnet/adj/adj_nbr.h>
17 #include <vnet/adj/adj_internal.h>
18 #include <vnet/ethernet/arp_packet.h>
19 #include <vnet/fib/fib_walk.h>
22 * Vector Hash tables of neighbour (traditional) adjacencies
23 * Key: interface(for the vector index), address (and its proto),
24 * link-type/ether-type.
26 static uword **adj_nbr_tables[FIB_PROTOCOL_IP_MAX];
28 typedef struct adj_nbr_key_t_
30 ip46_address_t ank_ip;
34 #define ADJ_NBR_SET_KEY(_key, _lt, _nh) \
36 ip46_address_copy(&(_key).ank_ip, (_nh)); \
37 _key.ank_linkt = (_lt); \
40 #define ADJ_NBR_ITF_OK(_proto, _itf) \
41 (((_itf) < vec_len(adj_nbr_tables[_proto])) && \
42 (NULL != adj_nbr_tables[_proto][(_itf)]))
44 #define ADJ_NBR_ASSERT_NH_PROTO(nh_proto, err) \
46 ASSERT (nh_proto < FIB_PROTOCOL_IP_MAX); \
47 const fib_protocol_t nh_proto__ = (nh_proto); \
48 if (nh_proto__ >= FIB_PROTOCOL_IP_MAX) \
50 clib_warning ("BUG: protocol %d > %d\n", \
52 FIB_PROTOCOL_IP_MAX); \
58 adj_nbr_insert (fib_protocol_t nh_proto,
59 vnet_link_t link_type,
60 const ip46_address_t *nh_addr,
62 adj_index_t adj_index)
66 ADJ_NBR_ASSERT_NH_PROTO (nh_proto,);
68 if (sw_if_index >= vec_len(adj_nbr_tables[nh_proto]))
70 vec_validate(adj_nbr_tables[nh_proto], sw_if_index);
72 if (NULL == adj_nbr_tables[nh_proto][sw_if_index])
74 adj_nbr_tables[nh_proto][sw_if_index] =
75 hash_create_mem(0, sizeof(adj_nbr_key_t), sizeof(adj_index_t));
78 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
80 hash_set_mem_alloc (&adj_nbr_tables[nh_proto][sw_if_index],
85 adj_nbr_remove (adj_index_t ai,
86 fib_protocol_t nh_proto,
87 vnet_link_t link_type,
88 const ip46_address_t *nh_addr,
93 ADJ_NBR_ASSERT_NH_PROTO (nh_proto,);
95 if (!ADJ_NBR_ITF_OK(nh_proto, sw_if_index))
98 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
100 hash_unset_mem_free(&adj_nbr_tables[nh_proto][sw_if_index], &kv);
102 if (0 == hash_elts(adj_nbr_tables[nh_proto][sw_if_index]))
104 hash_free(adj_nbr_tables[nh_proto][sw_if_index]);
108 typedef struct adj_nbr_get_n_adjs_walk_ctx_t_
112 } adj_nbr_get_n_adjs_walk_ctx_t;
115 adj_nbr_get_n_adjs_walk (adj_index_t ai,
118 adj_nbr_get_n_adjs_walk_ctx_t *ctx = data;
119 const ip_adjacency_t *adj;
123 if (ctx->linkt == adj->ia_link)
126 return (ADJ_WALK_RC_CONTINUE);
130 adj_nbr_get_n_adjs (vnet_link_t link_type, u32 sw_if_index)
132 adj_nbr_get_n_adjs_walk_ctx_t ctx = {
135 fib_protocol_t fproto;
137 FOR_EACH_FIB_IP_PROTOCOL(fproto)
139 adj_nbr_walk (sw_if_index,
141 adj_nbr_get_n_adjs_walk,
149 adj_nbr_find (fib_protocol_t nh_proto,
150 vnet_link_t link_type,
151 const ip46_address_t *nh_addr,
157 ADJ_NBR_ASSERT_NH_PROTO (nh_proto, ADJ_INDEX_INVALID);
159 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
161 if (!ADJ_NBR_ITF_OK(nh_proto, sw_if_index))
162 return (ADJ_INDEX_INVALID);
164 p = hash_get_mem(adj_nbr_tables[nh_proto][sw_if_index], &kv);
170 return (ADJ_INDEX_INVALID);
174 adj_get_nd_node (fib_protocol_t proto)
177 case FIB_PROTOCOL_IP4:
178 return (ip4_arp_node.index);
179 case FIB_PROTOCOL_IP6:
180 return (ip6_discover_neighbor_node.index);
181 case FIB_PROTOCOL_MPLS:
185 return (ip4_arp_node.index);
189 * @brief Check and set feature flags if o/p interface has any o/p features.
192 adj_nbr_evaluate_feature (adj_index_t ai)
195 vnet_feature_main_t *fm = &feature_main;
202 switch (adj->ia_link)
205 arc_index = ip4_main.lookup_main.output_feature_arc_index;
208 arc_index = ip6_main.lookup_main.output_feature_arc_index;
211 arc_index = mpls_main.output_feature_arc_index;
217 sw_if_index = adj->rewrite_header.sw_if_index;
218 if (vec_len(fm->feature_count_by_sw_if_index[arc_index]) > sw_if_index)
220 feature_count = fm->feature_count_by_sw_if_index[arc_index][sw_if_index];
221 if (feature_count > 0)
223 vnet_feature_config_main_t *cm;
225 adj->rewrite_header.flags |= VNET_REWRITE_HAS_FEATURES;
226 cm = &fm->feature_config_mains[arc_index];
228 adj->ia_cfg_index = vec_elt (cm->config_index_by_sw_if_index,
235 static ip_adjacency_t*
236 adj_nbr_alloc (fib_protocol_t nh_proto,
237 vnet_link_t link_type,
238 const ip46_address_t *nh_addr,
243 adj = adj_alloc(nh_proto);
245 adj_nbr_insert(nh_proto, link_type, nh_addr,
250 * since we just added the ADJ we have no rewrite string for it,
253 adj->lookup_next_index = IP_LOOKUP_NEXT_ARP;
254 adj->sub_type.nbr.next_hop = *nh_addr;
255 adj->ia_link = link_type;
256 adj->ia_nh_proto = nh_proto;
257 adj->rewrite_header.sw_if_index = sw_if_index;
258 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
259 &adj->rewrite_header);
261 adj_nbr_evaluate_feature (adj_get_index(adj));
266 adj_nbr_set_mtu (adj_index_t adj_index, u16 mtu)
270 ASSERT(ADJ_INDEX_INVALID != adj_index);
272 adj = adj_get(adj_index);
275 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
276 &adj->rewrite_header);
279 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
280 &adj->rewrite_header);
281 adj->rewrite_header.max_l3_packet_bytes =
282 clib_min (adj->rewrite_header.max_l3_packet_bytes, mtu);
287 * adj_nbr_add_or_lock
289 * Add an adjacency for the neighbour requested.
291 * The key for an adj is:
292 * - the Next-hops protocol (i.e. v4 or v6)
293 * - the address of the next-hop
294 * - the interface the next-hop is reachable through
297 adj_nbr_add_or_lock (fib_protocol_t nh_proto,
298 vnet_link_t link_type,
299 const ip46_address_t *nh_addr,
302 adj_index_t adj_index;
304 adj_index = adj_nbr_find(nh_proto, link_type, nh_addr, sw_if_index);
306 if (ADJ_INDEX_INVALID == adj_index)
311 vnm = vnet_get_main();
312 adj = adj_nbr_alloc(nh_proto, link_type, nh_addr, sw_if_index);
313 adj_index = adj_get_index(adj);
316 if (ip46_address_is_equal(&ADJ_BCAST_ADDR, nh_addr))
318 adj->lookup_next_index = IP_LOOKUP_NEXT_BCAST;
321 vnet_rewrite_init(vnm, sw_if_index, link_type,
322 adj_get_nd_node(nh_proto),
323 vnet_tx_node_index_for_sw_interface(vnm, sw_if_index),
324 &adj->rewrite_header);
327 * we need a rewrite where the destination IP address is converted
328 * to the appropriate link-layer address. This is interface specific.
329 * So ask the interface to do it.
331 vnet_update_adjacency_for_sw_interface(vnm, sw_if_index, adj_index);
332 adj_delegate_adj_created(adj_get(adj_index));
343 adj_nbr_add_or_lock_w_rewrite (fib_protocol_t nh_proto,
344 vnet_link_t link_type,
345 const ip46_address_t *nh_addr,
349 adj_index_t adj_index;
351 adj_index = adj_nbr_find(nh_proto, link_type, nh_addr, sw_if_index);
353 if (ADJ_INDEX_INVALID == adj_index)
357 adj = adj_nbr_alloc(nh_proto, link_type, nh_addr, sw_if_index);
358 adj->rewrite_header.sw_if_index = sw_if_index;
359 adj_index = adj_get_index(adj);
363 adj_nbr_update_rewrite(adj_index,
364 ADJ_NBR_REWRITE_FLAG_COMPLETE,
367 adj_delegate_adj_created(adj_get(adj_index));
373 * adj_nbr_update_rewrite
375 * Update the adjacency's rewrite string. A NULL string implies the
376 * rewrite is reset (i.e. when ARP/ND entry is gone).
377 * NB: the adj being updated may be handling traffic in the DP.
380 adj_nbr_update_rewrite (adj_index_t adj_index,
381 adj_nbr_rewrite_flag_t flags,
386 ASSERT(ADJ_INDEX_INVALID != adj_index);
388 adj = adj_get(adj_index);
390 if (flags & ADJ_NBR_REWRITE_FLAG_COMPLETE)
393 * update the adj's rewrite string and build the arc
394 * from the rewrite node to the interface's TX node
396 adj_nbr_update_rewrite_internal(adj, IP_LOOKUP_NEXT_REWRITE,
397 adj_get_rewrite_node(adj->ia_link),
398 vnet_tx_node_index_for_sw_interface(
400 adj->rewrite_header.sw_if_index),
405 adj_nbr_update_rewrite_internal(adj, IP_LOOKUP_NEXT_ARP,
406 adj_get_nd_node(adj->ia_nh_proto),
407 vnet_tx_node_index_for_sw_interface(
409 adj->rewrite_header.sw_if_index),
415 * adj_nbr_update_rewrite_internal
417 * Update the adjacency's rewrite string. A NULL string implies the
418 * rewrite is reset (i.e. when ARP/ND entry is gone).
419 * NB: the adj being updated may be handling traffic in the DP.
422 adj_nbr_update_rewrite_internal (ip_adjacency_t *adj,
423 ip_lookup_next_t adj_next_index,
428 ip_adjacency_t *walk_adj;
429 adj_index_t walk_ai, ai;
434 vm = vlib_get_main();
435 old_next = adj->lookup_next_index;
437 ai = walk_ai = adj_get_index(adj);
438 if (VNET_LINK_MPLS == adj->ia_link)
441 * The link type MPLS has no children in the control plane graph, it only
442 * has children in the data-plane graph. The backwalk is up the former.
443 * So we need to walk from its IP cousin.
445 walk_ai = adj_nbr_find(adj->ia_nh_proto,
446 fib_proto_to_link(adj->ia_nh_proto),
447 &adj->sub_type.nbr.next_hop,
448 adj->rewrite_header.sw_if_index);
452 * Don't call the walk re-entrantly
454 if (ADJ_INDEX_INVALID != walk_ai)
456 walk_adj = adj_get(walk_ai);
457 if (ADJ_FLAG_SYNC_WALK_ACTIVE & walk_adj->ia_flags)
464 * Prevent re-entrant walk of the same adj
466 walk_adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
476 * lock the adjacencies that are affected by updates this walk will provoke.
477 * Since the aim of the walk is to update children to link to a different
478 * DPO, this adj will no longer be in use and its lock count will drop to 0.
479 * We don't want it to be deleted as part of this endeavour.
485 * Updating a rewrite string is not atomic;
486 * - the rewrite string is too long to write in one instruction
487 * - when swapping from incomplete to complete, we also need to update
488 * the VLIB graph next-index of the adj.
489 * ideally we would only want to suspend forwarding via this adj whilst we
490 * do this, but we do not have that level of granularity - it's suspend all
491 * worker threads or nothing.
492 * The other choices are:
493 * - to mark the adj down and back walk so child load-balances drop this adj
495 * - update the next_node index of this adj to point to error-drop
496 * both of which will mean for MAC change we will drop for this adj
497 * which is not acceptable. However, when the adj changes type (from
498 * complete to incomplete and vice-versa) the child DPOs, which have the
499 * VLIB graph next node index, will be sending packets to the wrong graph
500 * node. So from the options above, updating the next_node of the adj to
501 * be drop will work, but it relies on each graph node v4/v6/mpls, rewrite/
502 * arp/midchain always be valid w.r.t. a mis-match of adj type and node type
503 * (i.e. a rewrite adj in the arp node). This is not enforceable. Getting it
504 * wrong will lead to hard to find bugs since its a race condition. So we
505 * choose the more reliable method of updating the children to use the drop,
506 * then switching adj's type, then updating the children again. Did I mention
507 * that this doesn't happen often...
508 * So we need to distinguish between the two cases:
510 * 2 - adj type change
513 old_next != adj_next_index &&
514 ADJ_INDEX_INVALID != walk_ai)
517 * the adj is changing type. we need to fix all children so that they
518 * stack momentarily on a drop, while the adj changes. If we don't do
519 * this the children will send packets to a VLIB graph node that does
520 * not correspond to the adj's type - and it goes downhill from there.
522 fib_node_back_walk_ctx_t bw_ctx = {
523 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_ADJ_DOWN,
525 * force this walk to be synchronous. if we don't and a node in the graph
526 * (a heavily shared path-list) chooses to back-ground the walk (make it
527 * async) then it will pause and we will do the adj update below, before
528 * all the children are updated. not good.
530 .fnbw_flags = FIB_NODE_BW_FLAG_FORCE_SYNC,
533 fib_walk_sync(FIB_NODE_TYPE_ADJ, walk_ai, &bw_ctx);
535 * fib_walk_sync may allocate a new adjacency and potentially cause a
536 * realloc for adj_pool. When that happens, adj pointer is no longer
537 * valid here. We refresh the adj pointer accordingly.
543 * If we are just updating the MAC string of the adj (which we also can't
544 * do atomically), then we need to stop packets switching through the adj.
545 * We can't do that on a per-adj basis, so it's all the packets.
546 * If we are updating the type, and we walked back to the children above,
547 * then this barrier serves to flush the queues/frames.
549 vlib_worker_thread_barrier_sync(vm);
551 adj->lookup_next_index = adj_next_index;
552 adj->ia_node_index = this_node;
557 * new rewrite provided.
558 * fill in the adj's rewrite string, and build the VLIB graph arc.
560 vnet_rewrite_set_data_internal(&adj->rewrite_header,
561 sizeof(adj->rewrite_data),
568 vnet_rewrite_clear_data_internal(&adj->rewrite_header,
569 sizeof(adj->rewrite_data));
571 adj->rewrite_header.next_index = vlib_node_add_next(vlib_get_main(),
576 * done with the rewrite update - let the workers loose.
578 vlib_worker_thread_barrier_release(vm);
581 (old_next != adj->lookup_next_index) &&
582 (ADJ_INDEX_INVALID != walk_ai))
585 * backwalk to the children so they can stack on the now updated
588 fib_node_back_walk_ctx_t bw_ctx = {
589 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_ADJ_UPDATE,
592 fib_walk_sync(FIB_NODE_TYPE_ADJ, walk_ai, &bw_ctx);
595 * Prevent re-entrant walk of the same adj
599 walk_adj = adj_get(walk_ai);
600 walk_adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
603 adj_delegate_adj_modified(adj_get(ai));
609 adj_nbr_db_size (void)
611 fib_protocol_t proto;
615 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
617 vec_foreach_index(sw_if_index, adj_nbr_tables[proto])
619 if (NULL != adj_nbr_tables[proto][sw_if_index])
621 count += hash_elts(adj_nbr_tables[proto][sw_if_index]);
629 * @brief Walk all adjacencies on a link for a given next-hop protocol
632 adj_nbr_walk (u32 sw_if_index,
633 fib_protocol_t adj_nh_proto,
637 adj_index_t ai, *ais, *aip;
640 ADJ_NBR_ASSERT_NH_PROTO (adj_nh_proto,);
642 if (!ADJ_NBR_ITF_OK(adj_nh_proto, sw_if_index))
647 /* elements may be removed from the table during the walk, so
648 * collect the set first then process them */
649 hash_foreach_mem (key, ai, adj_nbr_tables[adj_nh_proto][sw_if_index],
654 vec_foreach(aip, ais)
656 /* An adj may be deleted during the walk so check first */
657 if (!pool_is_free_index(adj_pool, *aip))
664 * @brief Walk adjacencies on a link with a given v4 next-hop.
665 * that is visit the adjacencies with different link types.
668 adj_nbr_walk_nh4 (u32 sw_if_index,
669 const ip4_address_t *addr,
673 if (!ADJ_NBR_ITF_OK(FIB_PROTOCOL_IP4, sw_if_index))
676 ip46_address_t nh = {
682 FOR_EACH_VNET_LINK(linkt)
684 ai = adj_nbr_find (FIB_PROTOCOL_IP4, linkt, &nh, sw_if_index);
686 if (INDEX_INVALID != ai)
692 * @brief Walk adjacencies on a link with a given v6 next-hop.
693 * that is visit the adjacencies with different link types.
696 adj_nbr_walk_nh6 (u32 sw_if_index,
697 const ip6_address_t *addr,
701 if (!ADJ_NBR_ITF_OK(FIB_PROTOCOL_IP6, sw_if_index))
704 ip46_address_t nh = {
710 FOR_EACH_VNET_LINK(linkt)
712 ai = adj_nbr_find (FIB_PROTOCOL_IP6, linkt, &nh, sw_if_index);
714 if (INDEX_INVALID != ai)
720 * @brief Walk adjacencies on a link with a given next-hop.
721 * that is visit the adjacencies with different link types.
724 adj_nbr_walk_nh (u32 sw_if_index,
725 fib_protocol_t adj_nh_proto,
726 const ip46_address_t *nh,
730 ADJ_NBR_ASSERT_NH_PROTO (adj_nh_proto,);
732 if (!ADJ_NBR_ITF_OK(adj_nh_proto, sw_if_index))
735 switch (adj_nh_proto)
737 case FIB_PROTOCOL_IP4:
738 adj_nbr_walk_nh4(sw_if_index, &nh->ip4, cb, ctx);
740 case FIB_PROTOCOL_IP6:
741 adj_nbr_walk_nh6(sw_if_index, &nh->ip6, cb, ctx);
743 case FIB_PROTOCOL_MPLS:
750 * Flags associated with the interface state walks
752 typedef enum adj_nbr_interface_flags_t_
754 ADJ_NBR_INTERFACE_UP = (1 << 0),
755 } adj_nbr_interface_flags_t;
758 * Context for the state change walk of the DB
760 typedef struct adj_nbr_interface_state_change_ctx_t_
763 * Flags on the interface
765 adj_nbr_interface_flags_t flags;
766 } adj_nbr_interface_state_change_ctx_t;
769 adj_nbr_interface_state_change_one (adj_index_t ai,
773 * Back walk the graph to inform the forwarding entries
774 * that this interface state has changed. Do this synchronously
775 * since this is the walk that provides convergence
777 adj_nbr_interface_state_change_ctx_t *ctx = arg;
778 fib_node_back_walk_ctx_t bw_ctx = {
779 .fnbw_reason = ((ctx->flags & ADJ_NBR_INTERFACE_UP) ?
780 FIB_NODE_BW_REASON_FLAG_INTERFACE_UP :
781 FIB_NODE_BW_REASON_FLAG_INTERFACE_DOWN),
783 * the force sync applies only as far as the first fib_entry.
784 * And it's the fib_entry's we need to converge away from
785 * the adjacencies on the now down link
787 .fnbw_flags = (!(ctx->flags & ADJ_NBR_INTERFACE_UP) ?
788 FIB_NODE_BW_FLAG_FORCE_SYNC :
789 FIB_NODE_BW_FLAG_NONE),
796 adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
797 fib_walk_sync(FIB_NODE_TYPE_ADJ, ai, &bw_ctx);
800 * fib_walk_sync may allocate a new adjacency and potentially cause a
801 * realloc for adj_pool. When that happens, adj pointer is no longer
802 * valid here. We refresh the adj pointer accordingly.
805 adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
808 return (ADJ_WALK_RC_CONTINUE);
812 * @brief Registered function for SW interface state changes
814 static clib_error_t *
815 adj_nbr_sw_interface_state_change (vnet_main_t * vnm,
819 fib_protocol_t proto;
822 * walk each adj on the interface and trigger a walk from that adj
824 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
826 adj_nbr_interface_state_change_ctx_t ctx = {
827 .flags = ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) ?
828 ADJ_NBR_INTERFACE_UP :
832 adj_nbr_walk(sw_if_index, proto,
833 adj_nbr_interface_state_change_one,
840 VNET_SW_INTERFACE_ADMIN_UP_DOWN_FUNCTION_PRIO(
841 adj_nbr_sw_interface_state_change,
842 VNET_ITF_FUNC_PRIORITY_HIGH);
845 * @brief Invoked on each SW interface of a HW interface when the
846 * HW interface state changes
849 adj_nbr_hw_sw_interface_state_change (vnet_main_t * vnm,
853 adj_nbr_interface_state_change_ctx_t *ctx = arg;
854 fib_protocol_t proto;
857 * walk each adj on the interface and trigger a walk from that adj
859 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
861 adj_nbr_walk(sw_if_index, proto,
862 adj_nbr_interface_state_change_one,
865 return (WALK_CONTINUE);
869 * @brief Registered callback for HW interface state changes
871 static clib_error_t *
872 adj_nbr_hw_interface_state_change (vnet_main_t * vnm,
877 * walk SW interface on the HW
879 adj_nbr_interface_state_change_ctx_t ctx = {
880 .flags = ((flags & VNET_HW_INTERFACE_FLAG_LINK_UP) ?
881 ADJ_NBR_INTERFACE_UP :
885 vnet_hw_interface_walk_sw(vnm, hw_if_index,
886 adj_nbr_hw_sw_interface_state_change,
892 VNET_HW_INTERFACE_LINK_UP_DOWN_FUNCTION_PRIO(
893 adj_nbr_hw_interface_state_change,
894 VNET_ITF_FUNC_PRIORITY_HIGH);
897 adj_nbr_interface_delete_one (adj_index_t ai,
901 * Back walk the graph to inform the forwarding entries
902 * that this interface has been deleted.
904 fib_node_back_walk_ctx_t bw_ctx = {
905 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_INTERFACE_DELETE,
912 adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
913 fib_walk_sync(FIB_NODE_TYPE_ADJ, ai, &bw_ctx);
916 * fib_walk_sync may allocate a new adjacency and potentially cause a
917 * realloc for adj_pool. When that happens, adj pointer is no longer
918 * valid here. We refresh the adj pointer accordingly.
921 adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
924 return (ADJ_WALK_RC_CONTINUE);
928 * adj_nbr_interface_add_del
930 * Registered to receive interface Add and delete notifications
932 static clib_error_t *
933 adj_nbr_interface_add_del (vnet_main_t * vnm,
937 fib_protocol_t proto;
942 * not interested in interface additions. we will not back walk
943 * to resolve paths through newly added interfaces. Why? The control
944 * plane should have the brains to add interfaces first, then routes.
945 * So the case where there are paths with a interface that matches
946 * one just created is the case where the path resolved through an
947 * interface that was deleted, and still has not been removed. The
948 * new interface added, is NO GUARANTEE that the interface being
949 * added now, even though it may have the same sw_if_index, is the
950 * same interface that the path needs. So tough!
951 * If the control plane wants these routes to resolve it needs to
952 * remove and add them again.
957 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
959 adj_nbr_walk(sw_if_index, proto,
960 adj_nbr_interface_delete_one,
967 VNET_SW_INTERFACE_ADD_DEL_FUNCTION(adj_nbr_interface_add_del);
971 adj_nbr_ethernet_mac_change_one (adj_index_t ai,
974 vnet_update_adjacency_for_sw_interface(vnet_get_main(),
975 adj_get_sw_if_index(ai),
978 return (ADJ_WALK_RC_CONTINUE);
982 * Callback function invoked when an interface's MAC Address changes
985 adj_nbr_ethernet_change_mac (ethernet_main_t * em,
986 u32 sw_if_index, uword opaque)
988 fib_protocol_t proto;
990 FOR_EACH_FIB_IP_PROTOCOL(proto)
992 adj_nbr_walk(sw_if_index, proto,
993 adj_nbr_ethernet_mac_change_one,
999 adj_nbr_show_one (adj_index_t ai,
1002 vlib_cli_output (arg, "[@%d] %U",
1004 format_ip_adjacency, ai,
1005 FORMAT_IP_ADJACENCY_NONE);
1007 return (ADJ_WALK_RC_CONTINUE);
1010 static clib_error_t *
1011 adj_nbr_show (vlib_main_t * vm,
1012 unformat_input_t * input,
1013 vlib_cli_command_t * cmd)
1015 adj_index_t ai = ADJ_INDEX_INVALID;
1016 ip46_address_t nh = ip46_address_initializer;
1017 u32 sw_if_index = ~0;
1019 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1021 if (unformat (input, "%U",
1022 unformat_vnet_sw_interface, vnet_get_main(),
1025 else if (unformat (input, "%U",
1026 unformat_ip46_address, &nh, IP46_TYPE_ANY))
1028 else if (unformat (input, "%d", &ai))
1034 if (ADJ_INDEX_INVALID != ai)
1036 vlib_cli_output (vm, "[@%d] %U",
1038 format_ip_adjacency, ai,
1039 FORMAT_IP_ADJACENCY_DETAIL);
1041 else if (~0 != sw_if_index)
1043 fib_protocol_t proto;
1045 if (ip46_address_is_zero(&nh))
1047 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
1049 adj_nbr_walk(sw_if_index, proto,
1056 proto = (ip46_address_is_ip4(&nh) ?
1059 adj_nbr_walk_nh(sw_if_index, proto, &nh,
1066 fib_protocol_t proto;
1068 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
1070 vec_foreach_index(sw_if_index, adj_nbr_tables[proto])
1072 adj_nbr_walk(sw_if_index, proto,
1083 * Show all neighbour adjacencies.
1085 * @cliexstart{sh adj nbr}
1086 * [@2] ipv4 via 1.0.0.2 loop0: IP4: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1087 * [@3] mpls via 1.0.0.2 loop0: MPLS_UNICAST: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1088 * [@4] ipv4 via 1.0.0.3 loop0: IP4: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1089 * [@5] mpls via 1.0.0.3 loop0: MPLS_UNICAST: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1092 VLIB_CLI_COMMAND (ip4_show_fib_command, static) = {
1093 .path = "show adj nbr",
1094 .short_help = "show adj nbr [<adj_index>] [interface]",
1095 .function = adj_nbr_show,
1099 format_adj_nbr_incomplete (u8* s, va_list *ap)
1101 index_t index = va_arg(*ap, index_t);
1102 CLIB_UNUSED(u32 indent) = va_arg(*ap, u32);
1103 vnet_main_t * vnm = vnet_get_main();
1104 ip_adjacency_t * adj = adj_get(index);
1106 s = format (s, "arp-%U", format_vnet_link, adj->ia_link);
1107 s = format (s, ": via %U",
1108 format_ip46_address, &adj->sub_type.nbr.next_hop,
1109 adj_proto_to_46(adj->ia_nh_proto));
1110 s = format (s, " %U",
1111 format_vnet_sw_if_index_name,
1112 vnm, adj->rewrite_header.sw_if_index);
1118 format_adj_nbr (u8* s, va_list *ap)
1120 index_t index = va_arg(*ap, index_t);
1121 CLIB_UNUSED(u32 indent) = va_arg(*ap, u32);
1122 ip_adjacency_t * adj = adj_get(index);
1124 s = format (s, "%U", format_vnet_link, adj->ia_link);
1125 s = format (s, " via %U ",
1126 format_ip46_address, &adj->sub_type.nbr.next_hop,
1127 adj_proto_to_46(adj->ia_nh_proto));
1128 s = format (s, "%U",
1129 format_vnet_rewrite,
1130 &adj->rewrite_header, sizeof (adj->rewrite_data), 0);
1136 adj_dpo_lock (dpo_id_t *dpo)
1138 adj_lock(dpo->dpoi_index);
1141 adj_dpo_unlock (dpo_id_t *dpo)
1143 adj_unlock(dpo->dpoi_index);
1149 fib_show_memory_usage("Adjacency",
1150 pool_elts(adj_pool),
1152 sizeof(ip_adjacency_t));
1155 const static dpo_vft_t adj_nbr_dpo_vft = {
1156 .dv_lock = adj_dpo_lock,
1157 .dv_unlock = adj_dpo_unlock,
1158 .dv_format = format_adj_nbr,
1159 .dv_mem_show = adj_mem_show,
1160 .dv_get_urpf = adj_dpo_get_urpf,
1161 .dv_get_mtu = adj_dpo_get_mtu,
1163 const static dpo_vft_t adj_nbr_incompl_dpo_vft = {
1164 .dv_lock = adj_dpo_lock,
1165 .dv_unlock = adj_dpo_unlock,
1166 .dv_format = format_adj_nbr_incomplete,
1167 .dv_get_urpf = adj_dpo_get_urpf,
1168 .dv_get_mtu = adj_dpo_get_mtu,
1172 * @brief The per-protocol VLIB graph nodes that are assigned to an adjacency
1175 * this means that these graph nodes are ones from which a nbr is the
1176 * parent object in the DPO-graph.
1178 const static char* const nbr_ip4_nodes[] =
1183 const static char* const nbr_ip6_nodes[] =
1188 const static char* const nbr_mpls_nodes[] =
1193 const static char* const nbr_ethernet_nodes[] =
1198 const static char* const * const nbr_nodes[DPO_PROTO_NUM] =
1200 [DPO_PROTO_IP4] = nbr_ip4_nodes,
1201 [DPO_PROTO_IP6] = nbr_ip6_nodes,
1202 [DPO_PROTO_MPLS] = nbr_mpls_nodes,
1203 [DPO_PROTO_ETHERNET] = nbr_ethernet_nodes,
1206 const static char* const nbr_incomplete_ip4_nodes[] =
1211 const static char* const nbr_incomplete_ip6_nodes[] =
1213 "ip6-discover-neighbor",
1216 const static char* const nbr_incomplete_mpls_nodes[] =
1218 "mpls-adj-incomplete",
1222 const static char* const * const nbr_incomplete_nodes[DPO_PROTO_NUM] =
1224 [DPO_PROTO_IP4] = nbr_incomplete_ip4_nodes,
1225 [DPO_PROTO_IP6] = nbr_incomplete_ip6_nodes,
1226 [DPO_PROTO_MPLS] = nbr_incomplete_mpls_nodes,
1230 adj_nbr_module_init (void)
1232 dpo_register(DPO_ADJACENCY,
1235 dpo_register(DPO_ADJACENCY_INCOMPLETE,
1236 &adj_nbr_incompl_dpo_vft,
1237 nbr_incomplete_nodes);
1239 ethernet_address_change_ctx_t ctx = {
1240 .function = adj_nbr_ethernet_change_mac,
1241 .function_opaque = 0,
1243 vec_add1 (ethernet_main.address_change_callbacks, ctx);