2 * ethernet/arp.c: IP v4 ARP node
4 * Copyright (c) 2010 Cisco and/or its affiliates.
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
9 * http://www.apache.org/licenses/LICENSE-2.0
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
18 #include <vnet/ip/ip.h>
19 #include <vnet/ethernet/ethernet.h>
20 #include <vnet/ethernet/arp_packet.h>
21 #include <vnet/l2/l2_input.h>
22 #include <vppinfra/mhash.h>
/* Prototype declared locally rather than pulled in from a header.  The callers
   in this file pass a callback, a pointer to an argument block and the size of
   that block.  NOTE(review): presumably the callback is then run on the main
   thread with a copy of the data -- confirm against the API implementation. */
24 void vl_api_rpc_call_main_thread (void *fp, u8 * data, u32 data_length);
30 ip4_address_t ip4_address;
31 } ethernet_arp_ip4_key_t;
35 ethernet_arp_ip4_key_t key;
36 u8 ethernet_address[6];
/* Bits of an ARP cache entry's flags word.  The entry formatter prints "S" when
   STATIC is set and "G" when GLEAN is set.  GLEAN is written as (2 << 0), which
   evaluates to 2, so the two flags occupy distinct bits. */
39 #define ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC (1 << 0)
40 #define ETHERNET_ARP_IP4_ENTRY_FLAG_GLEAN (2 << 0)
42 u64 cpu_time_last_updated;
45 } ethernet_arp_ip4_entry_t;
52 } ethernet_proxy_arp_t;
60 /* Used for arp event notification only */
63 } pending_resolution_t;
67 /* Hash table mapping opcode name to opcode value. */
68 uword *opcode_by_name;
70 /* lite beer "glean" adjacency handling */
71 uword *pending_resolutions_by_address;
72 pending_resolution_t *pending_resolutions;
74 /* Mac address change notification */
75 uword *mac_changes_by_address;
76 pending_resolution_t *mac_changes;
78 ethernet_arp_ip4_entry_t *ip4_entry_pool;
80 mhash_t ip4_entry_by_key;
82 /* ARP attack mitigation */
84 u32 limit_arp_cache_size;
86 /* Proxy arp vector */
87 ethernet_proxy_arp_t *proxy_arps;
88 } ethernet_arp_main_t;
/* File-scope instance of the ARP state; the functions in this file obtain a
   pointer to it in a local named am. */
90 static ethernet_arp_main_t ethernet_arp_main;
93 format_ethernet_arp_hardware_type (u8 * s, va_list * va)
95 ethernet_arp_hardware_type_t h = va_arg (*va, ethernet_arp_hardware_type_t);
99 #define _(n,f) case n: t = #f; break;
100 foreach_ethernet_arp_hardware_type;
104 return format (s, "unknown 0x%x", h);
107 return format (s, "%s", t);
111 format_ethernet_arp_opcode (u8 * s, va_list * va)
113 ethernet_arp_opcode_t o = va_arg (*va, ethernet_arp_opcode_t);
117 #define _(f) case ETHERNET_ARP_OPCODE_##f: t = #f; break;
118 foreach_ethernet_arp_opcode;
122 return format (s, "unknown 0x%x", o);
125 return format (s, "%s", t);
129 unformat_ethernet_arp_opcode_host_byte_order (unformat_input_t * input,
132 int *result = va_arg (*args, int *);
133 ethernet_arp_main_t *am = &ethernet_arp_main;
136 /* Numeric opcode. */
137 if (unformat (input, "0x%x", &x) || unformat (input, "%d", &x))
146 if (unformat_user (input, unformat_vlib_number_by_name,
147 am->opcode_by_name, &i))
157 unformat_ethernet_arp_opcode_net_byte_order (unformat_input_t * input,
160 int *result = va_arg (*args, int *);
162 (input, unformat_ethernet_arp_opcode_host_byte_order, result))
165 *result = clib_host_to_net_u16 ((u16) * result);
170 format_ethernet_arp_header (u8 * s, va_list * va)
172 ethernet_arp_header_t *a = va_arg (*va, ethernet_arp_header_t *);
173 u32 max_header_bytes = va_arg (*va, u32);
175 u16 l2_type, l3_type;
177 if (max_header_bytes != 0 && sizeof (a[0]) > max_header_bytes)
178 return format (s, "ARP header truncated");
180 l2_type = clib_net_to_host_u16 (a->l2_type);
181 l3_type = clib_net_to_host_u16 (a->l3_type);
183 indent = format_get_indent (s);
185 s = format (s, "%U, type %U/%U, address size %d/%d",
186 format_ethernet_arp_opcode, clib_net_to_host_u16 (a->opcode),
187 format_ethernet_arp_hardware_type, l2_type,
188 format_ethernet_type, l3_type,
189 a->n_l2_address_bytes, a->n_l3_address_bytes);
191 if (l2_type == ETHERNET_ARP_HARDWARE_TYPE_ethernet
192 && l3_type == ETHERNET_TYPE_IP4)
194 s = format (s, "\n%U%U/%U -> %U/%U",
195 format_white_space, indent,
196 format_ethernet_address, a->ip4_over_ethernet[0].ethernet,
197 format_ip4_address, &a->ip4_over_ethernet[0].ip4,
198 format_ethernet_address, a->ip4_over_ethernet[1].ethernet,
199 format_ip4_address, &a->ip4_over_ethernet[1].ip4);
203 uword n2 = a->n_l2_address_bytes;
204 uword n3 = a->n_l3_address_bytes;
205 s = format (s, "\n%U%U/%U -> %U/%U",
206 format_white_space, indent,
207 format_hex_bytes, a->data + 0 * n2 + 0 * n3, n2,
208 format_hex_bytes, a->data + 1 * n2 + 0 * n3, n3,
209 format_hex_bytes, a->data + 1 * n2 + 1 * n3, n2,
210 format_hex_bytes, a->data + 2 * n2 + 1 * n3, n3);
217 format_ethernet_arp_ip4_entry (u8 * s, va_list * va)
219 vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
220 ethernet_arp_ip4_entry_t *e = va_arg (*va, ethernet_arp_ip4_entry_t *);
221 vnet_sw_interface_t *si;
226 return format (s, "%=12s%=6s%=16s%=6s%=20s%=24s", "Time", "FIB", "IP4",
227 "Flags", "Ethernet", "Interface");
229 fib = find_ip4_fib_by_table_index_or_id (&ip4_main, e->key.fib_index,
230 IP4_ROUTE_FLAG_FIB_INDEX);
231 si = vnet_get_sw_interface (vnm, e->key.sw_if_index);
233 if (e->flags & ETHERNET_ARP_IP4_ENTRY_FLAG_GLEAN)
234 flags = format (flags, "G");
236 if (e->flags & ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC)
237 flags = format (flags, "S");
239 s = format (s, "%=12U%=6u%=16U%=6s%=20U%=24U",
240 format_vlib_cpu_time, vnm->vlib_main, e->cpu_time_last_updated,
242 format_ip4_address, &e->key.ip4_address,
243 flags ? (char *) flags : "",
244 format_ethernet_address, e->ethernet_address,
245 format_vnet_sw_interface_name, vnm, si);
254 } ethernet_arp_input_trace_t;
257 format_ethernet_arp_input_trace (u8 * s, va_list * va)
259 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*va, vlib_main_t *);
260 CLIB_UNUSED (vlib_node_t * node) = va_arg (*va, vlib_node_t *);
261 ethernet_arp_input_trace_t *t = va_arg (*va, ethernet_arp_input_trace_t *);
264 format_ethernet_arp_header,
265 t->packet_data, sizeof (t->packet_data));
271 ethernet_arp_sw_interface_up_down (vnet_main_t * vnm,
272 u32 sw_if_index, u32 flags)
274 ethernet_arp_main_t *am = &ethernet_arp_main;
275 ethernet_arp_ip4_entry_t *e;
280 pool_foreach (e, am->ip4_entry_pool, ({
281 if (e->key.sw_if_index == sw_if_index)
282 vec_add1 (to_add_del, e - am->ip4_entry_pool);
286 for (i = 0; i < vec_len (to_add_del); i++)
288 ethernet_arp_ip4_over_ethernet_address_t arp_add;
289 e = pool_elt_at_index (am->ip4_entry_pool, to_add_del[i]);
291 clib_memcpy (&arp_add.ethernet, e->ethernet_address, 6);
292 arp_add.ip4.as_u32 = e->key.ip4_address.as_u32;
294 if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
296 vnet_arp_set_ip4_over_ethernet (vnm,
298 e->key.fib_index, &arp_add,
300 ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC);
302 else if ((e->flags & ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC) == 0)
304 vnet_arp_unset_ip4_over_ethernet (vnm,
306 e->key.fib_index, &arp_add);
310 vec_free (to_add_del);
314 VNET_SW_INTERFACE_ADMIN_UP_DOWN_FUNCTION (ethernet_arp_sw_interface_up_down);
317 vnet_arp_set_ip4_over_ethernet_internal (vnet_main_t * vnm,
320 void *a_arg, int is_static);
323 vnet_arp_unset_ip4_over_ethernet_internal (vnet_main_t * vnm,
325 u32 fib_index, void *a_arg);
331 ethernet_arp_ip4_over_ethernet_address_t a;
333 int is_remove; /* set is_remove=1 to clear arp entry */
334 } vnet_arp_set_ip4_over_ethernet_rpc_args_t;
336 static void set_ip4_over_ethernet_rpc_callback
337 (vnet_arp_set_ip4_over_ethernet_rpc_args_t * a)
339 vnet_main_t *vm = vnet_get_main ();
340 ASSERT (os_get_cpu_number () == 0);
343 vnet_arp_unset_ip4_over_ethernet_internal (vm,
345 a->fib_index, &(a->a));
347 vnet_arp_set_ip4_over_ethernet_internal (vm,
350 &(a->a), a->is_static);
354 vnet_arp_set_ip4_over_ethernet (vnet_main_t * vnm,
356 u32 fib_index, void *a_arg, int is_static)
358 ethernet_arp_ip4_over_ethernet_address_t *a = a_arg;
359 vnet_arp_set_ip4_over_ethernet_rpc_args_t args;
361 args.sw_if_index = sw_if_index;
362 args.fib_index = fib_index;
363 args.is_static = is_static;
365 clib_memcpy (&args.a, a, sizeof (*a));
367 vl_api_rpc_call_main_thread (set_ip4_over_ethernet_rpc_callback,
368 (u8 *) & args, sizeof (args));
373 vnet_arp_set_ip4_over_ethernet_internal (vnet_main_t * vnm,
376 void *a_arg, int is_static)
378 ethernet_arp_ip4_key_t k;
379 ethernet_arp_ip4_entry_t *e = 0;
380 ethernet_arp_main_t *am = &ethernet_arp_main;
381 ethernet_arp_ip4_over_ethernet_address_t *a = a_arg;
382 vlib_main_t *vm = vlib_get_main ();
383 ip4_main_t *im = &ip4_main;
384 ip_lookup_main_t *lm = &im->lookup_main;
385 int make_new_arp_cache_entry = 1;
387 ip4_add_del_route_args_t args;
388 ip_adjacency_t adj, *existing_adj;
389 pending_resolution_t *pr, *mc;
394 fib_index = (fib_index != (u32) ~ 0)
395 ? fib_index : im->fib_index_by_sw_if_index[sw_if_index];
397 k.sw_if_index = sw_if_index;
398 k.ip4_address = a->ip4;
399 k.fib_index = fib_index;
401 p = mhash_get (&am->ip4_entry_by_key, &k);
404 e = pool_elt_at_index (am->ip4_entry_pool, p[0]);
406 /* Refuse to over-write static arp. */
407 if (!is_static && (e->flags & ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC))
409 make_new_arp_cache_entry = 0;
412 /* Note: always install the route. It might have been deleted */
413 memset (&adj, 0, sizeof (adj));
414 adj.lookup_next_index = IP_LOOKUP_NEXT_REWRITE;
415 adj.n_adj = 1; /* otherwise signature compare fails */
417 vnet_rewrite_for_sw_interface (vnm, VNET_L3_PACKET_TYPE_IP4, sw_if_index, ip4_rewrite_node.index, a->ethernet, /* destination address */
419 sizeof (adj.rewrite_data));
421 /* result of this lookup should be next-hop adjacency */
422 adj_index = ip4_fib_lookup_with_table (im, fib_index, &a->ip4, 0);
423 existing_adj = ip_get_adjacency (lm, adj_index);
425 if (existing_adj->lookup_next_index == IP_LOOKUP_NEXT_ARP &&
426 existing_adj->arp.next_hop.ip4.as_u32 == a->ip4.as_u32)
429 u32 *adjs = vec_dup (e->adjacencies);
430 /* Update all adj assigned to this arp entry */
431 vec_foreach (ai, adjs)
434 ip_adjacency_t *uadj = ip_get_adjacency (lm, *ai);
435 for (i = 0; i < uadj->n_adj; i++)
436 if (uadj[i].lookup_next_index == IP_LOOKUP_NEXT_ARP &&
437 uadj[i].arp.next_hop.ip4.as_u32 == a->ip4.as_u32)
438 ip_update_adjacency (lm, *ai + i, &adj);
444 /* Check that new adjacency actually isn't exactly the same as
445 * what is already there. If we over-write the adjacency with
446 * exactly the same info, it's technically a new adjacency with
447 * new counters, but to user it appears as counters reset.
449 if (vnet_ip_adjacency_share_compare (&adj, existing_adj) == 0)
452 args.table_index_or_table_id = fib_index;
454 IP4_ROUTE_FLAG_FIB_INDEX | IP4_ROUTE_FLAG_ADD |
455 IP4_ROUTE_FLAG_NEIGHBOR;
456 args.dst_address = a->ip4;
457 args.dst_address_length = 32;
461 ip4_add_del_route (im, &args);
465 if (make_new_arp_cache_entry)
467 pool_get (am->ip4_entry_pool, e);
468 mhash_set (&am->ip4_entry_by_key, &k, e - am->ip4_entry_pool,
473 /* Update time stamp and ethernet address. */
474 clib_memcpy (e->ethernet_address, a->ethernet,
475 sizeof (e->ethernet_address));
476 e->cpu_time_last_updated = clib_cpu_time_now ();
478 e->flags |= ETHERNET_ARP_IP4_ENTRY_FLAG_STATIC;
480 /* Customer(s) waiting for this address to be resolved? */
481 p = hash_get (am->pending_resolutions_by_address, a->ip4.as_u32);
486 while (next_index != (u32) ~ 0)
488 pr = pool_elt_at_index (am->pending_resolutions, next_index);
489 vlib_process_signal_event (vm, pr->node_index,
490 pr->type_opaque, pr->data);
491 next_index = pr->next_index;
492 pool_put (am->pending_resolutions, pr);
495 hash_unset (am->pending_resolutions_by_address, a->ip4.as_u32);
498 /* Customer(s) requesting ARP event for this address? */
499 p = hash_get (am->mac_changes_by_address, a->ip4.as_u32);
504 while (next_index != (u32) ~ 0)
506 int (*fp) (u32, u8 *, u32, u32);
508 mc = pool_elt_at_index (am->mac_changes, next_index);
509 fp = mc->data_callback;
511 /* Call the user's data callback, return 1 to suppress dup events */
513 rv = (*fp) (mc->data, a->ethernet, sw_if_index, 0);
516 * Signal the resolver process, as long as the user
517 * says they want to be notified
520 vlib_process_signal_event (vm, mc->node_index,
521 mc->type_opaque, mc->data);
522 next_index = mc->next_index;
530 vnet_register_ip4_arp_resolution_event (vnet_main_t * vnm,
533 uword type_opaque, uword data)
535 ethernet_arp_main_t *am = &ethernet_arp_main;
536 ip4_address_t *address = address_arg;
538 pending_resolution_t *pr;
540 pool_get (am->pending_resolutions, pr);
543 pr->node_index = node_index;
544 pr->type_opaque = type_opaque;
546 pr->data_callback = 0;
548 p = hash_get (am->pending_resolutions_by_address, address->as_u32);
551 /* Insert new resolution at the head of the list */
552 pr->next_index = p[0];
553 hash_unset (am->pending_resolutions_by_address, address->as_u32);
556 hash_set (am->pending_resolutions_by_address, address->as_u32,
557 pr - am->pending_resolutions);
561 vnet_add_del_ip4_arp_change_event (vnet_main_t * vnm,
566 uword type_opaque, uword data, int is_add)
568 ethernet_arp_main_t *am = &ethernet_arp_main;
569 ip4_address_t *address = address_arg;
571 pending_resolution_t *mc;
572 void (*fp) (u32, u8 *) = data_callback;
576 pool_get (am->mac_changes, mc);
579 mc->node_index = node_index;
580 mc->type_opaque = type_opaque;
582 mc->data_callback = data_callback;
585 p = hash_get (am->mac_changes_by_address, address->as_u32);
588 /* Insert new resolution at the head of the list */
589 mc->next_index = p[0];
590 hash_unset (am->mac_changes_by_address, address->as_u32);
593 hash_set (am->mac_changes_by_address, address->as_u32,
594 mc - am->mac_changes);
600 pending_resolution_t *mc_last = 0;
602 p = hash_get (am->mac_changes_by_address, address->as_u32);
604 return VNET_API_ERROR_NO_SUCH_ENTRY;
608 while (index != (u32) ~ 0)
610 mc = pool_elt_at_index (am->mac_changes, index);
611 if (mc->node_index == node_index &&
612 mc->type_opaque == type_opaque && mc->pid == pid)
614 /* Clients may need to clean up pool entries, too */
616 (*fp) (mc->data, 0 /* no new mac addrs */ );
619 hash_unset (am->mac_changes_by_address, address->as_u32);
620 if (mc->next_index != ~0)
621 hash_set (am->mac_changes_by_address, address->as_u32,
623 pool_put (am->mac_changes, mc);
629 mc_last->next_index = mc->next_index;
630 pool_put (am->mac_changes, mc);
635 index = mc->next_index;
638 return VNET_API_ERROR_NO_SUCH_ENTRY;
642 /* Either we drop the packet or we send a reply to the sender. */
646 ARP_INPUT_NEXT_REPLY_TX,
/* X-macro listing every arp-input counter as _ (symbol, description).
   It is expanded elsewhere in this file with different definitions of _ to
   produce the ETHERNET_ARP_ERROR_<symbol> enumerators and the matching table
   of description strings, so the two always stay in the same order. */
650 #define foreach_ethernet_arp_error \
651 _ (replies_sent, "ARP replies sent") \
652 _ (l2_type_not_ethernet, "L2 type not ethernet") \
653 _ (l3_type_not_ip4, "L3 type not IP4") \
654 _ (l3_src_address_not_local, "IP4 source address not local to subnet") \
655 _ (l3_dst_address_not_local, "IP4 destination address not local to subnet") \
656 _ (l3_src_address_is_local, "IP4 source address matches local interface") \
657 _ (l3_src_address_learned, "ARP request IP4 source address learned") \
658 _ (replies_received, "ARP replies received") \
659 _ (opcode_not_request, "ARP opcode not request") \
660 _ (proxy_arp_replies_sent, "Proxy ARP replies sent") \
661 _ (l2_address_mismatch, "ARP hw addr does not match L2 frame src addr") \
662 _ (missing_interface_address, "ARP missing interface address") \
663 _ (gratuitous_arp, "ARP probe or announcement dropped") \
667 #define _(sym,string) ETHERNET_ARP_ERROR_##sym,
668 foreach_ethernet_arp_error
670 ETHERNET_ARP_N_ERROR,
671 } ethernet_arp_input_error_t;
673 /* get first interface address */
675 ip4_interface_first_address (ip4_main_t * im, u32 sw_if_index,
676 ip_interface_address_t ** result_ia)
678 ip_lookup_main_t *lm = &im->lookup_main;
679 ip_interface_address_t *ia = 0;
680 ip4_address_t *result = 0;
683 foreach_ip_interface_address (lm, ia, sw_if_index,
684 1 /* honor unnumbered */ ,
687 ip_interface_address_get_address (lm, ia);
693 *result_ia = result ? ia : 0;
698 unset_random_arp_entry (void)
700 ethernet_arp_main_t *am = &ethernet_arp_main;
701 ethernet_arp_ip4_entry_t *e;
702 vnet_main_t *vnm = vnet_get_main ();
703 ethernet_arp_ip4_over_ethernet_address_t delme;
706 index = pool_next_index (am->ip4_entry_pool, am->arp_delete_rotor);
707 am->arp_delete_rotor = index;
709 /* Try again from elt 0, could happen if an intfc goes down */
712 index = pool_next_index (am->ip4_entry_pool, am->arp_delete_rotor);
713 am->arp_delete_rotor = index;
716 /* Nothing left in the pool */
720 e = pool_elt_at_index (am->ip4_entry_pool, index);
722 clib_memcpy (&delme.ethernet, e->ethernet_address, 6);
723 delme.ip4.as_u32 = e->key.ip4_address.as_u32;
725 vnet_arp_unset_ip4_over_ethernet (vnm, e->key.sw_if_index,
726 e->key.fib_index, &delme);
730 arp_unnumbered (vlib_buffer_t * p0,
732 ethernet_header_t * eth0, ip_interface_address_t * ifa0)
734 vlib_main_t *vm = vlib_get_main ();
735 vnet_main_t *vnm = vnet_get_main ();
736 vnet_interface_main_t *vim = &vnm->interface_main;
737 vnet_sw_interface_t *si;
738 vnet_hw_interface_t *hi;
739 u32 unnum_src_sw_if_index;
740 u32 *broadcast_swifs = 0;
745 u8 dst_mac_address[6];
747 ethernet_arp_header_t *arp0;
749 /* Save the dst mac address */
750 clib_memcpy (dst_mac_address, eth0->dst_address, sizeof (dst_mac_address));
752 /* Figure out which sw_if_index supplied the address */
753 unnum_src_sw_if_index = ifa0->sw_if_index;
755 /* Track down all users of the unnumbered source */
757 pool_foreach (si, vim->sw_interfaces,
759 if (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED &&
760 (si->unnumbered_sw_if_index == unnum_src_sw_if_index))
762 vec_add1 (broadcast_swifs, si->sw_if_index);
767 ASSERT (vec_len (broadcast_swifs));
769 /* Allocate buffering if we need it */
770 if (vec_len (broadcast_swifs) > 1)
772 vec_validate (buffers, vec_len (broadcast_swifs) - 2);
773 n_alloc = vlib_buffer_alloc (vm, buffers, vec_len (buffers));
774 _vec_len (buffers) = n_alloc;
775 for (i = 0; i < n_alloc; i++)
777 b0 = vlib_get_buffer (vm, buffers[i]);
779 /* xerox (partially built) ARP pkt */
780 clib_memcpy (b0->data, p0->data,
781 p0->current_length + p0->current_data);
782 b0->current_data = p0->current_data;
783 b0->current_length = p0->current_length;
784 vnet_buffer (b0)->sw_if_index[VLIB_RX] =
785 vnet_buffer (p0)->sw_if_index[VLIB_RX];
789 vec_insert (buffers, 1, 0);
792 for (i = 0; i < vec_len (buffers); i++)
794 b0 = vlib_get_buffer (vm, buffers[i]);
795 arp0 = vlib_buffer_get_current (b0);
797 hi = vnet_get_sup_hw_interface (vnm, broadcast_swifs[i]);
798 si = vnet_get_sw_interface (vnm, broadcast_swifs[i]);
800 /* For decoration, most likely */
801 vnet_buffer (b0)->sw_if_index[VLIB_TX] = hi->sw_if_index;
803 /* Fix ARP pkt src address */
804 clib_memcpy (arp0->ip4_over_ethernet[0].ethernet, hi->hw_address, 6);
806 /* Build L2 encaps for this swif */
807 header_size = sizeof (ethernet_header_t);
808 if (si->sub.eth.flags.one_tag)
810 else if (si->sub.eth.flags.two_tags)
813 vlib_buffer_advance (b0, -header_size);
814 eth0 = vlib_buffer_get_current (b0);
816 if (si->sub.eth.flags.one_tag)
818 ethernet_vlan_header_t *outer = (void *) (eth0 + 1);
820 eth0->type = si->sub.eth.flags.dot1ad ?
821 clib_host_to_net_u16 (ETHERNET_TYPE_DOT1AD) :
822 clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
823 outer->priority_cfi_and_id =
824 clib_host_to_net_u16 (si->sub.eth.outer_vlan_id);
825 outer->type = clib_host_to_net_u16 (ETHERNET_TYPE_ARP);
828 else if (si->sub.eth.flags.two_tags)
830 ethernet_vlan_header_t *outer = (void *) (eth0 + 1);
831 ethernet_vlan_header_t *inner = (void *) (outer + 1);
833 eth0->type = si->sub.eth.flags.dot1ad ?
834 clib_host_to_net_u16 (ETHERNET_TYPE_DOT1AD) :
835 clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
836 outer->priority_cfi_and_id =
837 clib_host_to_net_u16 (si->sub.eth.outer_vlan_id);
838 outer->type = clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
839 inner->priority_cfi_and_id =
840 clib_host_to_net_u16 (si->sub.eth.inner_vlan_id);
841 inner->type = clib_host_to_net_u16 (ETHERNET_TYPE_ARP);
846 eth0->type = clib_host_to_net_u16 (ETHERNET_TYPE_ARP);
849 /* Restore the original dst address, set src address */
850 clib_memcpy (eth0->dst_address, dst_mac_address,
851 sizeof (eth0->dst_address));
852 clib_memcpy (eth0->src_address, hi->hw_address,
853 sizeof (eth0->src_address));
855 /* Transmit replicas */
859 vlib_get_frame_to_node (vm, hi->output_node_index);
860 u32 *to_next = vlib_frame_vector_args (f);
861 to_next[0] = buffers[i];
863 vlib_put_frame_to_node (vm, hi->output_node_index, f);
867 /* The regular path outputs the original pkt.. */
868 vnet_buffer (p0)->sw_if_index[VLIB_TX] = broadcast_swifs[0];
870 vec_free (broadcast_swifs);
875 arp_input (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
877 ethernet_arp_main_t *am = &ethernet_arp_main;
878 vnet_main_t *vnm = vnet_get_main ();
879 ip4_main_t *im4 = &ip4_main;
880 u32 n_left_from, next_index, *from, *to_next;
881 u32 n_replies_sent = 0, n_proxy_arp_replies_sent = 0;
883 from = vlib_frame_vector_args (frame);
884 n_left_from = frame->n_vectors;
885 next_index = node->cached_next_index;
887 if (node->flags & VLIB_NODE_FLAG_TRACE)
888 vlib_trace_frame_buffers_only (vm, node, from, frame->n_vectors,
890 sizeof (ethernet_arp_input_trace_t));
892 while (n_left_from > 0)
896 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
898 while (n_left_from > 0 && n_left_to_next > 0)
901 vnet_hw_interface_t *hw_if0;
902 ethernet_arp_header_t *arp0;
903 ethernet_header_t *eth0;
904 ip_interface_address_t *ifa0;
905 ip_adjacency_t *adj0;
906 ip4_address_t *if_addr0;
907 ip4_address_t proxy_src;
908 u32 pi0, error0, next0, sw_if_index0;
909 u8 is_request0, src_is_local0, dst_is_local0, is_unnum0;
910 ethernet_proxy_arp_t *pa;
919 p0 = vlib_get_buffer (vm, pi0);
920 arp0 = vlib_buffer_get_current (p0);
922 is_request0 = arp0->opcode
923 == clib_host_to_net_u16 (ETHERNET_ARP_OPCODE_request);
925 error0 = ETHERNET_ARP_ERROR_replies_sent;
929 clib_net_to_host_u16 (ETHERNET_ARP_HARDWARE_TYPE_ethernet) ?
930 ETHERNET_ARP_ERROR_l2_type_not_ethernet : error0);
933 clib_net_to_host_u16 (ETHERNET_TYPE_IP4) ?
934 ETHERNET_ARP_ERROR_l3_type_not_ip4 : error0);
936 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
941 /* Check that IP address is local and matches incoming interface. */
943 ip4_interface_address_matching_destination (im4,
945 ip4_over_ethernet[1].
950 error0 = ETHERNET_ARP_ERROR_l3_dst_address_not_local;
954 /* Honor unnumbered interface, if any */
955 is_unnum0 = sw_if_index0 != ifa0->sw_if_index;
957 /* Source must also be local to subnet of matching interface address. */
958 if (!ip4_destination_matches_interface
959 (im4, &arp0->ip4_over_ethernet[0].ip4, ifa0))
961 error0 = ETHERNET_ARP_ERROR_l3_src_address_not_local;
965 /* Reject requests/replies with our local interface address. */
967 if_addr0->as_u32 == arp0->ip4_over_ethernet[0].ip4.as_u32;
970 error0 = ETHERNET_ARP_ERROR_l3_src_address_is_local;
975 if_addr0->as_u32 == arp0->ip4_over_ethernet[1].ip4.as_u32;
977 /* Fill in ethernet header. */
978 eth0 = ethernet_buffer_get_header (p0);
980 /* Trash ARP packets whose ARP-level source addresses do not
981 match their L2-frame-level source addresses */
982 if (memcmp (eth0->src_address, arp0->ip4_over_ethernet[0].ethernet,
983 sizeof (eth0->src_address)))
985 error0 = ETHERNET_ARP_ERROR_l2_address_mismatch;
989 /* Learn or update sender's mapping only for requests or unicasts
990 that don't match local interface address. */
991 if (ethernet_address_cast (eth0->dst_address) ==
992 ETHERNET_ADDRESS_UNICAST || is_request0)
994 if (am->limit_arp_cache_size &&
995 pool_elts (am->ip4_entry_pool) >= am->limit_arp_cache_size)
996 unset_random_arp_entry ();
998 vnet_arp_set_ip4_over_ethernet (vnm, sw_if_index0,
999 (u32) ~ 0 /* default fib */ ,
1000 &arp0->ip4_over_ethernet[0],
1001 0 /* is_static */ );
1002 error0 = ETHERNET_ARP_ERROR_l3_src_address_learned;
1005 /* Only send a reply for requests sent which match a local interface. */
1006 if (!(is_request0 && dst_is_local0))
1010 clib_host_to_net_u16 (ETHERNET_ARP_OPCODE_reply) ?
1011 ETHERNET_ARP_ERROR_replies_received : error0);
1017 vnet_buffer (p0)->sw_if_index[VLIB_TX] = sw_if_index0;
1018 hw_if0 = vnet_get_sup_hw_interface (vnm, sw_if_index0);
1020 /* Send reply back through input interface */
1021 vnet_buffer (p0)->sw_if_index[VLIB_TX] = sw_if_index0;
1022 next0 = ARP_INPUT_NEXT_REPLY_TX;
1024 arp0->opcode = clib_host_to_net_u16 (ETHERNET_ARP_OPCODE_reply);
1026 arp0->ip4_over_ethernet[1] = arp0->ip4_over_ethernet[0];
1028 clib_memcpy (arp0->ip4_over_ethernet[0].ethernet,
1029 hw_if0->hw_address, 6);
1030 clib_mem_unaligned (&arp0->ip4_over_ethernet[0].ip4.data_u32, u32) =
1033 /* Hardware must be ethernet-like. */
1034 ASSERT (vec_len (hw_if0->hw_address) == 6);
1036 clib_memcpy (eth0->dst_address, eth0->src_address, 6);
1037 clib_memcpy (eth0->src_address, hw_if0->hw_address, 6);
1039 /* Figure out how much to rewind current data from adjacency. */
1042 adj0 = ip_get_adjacency (&ip4_main.lookup_main,
1043 ifa0->neighbor_probe_adj_index);
1044 if (adj0->lookup_next_index != IP_LOOKUP_NEXT_ARP)
1046 error0 = ETHERNET_ARP_ERROR_missing_interface_address;
1050 arp_unnumbered (p0, pi0, eth0, ifa0);
1052 vlib_buffer_advance (p0, -adj0->rewrite_header.data_bytes);
1055 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
1056 n_left_to_next, pi0, next0);
1058 n_replies_sent += 1;
1062 if (0 == arp0->ip4_over_ethernet[0].ip4.as_u32 ||
1063 (arp0->ip4_over_ethernet[0].ip4.as_u32 ==
1064 arp0->ip4_over_ethernet[1].ip4.as_u32))
1066 error0 = ETHERNET_ARP_ERROR_gratuitous_arp;
1069 /* See if proxy arp is configured for the address */
1072 vnet_sw_interface_t *si;
1073 u32 this_addr = clib_net_to_host_u32
1074 (arp0->ip4_over_ethernet[1].ip4.as_u32);
1077 si = vnet_get_sw_interface (vnm, sw_if_index0);
1079 if (!(si->flags & VNET_SW_INTERFACE_FLAG_PROXY_ARP))
1082 fib_index0 = vec_elt (im4->fib_index_by_sw_if_index,
1085 vec_foreach (pa, am->proxy_arps)
1087 u32 lo_addr = clib_net_to_host_u32 (pa->lo_addr);
1088 u32 hi_addr = clib_net_to_host_u32 (pa->hi_addr);
1090 /* an ARP request hit in the proxy-arp table? */
1091 if ((this_addr >= lo_addr && this_addr <= hi_addr) &&
1092 (fib_index0 == pa->fib_index))
1094 eth0 = ethernet_buffer_get_header (p0);
1096 arp0->ip4_over_ethernet[1].ip4.data_u32;
1099 * Rewind buffer, direct code above not to
1100 * think too hard about it.
1101 * $$$ is the answer ever anything other than
1102 * vlib_buffer_reset(..)?
1105 if_addr0 = &proxy_src;
1106 vlib_buffer_reset (p0);
1107 n_proxy_arp_replies_sent++;
1115 next0 = ARP_INPUT_NEXT_DROP;
1116 p0->error = node->errors[error0];
1118 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
1119 n_left_to_next, pi0, next0);
1122 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
1125 vlib_error_count (vm, node->node_index,
1126 ETHERNET_ARP_ERROR_replies_sent,
1127 n_replies_sent - n_proxy_arp_replies_sent);
1129 vlib_error_count (vm, node->node_index,
1130 ETHERNET_ARP_ERROR_proxy_arp_replies_sent,
1131 n_proxy_arp_replies_sent);
1132 return frame->n_vectors;
1135 static char *ethernet_arp_error_strings[] = {
1136 #define _(sym,string) string,
1137 foreach_ethernet_arp_error
1142 VLIB_REGISTER_NODE (arp_input_node, static) =
1144 .function = arp_input,
1145 .name = "arp-input",
1146 .vector_size = sizeof (u32),
1147 .n_errors = ETHERNET_ARP_N_ERROR,
1148 .error_strings = ethernet_arp_error_strings,
1149 .n_next_nodes = ARP_INPUT_N_NEXT,
1151 [ARP_INPUT_NEXT_DROP] = "error-drop",
1152 [ARP_INPUT_NEXT_REPLY_TX] = "interface-output",
1154 .format_buffer = format_ethernet_arp_header,
1155 .format_trace = format_ethernet_arp_input_trace,
1160 ip4_arp_entry_sort (void *a1, void *a2)
1162 ethernet_arp_ip4_entry_t *e1 = a1;
1163 ethernet_arp_ip4_entry_t *e2 = a2;
1166 vnet_main_t *vnm = vnet_get_main ();
1168 cmp = vnet_sw_interface_compare
1169 (vnm, e1->key.sw_if_index, e2->key.sw_if_index);
1171 cmp = ip4_address_compare (&e1->key.ip4_address, &e2->key.ip4_address);
1175 static clib_error_t *
1176 show_ip4_arp (vlib_main_t * vm,
1177 unformat_input_t * input, vlib_cli_command_t * cmd)
1179 vnet_main_t *vnm = vnet_get_main ();
1180 ethernet_arp_main_t *am = &ethernet_arp_main;
1181 ethernet_arp_ip4_entry_t *e, *es;
1182 ethernet_proxy_arp_t *pa;
1183 clib_error_t *error = 0;
1186 /* Filter entries by interface if given. */
1188 (void) unformat_user (input, unformat_vnet_sw_interface, vnm, &sw_if_index);
1192 pool_foreach (e, am->ip4_entry_pool,
1194 vec_add1 (es, e[0]);
1200 vec_sort_with_function (es, ip4_arp_entry_sort);
1201 vlib_cli_output (vm, "%U", format_ethernet_arp_ip4_entry, vnm, 0);
1204 if (sw_if_index != ~0 && e->key.sw_if_index != sw_if_index)
1206 vlib_cli_output (vm, "%U", format_ethernet_arp_ip4_entry, vnm, e);
1211 if (vec_len (am->proxy_arps))
1213 vlib_cli_output (vm, "Proxy arps enabled for:");
1214 vec_foreach (pa, am->proxy_arps)
1216 vlib_cli_output (vm, "Fib_index %d %U - %U ",
1218 format_ip4_address, &pa->lo_addr,
1219 format_ip4_address, &pa->hi_addr);
1227 VLIB_CLI_COMMAND (show_ip4_arp_command, static) = {
1228 .path = "show ip arp",
1229 .function = show_ip4_arp,
1230 .short_help = "Show ARP table",
1236 pg_edit_t l2_type, l3_type;
1237 pg_edit_t n_l2_address_bytes, n_l3_address_bytes;
1243 } ip4_over_ethernet[2];
1244 } pg_ethernet_arp_header_t;
1247 pg_ethernet_arp_header_init (pg_ethernet_arp_header_t * p)
1249 /* Initialize fields that are not bit fields in the ARP header. */
1250 #define _(f) pg_edit_init (&p->f, ethernet_arp_header_t, f);
1253 _(n_l2_address_bytes);
1254 _(n_l3_address_bytes);
1256 _(ip4_over_ethernet[0].ethernet);
1257 _(ip4_over_ethernet[0].ip4);
1258 _(ip4_over_ethernet[1].ethernet);
1259 _(ip4_over_ethernet[1].ip4);
1264 unformat_pg_arp_header (unformat_input_t * input, va_list * args)
1266 pg_stream_t *s = va_arg (*args, pg_stream_t *);
1267 pg_ethernet_arp_header_t *p;
1270 p = pg_create_edit_group (s, sizeof (p[0]), sizeof (ethernet_arp_header_t),
1272 pg_ethernet_arp_header_init (p);
1275 pg_edit_set_fixed (&p->l2_type, ETHERNET_ARP_HARDWARE_TYPE_ethernet);
1276 pg_edit_set_fixed (&p->l3_type, ETHERNET_TYPE_IP4);
1277 pg_edit_set_fixed (&p->n_l2_address_bytes, 6);
1278 pg_edit_set_fixed (&p->n_l3_address_bytes, 4);
1280 if (!unformat (input, "%U: %U/%U -> %U/%U",
1282 unformat_ethernet_arp_opcode_net_byte_order, &p->opcode,
1284 unformat_ethernet_address, &p->ip4_over_ethernet[0].ethernet,
1286 unformat_ip4_address, &p->ip4_over_ethernet[0].ip4,
1288 unformat_ethernet_address, &p->ip4_over_ethernet[1].ethernet,
1290 unformat_ip4_address, &p->ip4_over_ethernet[1].ip4))
1292 /* Free up any edits we may have added. */
1293 pg_free_edit_group (s);
1300 ip4_set_arp_limit (u32 arp_limit)
1302 ethernet_arp_main_t *am = &ethernet_arp_main;
1304 am->limit_arp_cache_size = arp_limit;
1309 arp_ip4_entry_del_adj (ethernet_arp_ip4_entry_t * e, u32 adj_index)
1316 vec_foreach_index (i, e->adjacencies)
1317 if (vec_elt (e->adjacencies, i) == adj_index)
1319 vec_del1 (e->adjacencies, i);
1327 arp_ip4_entry_add_adj (ethernet_arp_ip4_entry_t * e, u32 adj_index)
1330 vec_foreach_index (i, e->adjacencies)
1331 if (vec_elt (e->adjacencies, i) == adj_index)
1333 vec_add1 (e->adjacencies, adj_index);
1337 arp_add_del_adj_cb (struct ip_lookup_main_t *lm,
1338 u32 adj_index, ip_adjacency_t * adj, u32 is_del)
1340 ethernet_arp_main_t *am = &ethernet_arp_main;
1341 ip4_main_t *im = &ip4_main;
1342 ethernet_arp_ip4_key_t k;
1343 ethernet_arp_ip4_entry_t *e = 0;
1347 for (ai = adj->heap_handle; ai < adj->heap_handle + adj->n_adj; ai++)
1349 adj = ip_get_adjacency (lm, ai);
1350 if (adj->lookup_next_index == IP_LOOKUP_NEXT_ARP
1351 && adj->arp.next_hop.ip4.as_u32)
1353 k.sw_if_index = adj->rewrite_header.sw_if_index;
1354 k.ip4_address.as_u32 = adj->arp.next_hop.ip4.as_u32;
1356 im->fib_index_by_sw_if_index[adj->rewrite_header.sw_if_index];
1357 p = mhash_get (&am->ip4_entry_by_key, &k);
1359 e = pool_elt_at_index (am->ip4_entry_pool, p[0]);
1367 clib_warning ("Adjacency contains unknown ARP next hop %U (del)",
1368 format_ip46_address, &adj->arp.next_hop,
1371 arp_ip4_entry_del_adj (e, adj->heap_handle);
1376 clib_warning ("Adjacency contains unknown ARP next hop %U (add)",
1377 format_ip46_address, &adj->arp.next_hop,
1380 arp_ip4_entry_add_adj (e, adj->heap_handle);
/*
 * Init function for the IPv4 ARP code, registered with VLIB_INIT_FUNCTION.
 *
 * Runs ethernet_init first, then registers arp_input_node for
 * ETHERNET_TYPE_ARP frames, installs the packet-generator header parser,
 * creates the opcode-name hash, the ARP entry hash and the two event
 * registration hashes, sets the default cache limit, adds a pcap
 * drop-trace filter per ARP error and finally registers the adjacency
 * add/delete callback.
 */
1385 static clib_error_t *
1386 ethernet_arp_init (vlib_main_t * vm)
1388 ethernet_arp_main_t *am = ðernet_arp_main;
1390 clib_error_t *error;
1391 ip4_main_t *im = &ip4_main;
1392 ip_lookup_main_t *lm = &im->lookup_main;
/* NOTE(review): presumably the error is returned on failure -- not visible. */
1394 if ((error = vlib_call_init_function (vm, ethernet_init)))
1397 ethernet_register_input_type (vm, ETHERNET_TYPE_ARP, arp_input_node.index);
/* Hook the ARP header parser into the packet generator for this node. */
1399 pn = pg_get_node (arp_input_node.index);
1400 pn->unformat_edit = unformat_pg_arp_header;
/* String-keyed hash filled with one entry per ARP opcode name. */
1402 am->opcode_by_name = hash_create_string (0, sizeof (uword));
1403 #define _(o) hash_set_mem (am->opcode_by_name, #o, ETHERNET_ARP_OPCODE_##o);
1404 foreach_ethernet_arp_opcode;
1407 mhash_init (&am->ip4_entry_by_key,
1408 /* value size */ sizeof (uword),
1409 /* key size */ sizeof (ethernet_arp_ip4_key_t));
1411 /* $$$ configurable */
1412 am->limit_arp_cache_size = 50000;
1414 am->pending_resolutions_by_address = hash_create (0, sizeof (uword));
1415 am->mac_changes_by_address = hash_create (0, sizeof (uword));
1417 /* don't trace ARP error packets */
1419 vlib_node_runtime_t *rt =
1420 vlib_node_get_runtime (vm, arp_input_node.index);
1423 vnet_pcap_drop_trace_filter_add_del \
1424 (rt->errors[ETHERNET_ARP_ERROR_##a], \
1426 foreach_ethernet_arp_error
/* Have the IPv4 lookup code report adjacency adds/deletes to ARP. */
1430 ip_register_add_del_adjacency_callback (lm, arp_add_del_adj_cb);
1435 VLIB_INIT_FUNCTION (ethernet_arp_init);
/*
 * Request removal of an ARP cache entry.
 *
 * The request is not executed here: sw_if_index, fib_index and a copy of
 * the address pair pointed to by a_arg are packed into an RPC argument
 * block and passed to vl_api_rpc_call_main_thread() together with
 * set_ip4_over_ethernet_rpc_callback.
 *
 * NOTE(review): other fields of args (for example a flag marking the
 * request as a removal) are presumably set on lines not visible in this
 * view -- confirm.  vnm is not used by the visible statements.
 */
1438 vnet_arp_unset_ip4_over_ethernet (vnet_main_t * vnm,
1439 u32 sw_if_index, u32 fib_index, void *a_arg)
1441 ethernet_arp_ip4_over_ethernet_address_t *a = a_arg;
1442 vnet_arp_set_ip4_over_ethernet_rpc_args_t args;
1444 args.sw_if_index = sw_if_index;
1445 args.fib_index = fib_index;
/* Copy by value: args is handed to the RPC layer as a flat byte buffer. */
1447 clib_memcpy (&args.a, a, sizeof (*a));
1449 vl_api_rpc_call_main_thread (set_ip4_over_ethernet_rpc_callback,
1450 (u8 *) & args, sizeof (args));
/*
 * Remove the ARP cache entry for (sw_if_index, a->ip4, fib_index).
 *
 * The entry is looked up in ip4_entry_by_key.  Before it is released, the
 * FIB is consulted for the address (with the default route disabled); if
 * the result is a rewrite adjacency the matching /32 neighbor route is
 * deleted.  The entry is then removed from the hash and returned to the
 * pool.
 *
 * NOTE(review): the handling of a failed hash lookup is not visible in
 * this view; presumably the function returns early when the key is
 * absent -- confirm.
 */
1455 vnet_arp_unset_ip4_over_ethernet_internal (vnet_main_t * vnm,
1457 u32 fib_index, void *a_arg)
1459 ethernet_arp_ip4_entry_t *e;
1460 ethernet_arp_main_t *am = ðernet_arp_main;
1461 ethernet_arp_ip4_over_ethernet_address_t *a = a_arg;
1462 ethernet_arp_ip4_key_t k;
1464 ip4_add_del_route_args_t args;
1465 ip4_main_t *im = &ip4_main;
1466 ip_lookup_main_t *lm = &im->lookup_main;
1468 ip_adjacency_t *adj;
/* Build the cache key and find the entry's pool index. */
1470 k.sw_if_index = sw_if_index;
1471 k.ip4_address = a->ip4;
1472 k.fib_index = fib_index;
1473 p = mhash_get (&am->ip4_entry_by_key, &k);
1477 memset (&args, 0, sizeof (args));
1480 * Make sure that the route actually exists before we try to delete it,
1481 * and make sure that it's a rewrite adjacency.
1483 * If we point 1-N unnumbered interfaces at a loopback interface and
1484 * shut down the loopback before shutting down 1-N unnumbered
1485 * interfaces, the ARP cache will still have an entry,
1486 * but the route will have disappeared.
1488 * See also ip4_del_interface_routes (...)
1489 * -> ip4_delete_matching_routes (...).
1492 adj_index = ip4_fib_lookup_with_table
1493 (im, fib_index, &a->ip4, 1 /* disable default route */ );
1495 /* Miss adj? Forget it... */
1496 if (adj_index != lm->miss_adj_index)
1498 adj = ip_get_adjacency (lm, adj_index);
1500 * Stupid control-plane trick:
1501 * admin down an interface (removes arp routes from fib),
1502 * bring the interface back up (does not reinstall them)
1503 * then remove the arp cache entry (yuck). When that happens,
1504 * the adj we find here will be the interface subnet ARP adj.
1506 if (adj->lookup_next_index == IP_LOOKUP_NEXT_REWRITE)
/* Delete the host (/32) neighbor route for this address. */
1508 args.table_index_or_table_id = fib_index;
1509 args.flags = IP4_ROUTE_FLAG_FIB_INDEX | IP4_ROUTE_FLAG_DEL
1510 | IP4_ROUTE_FLAG_NEIGHBOR;
1511 args.dst_address = a->ip4;
1512 args.dst_address_length = 32;
1513 ip4_add_del_route (im, &args);
1514 ip4_maybe_remap_adjacencies (im, fib_index, args.flags);
/* Drop the cache entry itself: unhash it, then release its pool slot. */
1518 e = pool_elt_at_index (am->ip4_entry_pool, p[0]);
1519 mhash_unset (&am->ip4_entry_by_key, &e->key, 0);
1520 pool_put (am->ip4_entry_pool, e);
/*
 * Advance both the IPv4 address and the Ethernet address held in *a.
 *
 * Each address is processed from its last byte towards its first: the byte
 * is incremented and compared with its previous value, which detects
 * whether the increment wrapped around to zero.
 *
 * NOTE(review): the statement executed when no wrap occurred is not
 * visible in this view; presumably it leaves the loop so that the carry
 * only propagates on overflow -- confirm.
 */
1525 increment_ip4_and_mac_address (ethernet_arp_ip4_over_ethernet_address_t * a)
/* IPv4 address: 4 bytes, last byte first. */
1530 for (i = 3; i >= 0; i--)
1532 old = a->ip4.as_u8[i];
1533 a->ip4.as_u8[i] += 1;
1534 if (old < a->ip4.as_u8[i])
/* Ethernet address: 6 bytes, last byte first. */
1538 for (i = 5; i >= 0; i--)
1540 old = a->ethernet[i];
1541 a->ethernet[i] += 1;
1542 if (old < a->ethernet[i])
/*
 * Add or delete a proxy ARP address range for a FIB.
 *
 * The proxy_arps vector is searched for an entry whose lo_addr, hi_addr
 * and fib_index all match exactly.  A found entry is removed on delete; a
 * delete request with no matching entry yields
 * VNET_API_ERROR_NO_SUCH_ENTRY; an add request with no matching entry
 * appends a new element.  Addresses are stored as the raw as_u32 value of
 * the arguments.
 *
 * NOTE(review): the is_del tests and the remaining return statements are
 * not visible in this view -- confirm the exact return values.
 */
1548 vnet_proxy_arp_add_del (ip4_address_t * lo_addr,
1549 ip4_address_t * hi_addr, u32 fib_index, int is_del)
1551 ethernet_arp_main_t *am = ðernet_arp_main;
1552 ethernet_proxy_arp_t *pa;
1553 u32 found_at_index = ~0;
/* Exact-match search; ~0 in found_at_index means "not found". */
1555 vec_foreach (pa, am->proxy_arps)
1557 if (pa->lo_addr == lo_addr->as_u32
1558 && pa->hi_addr == hi_addr->as_u32 && pa->fib_index == fib_index)
1560 found_at_index = pa - am->proxy_arps;
1565 if (found_at_index != ~0)
1567 /* Delete, otherwise it's already in the table */
1569 vec_delete (am->proxy_arps, 1, found_at_index);
1572 /* delete, no such entry */
1574 return VNET_API_ERROR_NO_SUCH_ENTRY;
1576 /* add, not in table */
1577 vec_add2 (am->proxy_arps, pa, 1);
1578 pa->lo_addr = lo_addr->as_u32;
1579 pa->hi_addr = hi_addr->as_u32;
1580 pa->fib_index = fib_index;
1585 * Remove any proxy arp entries associated with the
1589 vnet_proxy_arp_fib_reset (u32 fib_id)
1591 ip4_main_t *im = &ip4_main;
1592 ethernet_arp_main_t *am = ðernet_arp_main;
1593 ethernet_proxy_arp_t *pa;
1594 u32 *entries_to_delete = 0;
1599 p = hash_get (im->fib_index_by_table_id, fib_id);
1601 return VNET_API_ERROR_NO_SUCH_ENTRY;
1604 vec_foreach (pa, am->proxy_arps)
1606 if (pa->fib_index == fib_index)
1608 vec_add1 (entries_to_delete, pa - am->proxy_arps);
1612 for (i = 0; i < vec_len (entries_to_delete); i++)
1614 vec_delete (am->proxy_arps, 1, entries_to_delete[i]);
1617 vec_free (entries_to_delete);
/*
 * Create a "glean" ARP cache entry and a /32 neighbor route for next_hop.
 *
 * The FIB is consulted for next_hop; work continues only when the result
 * is an IP_LOOKUP_NEXT_ARP adjacency.  A new cache entry flagged
 * ETHERNET_ARP_IP4_ENTRY_FLAG_GLEAN is allocated, and a copy of the
 * adjacency with its ARP next hop set to next_hop is installed as a /32
 * neighbor route.  The value returned at the end is a fresh FIB lookup of
 * next_hop.
 *
 * NOTE(review): the early-exit statements (non-ARP adjacency, adjacency
 * that already has a next hop, key already present in the cache) are not
 * visible in this view -- confirm what each of them returns.
 */
1623 vnet_arp_glean_add (u32 fib_index, void *next_hop_arg)
1625 ethernet_arp_main_t *am = ðernet_arp_main;
1626 ip4_main_t *im = &ip4_main;
1627 ip_lookup_main_t *lm = &im->lookup_main;
1628 ip4_address_t *next_hop = next_hop_arg;
1629 ip_adjacency_t add_adj, *adj;
1630 ip4_add_del_route_args_t args;
1631 ethernet_arp_ip4_entry_t *e;
1632 ethernet_arp_ip4_key_t k;
1635 adj_index = ip4_fib_lookup_with_table (im, fib_index, next_hop, 0);
1636 adj = ip_get_adjacency (lm, adj_index);
1638 if (!adj || adj->lookup_next_index != IP_LOOKUP_NEXT_ARP)
1641 if (adj->arp.next_hop.ip4.as_u32 != 0)
/* Cache key: interface of the covering adjacency, this FIB, this address. */
1644 k.sw_if_index = adj->rewrite_header.sw_if_index;
1645 k.fib_index = fib_index;
1646 k.ip4_address.as_u32 = next_hop->as_u32;
1648 if (mhash_get (&am->ip4_entry_by_key, &k))
/* Allocate the entry and index it by key (value = pool index). */
1651 pool_get (am->ip4_entry_pool, e);
1652 mhash_set (&am->ip4_entry_by_key, &k, e - am->ip4_entry_pool,
1655 e->cpu_time_last_updated = clib_cpu_time_now ();
1656 e->flags = ETHERNET_ARP_IP4_ENTRY_FLAG_GLEAN;
/* Clone the covering adjacency and point its ARP next hop at next_hop. */
1658 memset (&args, 0, sizeof (args));
1659 clib_memcpy (&add_adj, adj, sizeof (add_adj));
1660 ip46_address_set_ip4 (&add_adj.arp.next_hop, next_hop); /* install neighbor /32 route */
1661 args.table_index_or_table_id = fib_index;
1663 IP4_ROUTE_FLAG_FIB_INDEX | IP4_ROUTE_FLAG_ADD | IP4_ROUTE_FLAG_NEIGHBOR;
1664 args.dst_address.as_u32 = next_hop->as_u32;
1665 args.dst_address_length = 32;
1666 args.adj_index = ~0;
1667 args.add_adj = &add_adj;
1669 ip4_add_del_route (im, &args);
/* Look the address up again so the caller gets the new route's result. */
1670 return ip4_fib_lookup_with_table (im, fib_index, next_hop, 0);
/*
 * Handler for the "set ip arp" debug CLI command.
 *
 * Parses, in any order: an "<interface> <ip4> <mac>" triple, "delete" or
 * "del", "static", "count <n>", "fib-id <id>" and
 * "proxy <lo-addr> - <hi-addr>".  An unknown fib-id produces an error.
 * The proxy form is passed to vnet_proxy_arp_add_del().  Otherwise the
 * add or delete is repeated count times, stepping the IPv4 and MAC
 * address with increment_ip4_and_mac_address() after each round.
 *
 * NOTE(review): the flag assignments, the branch choosing add versus
 * delete, and the condition guarding the final "unknown input" error are
 * not visible in this view -- confirm.
 */
1673 static clib_error_t *
1674 ip_arp_add_del_command_fn (vlib_main_t * vm,
1675 unformat_input_t * input, vlib_cli_command_t * cmd)
1677 vnet_main_t *vnm = vnet_get_main ();
1679 ethernet_arp_ip4_over_ethernet_address_t lo_addr, hi_addr, addr;
1688 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1690 /* set ip arp TenGigE1/1/0/1 1.2.3.4 aa:bb:... or aabb.ccdd... */
1691 if (unformat (input, "%U %U %U",
1692 unformat_vnet_sw_interface, vnm, &sw_if_index,
1693 unformat_ip4_address, &addr.ip4,
1694 unformat_ethernet_address, &addr.ethernet))
1697 else if (unformat (input, "delete") || unformat (input, "del"))
1700 else if (unformat (input, "static"))
1703 else if (unformat (input, "count %d", &count))
1706 else if (unformat (input, "fib-id %d", &fib_id))
/* Translate the user-visible table id into a FIB index. */
1708 ip4_main_t *im = &ip4_main;
1709 uword *p = hash_get (im->fib_index_by_table_id, fib_id);
1711 return clib_error_return (0, "fib ID %d doesn't exist\n", fib_id);
1715 else if (unformat (input, "proxy %U - %U",
1716 unformat_ip4_address, &lo_addr.ip4,
1717 unformat_ip4_address, &hi_addr.ip4))
/* The proxy add/del result is deliberately discarded. */
1725 (void) vnet_proxy_arp_add_del (&lo_addr.ip4, &hi_addr.ip4,
1734 for (i = 0; i < count; i++)
1738 uword event_type, *event_data = 0;
1740 /* Park the debug CLI until the arp entry is installed */
1741 vnet_register_ip4_arp_resolution_event
1742 (vnm, &addr.ip4, vlib_current_process (vm),
1743 1 /* type */ , 0 /* data */ );
1745 vnet_arp_set_ip4_over_ethernet
1746 (vnm, sw_if_index, fib_index, &addr, is_static);
/* Block this CLI process until the resolution event (type 1) arrives. */
1748 vlib_process_wait_for_event (vm);
1749 event_type = vlib_process_get_events (vm, &event_data);
1750 vec_reset_length (event_data);
1751 if (event_type != 1)
1752 clib_warning ("event type %d unexpected", event_type);
1755 vnet_arp_unset_ip4_over_ethernet
1756 (vnm, sw_if_index, fib_index, &addr);
/* Step to the next IP/MAC pair for the following iteration. */
1758 increment_ip4_and_mac_address (&addr);
1763 return clib_error_return (0, "unknown input `%U'",
1764 format_unformat_error, input);
/* CLI registration: binds "set ip arp" to ip_arp_add_del_command_fn. */
1771 VLIB_CLI_COMMAND (ip_arp_add_del_command, static) = {
1772 .path = "set ip arp",
1774 "set ip arp [del] <intfc> <ip-address> <mac-address> [static] [count <count>] [fib-id <fib-id>] [proxy <lo-addr> - <hi-addr>]",
1775 .function = ip_arp_add_del_command_fn,
/*
 * Handler for the "set interface proxy-arp" debug CLI command.
 *
 * Parses an interface name plus "enable"/"on" or "disable"/"off", then
 * sets or clears VNET_SW_INTERFACE_FLAG_PROXY_ARP in the flags of the
 * selected software interface.
 *
 * NOTE(review): the enable/disable variable, the test that picks between
 * setting and clearing the flag, and any check that an interface was
 * actually supplied are not visible in this view -- confirm.
 */
1779 static clib_error_t *
1780 set_int_proxy_arp_command_fn (vlib_main_t * vm,
1781 unformat_input_t * input,
1782 vlib_cli_command_t * cmd)
1784 vnet_main_t *vnm = vnet_get_main ();
1786 vnet_sw_interface_t *si;
1790 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1792 if (unformat (input, "%U", unformat_vnet_sw_interface,
1795 else if (unformat (input, "enable") || unformat (input, "on"))
1797 else if (unformat (input, "disable") || unformat (input, "off"))
1804 return clib_error_return (0, "unknown input '%U'",
1805 format_unformat_error, input);
1807 si = vnet_get_sw_interface (vnm, sw_if_index);
/* Enable path sets the proxy-ARP flag ... */
1810 si->flags |= VNET_SW_INTERFACE_FLAG_PROXY_ARP;
/* ... disable path clears it. */
1812 si->flags &= ~VNET_SW_INTERFACE_FLAG_PROXY_ARP;
/*
 * CLI registration: binds "set interface proxy-arp" to
 * set_int_proxy_arp_command_fn.
 */
1818 VLIB_CLI_COMMAND (set_int_proxy_enable_command, static) = {
1819 .path = "set interface proxy-arp",
1821 "set interface proxy-arp <intfc> [enable|disable]",
1822 .function = set_int_proxy_arp_command_fn,
1828 * ARP Termination in a L2 Bridge Domain based on an
1829 * IP4 to MAC hash table mac_by_ip4 for each BD.
/* Next-node slot that the arp-term-l2bd node maps to "l2-output". */
1833 ARP_TERM_NEXT_L2_OUTPUT,
/*
 * Next-node index table for the L2 feature bitmap: filled in by
 * feat_bitmap_init_next_nodes() in arp_term_init() and consulted through
 * feat_bitmap_get_next_node_index() in arp_term_l2bd().
 * NOTE(review): presumably one slot per feature bit of a 32-bit bitmap --
 * confirm.
 */
1838 u32 arp_term_next_node_index[32];
/*
 * Node function for "arp-term-l2bd": ARP termination inside an L2 bridge
 * domain.
 *
 * For each buffer in the frame the ARP header is located behind the L2
 * header.  Buffers that are not ARP requests go on to the next L2
 * feature.  For ARP requests the target IPv4 address is looked up in the
 * bridge domain's mac_by_ip4 table; on a hit the request is rewritten in
 * place into an ARP reply and sent back towards the input interface, on a
 * miss the buffer goes on to the next L2 feature.  Registered listeners in
 * mac_changes are notified about the request's sender addresses.
 *
 * Returns the number of vectors in the incoming frame.
 *
 * NOTE(review): labels, several condition lines and local declarations
 * are not visible in this view; the comments below describe only the
 * visible statements.
 */
1841 arp_term_l2bd (vlib_main_t * vm,
1842 vlib_node_runtime_t * node, vlib_frame_t * frame)
1844 l2input_main_t *l2im = &l2input_main;
1845 u32 n_left_from, next_index, *from, *to_next;
1846 u32 n_replies_sent = 0;
1847 u16 last_bd_index = ~0;
1848 l2_bridge_domain_t *last_bd_config = 0;
1849 l2_input_config_t *cfg0;
1851 from = vlib_frame_vector_args (frame);
1852 n_left_from = frame->n_vectors;
1853 next_index = node->cached_next_index;
1855 while (n_left_from > 0)
1859 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
1861 while (n_left_from > 0 && n_left_to_next > 0)
1864 ethernet_header_t *eth0;
1865 ethernet_arp_header_t *arp0;
1867 u32 pi0, error0, next0, sw_if_index0;
1878 n_left_to_next -= 1;
/*
 * The L3 (ARP) header starts l2.l2_len bytes after the Ethernet header;
 * the ethertype is read from the two bytes immediately before it.
 */
1880 p0 = vlib_get_buffer (vm, pi0);
1881 eth0 = vlib_buffer_get_current (p0);
1882 l3h0 = (u8 *) eth0 + vnet_buffer (p0)->l2.l2_len;
1883 ethertype0 = clib_net_to_host_u16 (*(u16 *) (l3h0 - 2));
1884 arp0 = (ethernet_arp_header_t *) l3h0;
/* Record the raw L3 header bytes when both node and buffer are traced. */
1886 if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE) &&
1887 (p0->flags & VLIB_BUFFER_IS_TRACED)))
1889 u8 *t0 = vlib_add_trace (vm, node, p0,
1890 sizeof (ethernet_arp_input_trace_t));
1891 clib_memcpy (t0, l3h0, sizeof (ethernet_arp_input_trace_t));
/*
 * Anything that is not an ARP request is left to the next L2 feature.
 * NOTE(review): the opcode operand of this test is not visible here.
 */
1894 if (PREDICT_FALSE ((ethertype0 != ETHERNET_TYPE_ARP) ||
1896 clib_host_to_net_u16
1897 (ETHERNET_ARP_OPCODE_request))))
1898 goto next_l2_feature;
/* error0 starts as "replies_sent" and is replaced by the checks below. */
1900 error0 = ETHERNET_ARP_ERROR_replies_sent;
1903 clib_net_to_host_u16 (ETHERNET_ARP_HARDWARE_TYPE_ethernet) ?
1904 ETHERNET_ARP_ERROR_l2_type_not_ethernet : error0);
1907 clib_net_to_host_u16 (ETHERNET_TYPE_IP4) ?
1908 ETHERNET_ARP_ERROR_l3_type_not_ip4 : error0);
1910 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
1915 // Trash ARP packets whose ARP-level source addresses do not
1916 // match their L2-frame-level source addresses */
1919 (eth0->src_address, arp0->ip4_over_ethernet[0].ethernet,
1920 sizeof (eth0->src_address))))
1922 error0 = ETHERNET_ARP_ERROR_l2_address_mismatch;
1926 // Check if anyone wants ARP request events for L2 BDs
1928 pending_resolution_t *mc;
1929 ethernet_arp_main_t *am = ðernet_arp_main;
1930 uword *p = hash_get (am->mac_changes_by_address, 0);
1931 if (p && (vnet_buffer (p0)->l2.shg == 0))
1932 { // Only SHG 0 interface which is more likely local
/* Walk the chain of registrations linked through mc->next_index. */
1933 u32 next_index = p[0];
1934 while (next_index != (u32) ~ 0)
1936 int (*fp) (u32, u8 *, u32, u32);
1938 mc = pool_elt_at_index (am->mac_changes, next_index);
1939 fp = mc->data_callback;
1940 // Call the callback, return 1 to suppress dup events */
1942 rv = (*fp) (mc->data,
1943 arp0->ip4_over_ethernet[0].ethernet,
1945 arp0->ip4_over_ethernet[0].ip4.as_u32);
1946 // Signal the resolver process
1948 vlib_process_signal_event (vm, mc->node_index,
1949 mc->type_opaque, mc->data);
1950 next_index = mc->next_index;
1955 // lookup BD mac_by_ip4 hash table for MAC entry
1956 ip0 = arp0->ip4_over_ethernet[1].ip4.as_u32;
1957 bd_index0 = vnet_buffer (p0)->l2.bd_index;
/* Re-fetch the bridge-domain config only when the BD index changes. */
1958 if (PREDICT_FALSE ((bd_index0 != last_bd_index)
1959 || (last_bd_index == (u16) ~ 0)))
1961 last_bd_index = bd_index0;
1962 last_bd_config = vec_elt_at_index (l2im->bd_configs, bd_index0);
1964 macp0 = (u8 *) hash_get (last_bd_config->mac_by_ip4, ip0);
1966 if (PREDICT_FALSE (!macp0))
1967 goto next_l2_feature; // MAC not found
1969 // MAC found, send ARP reply -
1970 // Convert ARP request packet to ARP reply
/*
 * The requester's address pair moves to slot [1]; slot [0] receives the
 * looked-up IP and MAC.  The Ethernet header is turned around the same way.
 */
1971 arp0->opcode = clib_host_to_net_u16 (ETHERNET_ARP_OPCODE_reply);
1972 arp0->ip4_over_ethernet[1] = arp0->ip4_over_ethernet[0];
1973 arp0->ip4_over_ethernet[0].ip4.as_u32 = ip0;
1974 clib_memcpy (arp0->ip4_over_ethernet[0].ethernet, macp0, 6);
1975 clib_memcpy (eth0->dst_address, eth0->src_address, 6);
1976 clib_memcpy (eth0->src_address, macp0, 6);
1977 n_replies_sent += 1;
1979 // For BVI, need to use l2-fwd node to send ARP reply as
1980 // l2-output node cannot output packet to BVI properly
1981 cfg0 = vec_elt_at_index (l2im->configs, sw_if_index0);
1982 if (PREDICT_FALSE (cfg0->bvi))
1984 vnet_buffer (p0)->l2.feature_bitmap |= L2INPUT_FEAT_FWD;
1985 vnet_buffer (p0)->sw_if_index[VLIB_RX] = 0;
1986 goto next_l2_feature;
1989 // Send ARP reply back out input interface through l2-output
1990 vnet_buffer (p0)->sw_if_index[VLIB_TX] = sw_if_index0;
1991 next0 = ARP_TERM_NEXT_L2_OUTPUT;
1992 // Note that output to VXLAN tunnel will fail due to SHG which
1993 // is probably desirable since ARP termination is not intended
1994 // for ARP requests from other hosts. If output to VXLAN tunnel is
1995 // required, however, can just clear the SHG in packet as follows:
1996 // vnet_buffer(p0)->l2.shg = 0;
1998 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
1999 n_left_to_next, pi0, next0);
/*
 * Next-L2-feature path: clear the ARP termination bit and let the feature
 * bitmap choose the next node.
 */
2004 u32 feature_bitmap0 =
2005 vnet_buffer (p0)->l2.feature_bitmap & ~L2INPUT_FEAT_ARP_TERM;
2006 vnet_buffer (p0)->l2.feature_bitmap = feature_bitmap0;
2007 next0 = feat_bitmap_get_next_node_index (arp_term_next_node_index,
2009 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
2010 n_left_to_next, pi0, next0);
/*
 * Drop path: a zero sender IP, or a sender IP equal to the target IP, is
 * counted as a gratuitous ARP; the buffer is dropped with error0 attached.
 */
2015 if (0 == arp0->ip4_over_ethernet[0].ip4.as_u32 ||
2016 (arp0->ip4_over_ethernet[0].ip4.as_u32 ==
2017 arp0->ip4_over_ethernet[1].ip4.as_u32))
2019 error0 = ETHERNET_ARP_ERROR_gratuitous_arp;
2021 next0 = ARP_TERM_NEXT_DROP;
2022 p0->error = node->errors[error0];
2024 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
2025 n_left_to_next, pi0, next0);
2028 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
/* Account for all replies generated while processing this frame. */
2031 vlib_error_count (vm, node->node_index,
2032 ETHERNET_ARP_ERROR_replies_sent, n_replies_sent);
2033 return frame->n_vectors;
/*
 * Graph node registration for "arp-term-l2bd".  The node shares the ARP
 * error strings and trace/buffer formatters, and has two named next nodes:
 * "l2-output" and "error-drop".
 */
2037 VLIB_REGISTER_NODE (arp_term_l2bd_node, static) = {
2038 .function = arp_term_l2bd,
2039 .name = "arp-term-l2bd",
2040 .vector_size = sizeof (u32),
2041 .n_errors = ETHERNET_ARP_N_ERROR,
2042 .error_strings = ethernet_arp_error_strings,
2043 .n_next_nodes = ARP_TERM_N_NEXT,
2045 [ARP_TERM_NEXT_L2_OUTPUT] = "l2-output",
2046 [ARP_TERM_NEXT_DROP] = "error-drop",
2048 .format_buffer = format_ethernet_arp_header,
2049 .format_trace = format_ethernet_arp_input_trace,
/*
 * Init function for ARP termination, registered with VLIB_INIT_FUNCTION.
 * Populates arp_term_next_node_index for the arp-term-l2bd node from the
 * L2 input feature names.
 */
2054 arp_term_init (vlib_main_t * vm)
2055 { // Initialize the feature next-node indexes
2056 feat_bitmap_init_next_nodes (vm,
2057 arp_term_l2bd_node.index,
2059 l2input_get_feat_names (),
2060 arp_term_next_node_index);
2064 VLIB_INIT_FUNCTION (arp_term_init);
2067 * fd.io coding-style-patch-verification: ON
2070 * eval: (c-set-style "gnu")