2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 * ethernet_interface.c: ethernet interfaces
18 * Copyright (c) 2008 Eliot Dresselhaus
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
40 #include <vnet/vnet.h>
41 #include <vnet/ip/ip.h>
42 #include <vnet/pg/pg.h>
43 #include <vnet/ethernet/ethernet.h>
44 //#include <vnet/ethernet/arp.h>
45 #include <vnet/l2/l2_input.h>
46 #include <vnet/l2/l2_bd.h>
47 #include <vnet/adj/adj.h>
48 #include <vnet/adj/adj_mcast.h>
49 #include <vnet/ip-neighbor/ip_neighbor.h>
53 * @brief Loopback Interfaces.
55 * This file contains code to manage loopback interfaces.
/*
 * Return a pointer to a static 6-byte table holding the IPv4 multicast
 * destination MAC prefix 01:00:5e with the remaining three bytes zero.
 */
59 ethernet_ip4_mcast_dst_addr (void)
61 const static u8 ethernet_mcast_dst_mac[] = {
62 0x1, 0x0, 0x5e, 0x0, 0x0, 0x0,
65 return (ethernet_mcast_dst_mac);
/*
 * Return a pointer to a static 6-byte table holding the IPv6 multicast
 * destination MAC prefix 33:33 with the remaining four bytes zero.
 */
69 ethernet_ip6_mcast_dst_addr (void)
71 const static u8 ethernet_mcast_dst_mac[] = {
72 0x33, 0x33, 0x00, 0x0, 0x0, 0x0,
75 return (ethernet_mcast_dst_mac);
79 * @brief build a rewrite string to use for sending packets of type 'link_type'
/*
 * Build the Ethernet rewrite vector used to send packets of 'link_type'
 * out of sw_if_index.
 *
 * The vector starts as a bare ethernet header (n_bytes = sizeof (h[0]))
 * and grows by one or two ethernet_vlan_header_t for one_tag / two_tags
 * sub-interfaces. The source MAC is copied from the ethernet interface
 * found via hw->hw_instance; the destination MAC comes from the P2P
 * client MAC, from dst_address, or is set to broadcast.
 *
 * NOTE(review): is_p2p is assigned on lines not visible here; presumably
 * it is set inside the P2P/PIPE type check - confirm.
 */
83 ethernet_build_rewrite (vnet_main_t * vnm,
85 vnet_link_t link_type, const void *dst_address)
87 vnet_sw_interface_t *sub_sw = vnet_get_sw_interface (vnm, sw_if_index);
88 vnet_sw_interface_t *sup_sw = vnet_get_sup_sw_interface (vnm, sw_if_index);
89 vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
90 ethernet_main_t *em = &ethernet_main;
91 ethernet_interface_t *ei;
94 uword n_bytes = sizeof (h[0]);
98 if ((sub_sw->type == VNET_SW_INTERFACE_TYPE_P2P) ||
99 (sub_sw->type == VNET_SW_INTERFACE_TYPE_PIPE))
/* Sub-interface (differs from its super interface): size the VLAN tags. */
101 if (sub_sw != sup_sw)
103 if (sub_sw->sub.eth.flags.one_tag)
105 n_bytes += sizeof (ethernet_vlan_header_t);
107 else if (sub_sw->sub.eth.flags.two_tags)
109 n_bytes += 2 * (sizeof (ethernet_vlan_header_t));
111 else if (PREDICT_FALSE (is_p2p))
113 n_bytes = sizeof (ethernet_header_t);
115 if (PREDICT_FALSE (!is_p2p))
117 // Check for encaps that are not supported for L3 interfaces
118 if (!(sub_sw->sub.eth.flags.exact_match) ||
119 (sub_sw->sub.eth.flags.default_sub) ||
120 (sub_sw->sub.eth.flags.outer_vlan_id_any) ||
121 (sub_sw->sub.eth.flags.inner_vlan_id_any))
128 n_bytes = sizeof (ethernet_header_t);
/* Map the VNET_LINK_* value onto the matching ETHERNET_TYPE_* value. */
134 #define _(a,b) case VNET_LINK_##a: type = ETHERNET_TYPE_##b; break
/* Allocate the rewrite and fill in the source MAC of the interface. */
144 vec_validate (rewrite, n_bytes - 1);
145 h = (ethernet_header_t *) rewrite;
146 ei = pool_elt_at_index (em->interfaces, hw->hw_instance);
147 clib_memcpy (h->src_address, &ei->address, sizeof (h->src_address));
150 clib_memcpy (h->dst_address, sub_sw->p2p.client_mac,
151 sizeof (h->dst_address));
156 clib_memcpy (h->dst_address, dst_address, sizeof (h->dst_address));
158 clib_memset (h->dst_address, ~0, sizeof (h->dst_address)); /* broadcast */
/* Single tag: the outer VLAN header directly follows the ethernet header. */
161 if (PREDICT_FALSE (!is_p2p) && sub_sw->sub.eth.flags.one_tag)
163 ethernet_vlan_header_t *outer = (void *) (h + 1);
165 h->type = sub_sw->sub.eth.flags.dot1ad ?
166 clib_host_to_net_u16 (ETHERNET_TYPE_DOT1AD) :
167 clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
168 outer->priority_cfi_and_id =
169 clib_host_to_net_u16 (sub_sw->sub.eth.outer_vlan_id);
170 outer->type = clib_host_to_net_u16 (type);
/* Two tags: outer header then inner header; the inner carries the payload type. */
173 else if (PREDICT_FALSE (!is_p2p) && sub_sw->sub.eth.flags.two_tags)
175 ethernet_vlan_header_t *outer = (void *) (h + 1);
176 ethernet_vlan_header_t *inner = (void *) (outer + 1);
178 h->type = sub_sw->sub.eth.flags.dot1ad ?
179 clib_host_to_net_u16 (ETHERNET_TYPE_DOT1AD) :
180 clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
181 outer->priority_cfi_and_id =
182 clib_host_to_net_u16 (sub_sw->sub.eth.outer_vlan_id);
183 outer->type = clib_host_to_net_u16 (ETHERNET_TYPE_VLAN);
184 inner->priority_cfi_and_id =
185 clib_host_to_net_u16 (sub_sw->sub.eth.inner_vlan_id);
186 inner->type = clib_host_to_net_u16 (type);
/* Untagged: the ethernet header carries the payload type directly. */
191 h->type = clib_host_to_net_u16 (type);
/*
 * Update the rewrite of adjacency 'ai' on sw_if_index.
 *
 * P2P and PIPE interfaces are handed to default_update_adjacency().
 * Otherwise the action depends on adj->lookup_next_index: glean
 * adjacencies get their rewrite refreshed, ARP/REWRITE adjacencies are
 * passed to ip_neighbor_update(), broadcast adjacencies get a complete
 * broadcast rewrite, and multicast adjacencies get a partial rewrite
 * built from the fixed IPv4/IPv6 multicast MAC prefix.
 */
198 ethernet_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
200 vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
202 if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
203 (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
205 default_update_adjacency (vnm, sw_if_index, ai);
213 switch (adj->lookup_next_index)
215 case IP_LOOKUP_NEXT_GLEAN:
216 adj_glean_update_rewrite (ai);
218 case IP_LOOKUP_NEXT_ARP:
219 case IP_LOOKUP_NEXT_REWRITE:
220 ip_neighbor_update (vnm, ai);
222 case IP_LOOKUP_NEXT_BCAST:
223 adj_nbr_update_rewrite (ai,
224 ADJ_NBR_REWRITE_FLAG_COMPLETE,
225 ethernet_build_rewrite
227 adj->rewrite_header.sw_if_index,
229 VNET_REWRITE_FOR_SW_INTERFACE_ADDRESS_BROADCAST));
231 case IP_LOOKUP_NEXT_MCAST:
234 * Construct a partial rewrite from the known ethernet mcast dest MAC
239 rewrite = ethernet_build_rewrite
243 (adj->ia_nh_proto == FIB_PROTOCOL_IP6 ?
244 ethernet_ip6_mcast_dst_addr () :
245 ethernet_ip4_mcast_dst_addr ()));
248 * Complete the remaining fields of the adj's rewrite to direct the
249 * complete of the rewrite at switch time by copying in the IP
250 * dst address's bytes.
251 * Ofset is 2 bytes into the destintation address.
/* The offset is measured back from the end of the rewrite vector. */
253 offset = vec_len (rewrite) - 2;
254 adj_mcast_update_rewrite (ai, rewrite, offset);
/* The remaining next-index values share one case group; its body is not visible here. */
258 case IP_LOOKUP_NEXT_DROP:
259 case IP_LOOKUP_NEXT_PUNT:
260 case IP_LOOKUP_NEXT_LOCAL:
261 case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
262 case IP_LOOKUP_NEXT_MIDCHAIN:
263 case IP_LOOKUP_NEXT_ICMP_ERROR:
264 case IP_LOOKUP_N_NEXT:
/*
 * Copy the MAC address 'mac' into dst->mac (sizeof (dst->mac) bytes).
 * NOTE(review): the existing note below says the trailing two bytes must
 * be zero; the statement that clears them is not visible here - confirm.
 */
272 ethernet_interface_address_copy (ethernet_interface_address_t * dst,
275 clib_memcpy (&dst->mac, (u8 *) mac, sizeof (dst->mac));
277 * ethernet dataplane loads mac as u64, makes sure the last 2 bytes are 0
278 * for comparison purpose
/*
 * Store mac_address in both places that track it: the hardware
 * interface's hw_address vector (grown to sizeof (mac_address_t) if
 * needed) and the ethernet interface's address field.
 */
284 ethernet_set_mac (vnet_hw_interface_t * hi, ethernet_interface_t * ei,
285 const u8 * mac_address)
287 vec_validate (hi->hw_address, sizeof (mac_address_t) - 1);
288 clib_memcpy (hi->hw_address, mac_address, sizeof (mac_address_t));
289 ethernet_interface_address_copy (&ei->address, mac_address);
/*
 * Hardware-class MAC change handler: record the new MAC on the ethernet
 * interface, then invoke every registered address-change callback for the
 * main interface and for each sub-interface listed in
 * hi->sub_interface_sw_if_index_by_id. old_address is not used in the
 * visible lines.
 */
292 static clib_error_t *
293 ethernet_mac_change (vnet_hw_interface_t * hi,
294 const u8 * old_address, const u8 * mac_address)
296 ethernet_interface_t *ei;
300 ei = pool_elt_at_index (em->interfaces, hi->hw_instance);
302 ethernet_set_mac (hi, ei, mac_address);
305 ethernet_address_change_ctx_t *cb;
/* Notify each callback for the main interface, then for every sub-interface. */
307 vec_foreach (cb, em->address_change_callbacks)
309 cb->function (em, hi->sw_if_index, cb->function_opaque);
310 /* clang-format off */
311 hash_foreach (id, sw_if_index, hi->sub_interface_sw_if_index_by_id,
313 cb->function (em, sw_if_index, cb->function_opaque);
315 /* clang-format on */
/*
 * Hardware-class max-frame-size handler: forward the request to the
 * driver's set_max_frame_size callback when one is registered, otherwise
 * report VNET_ERR_UNSUPPORTED.
 */
322 static clib_error_t *
323 ethernet_set_max_frame_size (vnet_main_t *vnm, vnet_hw_interface_t *hi,
326 ethernet_interface_t *ei =
327 pool_elt_at_index (ethernet_main.interfaces, hi->hw_instance);
/* Driver-provided callback takes precedence when present. */
329 if (ei->cb.set_max_frame_size)
330 return ei->cb.set_max_frame_size (vnm, hi, frame_size);
333 VNET_ERR_UNSUPPORTED,
334 "underlying driver doesn't support changing Max Frame Size");
/*
 * Ethernet hardware interface class: wires the ethernet format/unformat
 * helpers and the rewrite, adjacency, MAC-change and max-frame-size
 * handlers into the interface layer.
 */
337 VNET_HW_INTERFACE_CLASS (ethernet_hw_interface_class) = {
339 .tx_hash_fn_type = VNET_HASH_FN_TYPE_ETHERNET,
340 .format_address = format_ethernet_address,
341 .format_header = format_ethernet_header_with_length,
342 .unformat_hw_address = unformat_ethernet_address,
343 .unformat_header = unformat_ethernet_header,
344 .build_rewrite = ethernet_build_rewrite,
345 .update_adjacency = ethernet_update_adjacency,
346 .mac_addr_change_function = ethernet_mac_change,
347 .set_max_frame_size = ethernet_set_max_frame_size,
/*
 * unformat helper: parse a hardware interface name and, on success, store
 * its hw_if_index in the u32 result pointer taken from the va_list.
 * Arguments pulled from 'args' are a vnet_main_t pointer followed by a
 * u32 pointer. The interface is also looked up with
 * ethernet_get_interface(); how that result is checked is not visible
 * here.
 */
351 unformat_ethernet_interface (unformat_input_t * input, va_list * args)
353 vnet_main_t *vnm = va_arg (*args, vnet_main_t *);
354 u32 *result = va_arg (*args, u32 *);
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
356 ethernet_main_t *em = &ethernet_main;
357 ethernet_interface_t *eif;
359 if (!unformat_user (input, unformat_vnet_hw_interface, vnm, &hw_if_index))
362 eif = ethernet_get_interface (em, hw_if_index);
365 *result = hw_if_index;
/*
 * Register a new ethernet interface described by 'r'.
 *
 * Allocates an ethernet_interface_t from em->interfaces, copies the
 * driver callbacks, registers the hardware interface with the ethernet
 * hw class, sets up the output node, initialises frame size limits and
 * the software MTU, and programs the MAC address from r->address.
 */
372 vnet_eth_register_interface (vnet_main_t *vnm,
373 vnet_eth_interface_registration_t *r)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
375 ethernet_main_t *em = &ethernet_main;
376 ethernet_interface_t *ei;
377 vnet_hw_interface_t *hi;
380 pool_get (em->interfaces, ei);
381 clib_memcpy (&ei->cb, &r->cb, sizeof (vnet_eth_if_callbacks_t));
/* The pool index of 'ei' becomes the hw_instance of the new interface. */
383 hw_if_index = vnet_register_interface (
384 vnm, r->dev_class_index, r->dev_instance,
385 ethernet_hw_interface_class.index, ei - em->interfaces);
387 hi = vnet_get_hw_interface (vnm, hw_if_index);
389 ethernet_setup_node (vnm->vlib_main, hi->output_node_index);
391 hi->min_frame_size = ETHERNET_MIN_PACKET_BYTES;
/* Overhead expression: ethernet header plus room for two VLAN tags. */
395 sizeof (ethernet_header_t) + 2 * sizeof (ethernet_vlan_header_t);
/* A zero r->max_frame_size falls back to default MTU plus frame overhead. */
396 hi->max_frame_size = r->max_frame_size ?
398 ethernet_main.default_mtu + hi->frame_overhead;
401 /* Default ethernet MTU, 9000 unless set by ethernet_config see below */
402 vnet_sw_interface_set_mtu (vnm, hi->sw_if_index, em->default_mtu);
404 ethernet_set_mac (hi, ei, r->address);
/*
 * Delete the ethernet interface behind hw_if_index.
 *
 * Releases the dot1q and dot1ad VLAN tables of the main interface
 * (including any per-VLAN qinq tables), deletes the hardware interface,
 * and finally returns the ethernet_interface_t to em->interfaces.
 */
409 ethernet_delete_interface (vnet_main_t * vnm, u32 hw_if_index)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
411 ethernet_main_t *em = &ethernet_main;
412 ethernet_interface_t *ei;
413 vnet_hw_interface_t *hi;
414 main_intf_t *main_intf;
415 vlan_table_t *vlan_table;
418 hi = vnet_get_hw_interface (vnm, hw_if_index);
419 ei = pool_elt_at_index (em->interfaces, hi->hw_instance);
421 /* Delete vlan mapping table for dot1q and dot1ad. */
422 main_intf = vec_elt_at_index (em->main_intfs, hi->hw_if_index);
/* A table index of 0 is treated as "no table allocated". */
423 if (main_intf->dot1q_vlans)
425 vlan_table = vec_elt_at_index (em->vlan_pool, main_intf->dot1q_vlans);
426 for (idx = 0; idx < ETHERNET_N_VLAN; idx++)
428 if (vlan_table->vlans[idx].qinqs)
430 pool_put_index (em->qinq_pool, vlan_table->vlans[idx].qinqs);
431 vlan_table->vlans[idx].qinqs = 0;
434 pool_put_index (em->vlan_pool, main_intf->dot1q_vlans);
435 main_intf->dot1q_vlans = 0;
/* Same teardown for the dot1ad table. */
437 if (main_intf->dot1ad_vlans)
439 vlan_table = vec_elt_at_index (em->vlan_pool, main_intf->dot1ad_vlans);
440 for (idx = 0; idx < ETHERNET_N_VLAN; idx++)
442 if (vlan_table->vlans[idx].qinqs)
444 pool_put_index (em->qinq_pool, vlan_table->vlans[idx].qinqs);
445 vlan_table->vlans[idx].qinqs = 0;
448 pool_put_index (em->vlan_pool, main_intf->dot1ad_vlans);
449 main_intf->dot1ad_vlans = 0;
452 vnet_delete_hw_interface (vnm, hw_if_index);
453 pool_put (em->interfaces, ei);
/*
 * Apply an ethernet flag operation to the interface behind hw_if_index.
 *
 * Only the bits in ETHERNET_INTERFACE_FLAGS_SET_OPN_MASK are taken from
 * 'flags'; existing status bits in ei->flags are preserved. When the
 * driver registered a flag_change callback the operation is forwarded to
 * it and the L3 status bit is updated according to the outcome.
 */
457 ethernet_set_flags (vnet_main_t * vnm, u32 hw_if_index, u32 flags)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
459 ethernet_main_t *em = &ethernet_main;
460 vnet_hw_interface_t *hi;
461 ethernet_interface_t *ei;
462 u32 opn_flags = flags & ETHERNET_INTERFACE_FLAGS_SET_OPN_MASK;
464 hi = vnet_get_hw_interface (vnm, hw_if_index);
466 ASSERT (hi->hw_class_index == ethernet_hw_interface_class.index);
468 ei = pool_elt_at_index (em->interfaces, hi->hw_instance);
470 /* preserve status bits and update last set operation bits */
471 ei->flags = (ei->flags & ETHERNET_INTERFACE_FLAGS_STATUS_MASK) | opn_flags;
473 if (ei->cb.flag_change)
477 case ETHERNET_INTERFACE_FLAG_DEFAULT_L3:
/* The driver is only asked for L3 mode when it advertises MAC filtering. */
478 if (hi->caps & VNET_HW_IF_CAP_MAC_FILTER)
480 if (ei->cb.flag_change (vnm, hi, opn_flags) != ~0)
482 ei->flags |= ETHERNET_INTERFACE_FLAG_STATUS_L3;
485 ei->flags &= ~ETHERNET_INTERFACE_FLAG_STATUS_L3;
489 case ETHERNET_INTERFACE_FLAG_ACCEPT_ALL:
490 ei->flags &= ~ETHERNET_INTERFACE_FLAG_STATUS_L3;
491 return ei->cb.flag_change (vnm, hi, opn_flags);
500 * Echo packets back to ethernet/l2-input.
/*
 * TX function of the simulated (loopback) ethernet device.
 *
 * Every buffer in the frame is turned around: its RX sw_if_index becomes
 * the interface it was transmitted on, its TX sw_if_index becomes
 * L2INPUT_BVI for a BVI or ~0 otherwise, and it is enqueued to the
 * L2_INPUT next when the interface is bridged or to the ETHERNET_INPUT
 * next otherwise. The interface TX combined counter is incremented for
 * each packet. Returns frame->n_vectors.
 *
 * The l2 input config is cached for the most recently seen interface and
 * only looked up again when a buffer's TX sw_if_index differs from it.
 */
503 simulated_ethernet_interface_tx (vlib_main_t * vm,
504 vlib_node_runtime_t *
505 node, vlib_frame_t * frame)
507 u32 n_left_from, *from;
510 u32 thread_index = vm->thread_index;
511 vnet_main_t *vnm = vnet_get_main ();
512 vnet_interface_main_t *im = &vnm->interface_main;
513 l2_input_config_t *config;
514 vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b;
515 u16 nexts[VLIB_FRAME_SIZE], *next;
516 u32 new_rx_sw_if_index = ~0;
517 u32 new_tx_sw_if_index = ~0;
519 n_left_from = frame->n_vectors;
520 from = vlib_frame_vector_args (frame);
522 vlib_get_buffers (vm, from, bufs, n_left_from);
526 /* Ordinarily, this is the only config lookup. */
527 config = l2input_intf_config (vnet_buffer (b[0])->sw_if_index[VLIB_TX]);
528 next_index = (l2_input_is_bridge (config) ?
529 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
530 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
531 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
532 new_rx_sw_if_index = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
/* Quad loop: handle four buffers per iteration. */
534 while (n_left_from >= 4)
536 u32 sw_if_index0, sw_if_index1, sw_if_index2, sw_if_index3;
539 /* Prefetch next iteration. */
540 if (PREDICT_TRUE (n_left_from >= 8))
542 vlib_prefetch_buffer_header (b[4], STORE);
543 vlib_prefetch_buffer_header (b[5], STORE);
544 vlib_prefetch_buffer_header (b[6], STORE);
545 vlib_prefetch_buffer_header (b[7], STORE);
548 /* Make sure all pkts were transmitted on the same (loop) intfc */
549 sw_if_index0 = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
550 sw_if_index1 = vnet_buffer (b[1])->sw_if_index[VLIB_TX];
551 sw_if_index2 = vnet_buffer (b[2])->sw_if_index[VLIB_TX];
552 sw_if_index3 = vnet_buffer (b[3])->sw_if_index[VLIB_TX];
554 xor_ifx4 = u32x4_gather (&sw_if_index0, &sw_if_index1, &sw_if_index2,
557 /* Speed path / expected case: all pkts on the same intfc */
558 if (PREDICT_TRUE (u32x4_is_all_equal (xor_ifx4, new_rx_sw_if_index)))
560 next[0] = next_index;
561 next[1] = next_index;
562 next[2] = next_index;
563 next[3] = next_index;
564 vnet_buffer (b[0])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
565 vnet_buffer (b[1])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
566 vnet_buffer (b[2])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
567 vnet_buffer (b[3])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
568 vnet_buffer (b[0])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
569 vnet_buffer (b[1])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
570 vnet_buffer (b[2])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
571 vnet_buffer (b[3])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
/* Byte total of all four packets for a single counter update. */
572 n_bytes = vlib_buffer_length_in_chain (vm, b[0]);
573 n_bytes += vlib_buffer_length_in_chain (vm, b[1]);
574 n_bytes += vlib_buffer_length_in_chain (vm, b[2]);
575 n_bytes += vlib_buffer_length_in_chain (vm, b[3]);
577 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
579 vnet_update_l2_len (b[0]);
580 vnet_update_l2_len (b[1]);
581 vnet_update_l2_len (b[2]);
582 vnet_update_l2_len (b[3]);
585 /* increment TX interface stat */
586 vlib_increment_combined_counter (im->combined_sw_if_counters +
587 VNET_INTERFACE_COUNTER_TX,
588 thread_index, new_rx_sw_if_index,
589 4 /* pkts */ , n_bytes);
597 * Slow path: we know that at least one of the pkts
598 * was transmitted on a different sw_if_index, so
599 * check each sw_if_index against the cached data and proceed
602 * This shouldn't happen, but code can (and does) bypass the
603 * per-interface output node, so deal with it.
/* Buffer 0 of the quad: refresh the cached config if its interface changed. */
605 if (PREDICT_FALSE (vnet_buffer (b[0])->sw_if_index[VLIB_TX]
606 != new_rx_sw_if_index))
608 config = l2input_intf_config
609 (vnet_buffer (b[0])->sw_if_index[VLIB_TX]);
610 next_index = (l2_input_is_bridge (config) ?
611 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
612 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
613 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
614 new_rx_sw_if_index = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
616 next[0] = next_index;
617 vnet_buffer (b[0])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
618 vnet_buffer (b[0])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
619 n_bytes = vlib_buffer_length_in_chain (vm, b[0]);
620 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
621 vnet_update_l2_len (b[0]);
623 vlib_increment_combined_counter (im->combined_sw_if_counters +
624 VNET_INTERFACE_COUNTER_TX,
625 thread_index, new_rx_sw_if_index,
626 1 /* pkts */ , n_bytes);
/* Buffer 1 of the quad. */
628 if (PREDICT_FALSE (vnet_buffer (b[1])->sw_if_index[VLIB_TX]
629 != new_rx_sw_if_index))
631 config = l2input_intf_config
632 (vnet_buffer (b[1])->sw_if_index[VLIB_TX]);
633 next_index = (l2_input_is_bridge (config) ?
634 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
635 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
636 new_rx_sw_if_index = vnet_buffer (b[1])->sw_if_index[VLIB_TX];
637 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
639 next[1] = next_index;
640 vnet_buffer (b[1])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
641 vnet_buffer (b[1])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
642 n_bytes = vlib_buffer_length_in_chain (vm, b[1]);
643 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
644 vnet_update_l2_len (b[1]);
646 vlib_increment_combined_counter (im->combined_sw_if_counters +
647 VNET_INTERFACE_COUNTER_TX,
648 thread_index, new_rx_sw_if_index,
649 1 /* pkts */ , n_bytes);
/* Buffer 2 of the quad. */
651 if (PREDICT_FALSE (vnet_buffer (b[2])->sw_if_index[VLIB_TX]
652 != new_rx_sw_if_index))
654 config = l2input_intf_config
655 (vnet_buffer (b[2])->sw_if_index[VLIB_TX]);
656 next_index = (l2_input_is_bridge (config) ?
657 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
658 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
659 new_rx_sw_if_index = vnet_buffer (b[2])->sw_if_index[VLIB_TX];
660 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
662 next[2] = next_index;
663 vnet_buffer (b[2])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
664 vnet_buffer (b[2])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
665 n_bytes = vlib_buffer_length_in_chain (vm, b[2]);
666 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
667 vnet_update_l2_len (b[2]);
669 vlib_increment_combined_counter (im->combined_sw_if_counters +
670 VNET_INTERFACE_COUNTER_TX,
671 thread_index, new_rx_sw_if_index,
672 1 /* pkts */ , n_bytes);
/* Buffer 3 of the quad. */
674 if (PREDICT_FALSE (vnet_buffer (b[3])->sw_if_index[VLIB_TX]
675 != new_rx_sw_if_index))
677 config = l2input_intf_config
678 (vnet_buffer (b[3])->sw_if_index[VLIB_TX]);
679 next_index = (l2_input_is_bridge (config) ?
680 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
681 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
682 new_rx_sw_if_index = vnet_buffer (b[3])->sw_if_index[VLIB_TX];
683 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
685 next[3] = next_index;
686 vnet_buffer (b[3])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
687 vnet_buffer (b[3])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
688 n_bytes = vlib_buffer_length_in_chain (vm, b[3]);
689 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
690 vnet_update_l2_len (b[3]);
692 vlib_increment_combined_counter (im->combined_sw_if_counters +
693 VNET_INTERFACE_COUNTER_TX,
694 thread_index, new_rx_sw_if_index,
695 1 /* pkts */ , n_bytes);
/* Tail loop: remaining buffers one at a time, same per-buffer steps. */
700 while (n_left_from > 0)
702 if (PREDICT_FALSE (vnet_buffer (b[0])->sw_if_index[VLIB_TX]
703 != new_rx_sw_if_index))
705 config = l2input_intf_config
706 (vnet_buffer (b[0])->sw_if_index[VLIB_TX]);
707 next_index = (l2_input_is_bridge (config) ?
708 VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT :
709 VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
710 new_tx_sw_if_index = l2_input_is_bvi (config) ? L2INPUT_BVI : ~0;
711 new_rx_sw_if_index = vnet_buffer (b[0])->sw_if_index[VLIB_TX];
713 next[0] = next_index;
714 vnet_buffer (b[0])->sw_if_index[VLIB_RX] = new_rx_sw_if_index;
715 vnet_buffer (b[0])->sw_if_index[VLIB_TX] = new_tx_sw_if_index;
716 n_bytes = vlib_buffer_length_in_chain (vm, b[0]);
717 if (next_index == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT)
718 vnet_update_l2_len (b[0]);
720 vlib_increment_combined_counter (im->combined_sw_if_counters +
721 VNET_INTERFACE_COUNTER_TX,
722 thread_index, new_rx_sw_if_index,
723 1 /* pkts */ , n_bytes);
/* Hand every buffer to the next node chosen for it in nexts[]. */
729 vlib_buffer_enqueue_to_next (vm, node, from, nexts, frame->n_vectors);
731 return frame->n_vectors;
/*
 * Format callback for the device name: appends "loop<dev_instance>" to
 * 's', where dev_instance is the u32 taken from the va_list.
 */
735 format_simulated_ethernet_name (u8 * s, va_list * args)
737 u32 dev_instance = va_arg (*args, u32);
738 return format (s, "loop%d", dev_instance);
/*
 * Admin up/down handler for simulated ethernet interfaces: the link state
 * mirrors the admin state, so LINK_UP is set exactly when ADMIN_UP is
 * present in 'flags'.
 */
741 static clib_error_t *
742 simulated_ethernet_admin_up_down (vnet_main_t * vnm, u32 hw_if_index,
745 u32 hw_flags = (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) ?
746 VNET_HW_INTERFACE_FLAG_LINK_UP : 0;
747 vnet_hw_interface_set_flags (vnm, hw_if_index, hw_flags);
/*
 * Device-class MAC change handler for simulated ethernet interfaces:
 * passes the old and new MAC of hi->sw_if_index on to
 * l2input_interface_mac_change().
 */
751 static clib_error_t *
752 simulated_ethernet_mac_change (vnet_hw_interface_t * hi,
753 const u8 * old_address, const u8 * mac_address)
755 l2input_interface_mac_change (hi->sw_if_index, old_address, mac_address);
/*
 * Device class for simulated (loopback) ethernet interfaces: supplies the
 * device name formatter, the TX function and the admin and MAC-change
 * handlers defined in this file.
 */
761 VNET_DEVICE_CLASS (ethernet_simulated_device_class) = {
763 .format_device_name = format_simulated_ethernet_name,
764 .tx_function = simulated_ethernet_interface_tx,
765 .admin_up_down_function = simulated_ethernet_admin_up_down,
766 .mac_addr_change_function = simulated_ethernet_mac_change,
770 * Maintain a bitmap of allocated loopback instance numbers.
/* Exclusive upper bound on loopback instance numbers (valid: 0 .. 16383). */
772 #define LOOPBACK_MAX_INSTANCE (16 * 1024)
/*
 * Allocate a loopback instance number from em->bm_loopback_instances.
 *
 * Two paths are visible: a dynamic one that takes the first clear bit of
 * the bitmap, and a specific one that uses 'want' after checking that it
 * is below LOOPBACK_MAX_INSTANCE and not already set in the bitmap.
 * NOTE(review): the condition selecting between the paths (presumably
 * is_specified) and the failure return values are not visible here.
 */
775 loopback_instance_alloc (u8 is_specified, u32 want)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
777 ethernet_main_t *em = &ethernet_main;
780 * Check for dynamically allocated instance number.
786 bit = clib_bitmap_first_clear (em->bm_loopback_instances);
787 if (bit >= LOOPBACK_MAX_INSTANCE)
791 em->bm_loopback_instances = clib_bitmap_set (em->bm_loopback_instances,
799 if (want >= LOOPBACK_MAX_INSTANCE)
807 if (clib_bitmap_get (em->bm_loopback_instances, want))
813 * Grant allocation request.
815 em->bm_loopback_instances = clib_bitmap_set (em->bm_loopback_instances,
/*
 * Release a loopback instance number in em->bm_loopback_instances.
 *
 * The instance is checked against LOOPBACK_MAX_INSTANCE and against the
 * bitmap (it must currently be set) before the bitmap is updated.
 * NOTE(review): the return values are not visible here; the caller
 * vnet_delete_loopback_interface() treats a negative result as failure.
 */
822 loopback_instance_free (u32 instance)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
824 ethernet_main_t *em = &ethernet_main;
826 if (instance >= LOOPBACK_MAX_INSTANCE)
831 if (clib_bitmap_get (em->bm_loopback_instances, instance) == 0)
836 em->bm_loopback_instances = clib_bitmap_set (em->bm_loopback_instances,
/*
 * Create a loopback interface and return its sw_if_index via
 * *sw_if_indexp (preset to ~0 before any work is done).
 *
 * A loopback instance number is allocated (dynamic, or user_instance
 * when is_specified is set), the MAC is taken from mac_address when that
 * is non-zero, the interface is registered with the simulated ethernet
 * device class, and the "ethernet-input" and "l2-input" next nodes are
 * added to its TX node at fixed slots. Flooding to the new interface is
 * disabled by default.
 *
 * Returns VNET_API_ERROR_INVALID_REGISTRATION on the visible failure path.
 */
842 vnet_create_loopback_interface (u32 * sw_if_indexp, u8 * mac_address,
843 u8 is_specified, u32 user_instance)
845 vnet_main_t *vnm = vnet_get_main ();
846 vlib_main_t *vm = vlib_get_main ();
850 vnet_hw_interface_t *hw_if;
853 ASSERT (sw_if_indexp);
855 *sw_if_indexp = (u32) ~ 0;
857 clib_memset (address, 0, sizeof (address));
860 * Allocate a loopback instance. Either select on dynamically
861 * or try to use the desired user_instance number.
863 instance = loopback_instance_alloc (is_specified, user_instance);
866 return VNET_API_ERROR_INVALID_REGISTRATION;
870 * Default MAC address (dead:0000:0000 + instance) is allocated
871 * if zero mac_address is configured. Otherwise, user-configurable MAC
872 * address is programmed on the loopback interface.
/* 'address' is still all-zero here, so memcmp != 0 means a MAC was supplied. */
874 if (memcmp (address, mac_address, sizeof (address)))
875 clib_memcpy (address, mac_address, sizeof (address));
/* NOTE(review): address[5] is a u8, so only the low 8 bits of instance are kept. */
880 address[5] = instance;
883 vnet_eth_interface_registration_t eir = {};
884 eir.dev_class_index = ethernet_simulated_device_class.index;
885 eir.dev_instance = instance;
886 eir.address = address;
887 hw_if_index = vnet_eth_register_interface (vnm, &eir);
888 hw_if = vnet_get_hw_interface (vnm, hw_if_index);
/* The TX function indexes next nodes by these enum values, so slots must match. */
889 slot = vlib_node_add_named_next_with_slot
890 (vm, hw_if->tx_node_index,
891 "ethernet-input", VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
892 ASSERT (slot == VNET_SIMULATED_ETHERNET_TX_NEXT_ETHERNET_INPUT);
894 slot = vlib_node_add_named_next_with_slot
895 (vm, hw_if->tx_node_index,
896 "l2-input", VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT);
897 ASSERT (slot == VNET_SIMULATED_ETHERNET_TX_NEXT_L2_INPUT);
900 vnet_sw_interface_t *si = vnet_get_hw_sw_interface (vnm, hw_if_index);
901 *sw_if_indexp = si->sw_if_index;
903 /* By default don't flood to loopbacks, as packets just keep
904 * coming back ... If this loopback becomes a BVI, we'll change it */
905 si->flood_class = VNET_FLOOD_CLASS_NO_FLOOD;
/*
 * CLI handler that creates a loopback interface.
 *
 * Accepts optional "mac <addr>" and "instance <n>" arguments, calls
 * vnet_create_loopback_interface() and prints the name of the new
 * interface. Returns a CLI error if creation fails.
 */
911 static clib_error_t *
912 create_simulated_ethernet_interfaces (vlib_main_t * vm,
913 unformat_input_t * input,
914 vlib_cli_command_t * cmd)
920 u32 user_instance = 0;
/* An all-zero MAC tells the create function to pick the default address. */
922 clib_memset (mac_address, 0, sizeof (mac_address));
924 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
926 if (unformat (input, "mac %U", unformat_ethernet_address, mac_address))
928 if (unformat (input, "instance %d", &user_instance))
934 rv = vnet_create_loopback_interface (&sw_if_index, mac_address,
935 is_specified, user_instance);
938 return clib_error_return (0, "vnet_create_loopback_interface failed");
940 vlib_cli_output (vm, "%U\n", format_vnet_sw_if_index_name, vnet_get_main (),
946 * Create a loopback interface. Optionally, a MAC Address can be
947 * provided. If not provided, de:ad:00:00:00:<loopId> will be used.
950 * The following two command syntaxes are equivalent:
951 * @cliexcmd{loopback create-interface [mac <mac-addr>] [instance <instance>]}
952 * @cliexcmd{create loopback interface [mac <mac-addr>] [instance <instance>]}
953 * Example of how to create a loopback interface:
954 * @cliexcmd{loopback create-interface}
/* Registers "loopback create-interface", handled by create_simulated_ethernet_interfaces. */
956 VLIB_CLI_COMMAND (create_simulated_ethernet_interface_command, static) = {
957 .path = "loopback create-interface",
958 .short_help = "loopback create-interface [mac <mac-addr>] [instance <instance>]",
959 .function = create_simulated_ethernet_interfaces,
963 * Create a loopback interface. Optionally, a MAC Address can be
964 * provided. If not provided, de:ad:00:00:00:<loopId> will be used.
967 * The following two command syntaxes are equivalent:
968 * @cliexcmd{loopback create-interface [mac <mac-addr>] [instance <instance>]}
969 * @cliexcmd{create loopback interface [mac <mac-addr>] [instance <instance>]}
970 * Example of how to create a loopback interface:
971 * @cliexcmd{create loopback interface}
/* Registers "create loopback interface", an alias sharing the same handler. */
973 VLIB_CLI_COMMAND (create_loopback_interface_command, static) = {
974 .path = "create loopback interface",
975 .short_help = "create loopback interface [mac <mac-addr>] [instance <instance>]",
976 .function = create_simulated_ethernet_interfaces,
/*
 * Return the ethernet_interface_t for hw_if_index, or 0 when the hardware
 * interface does not belong to the ethernet hw interface class.
 */
979 ethernet_interface_t *
980 ethernet_get_interface (ethernet_main_t * em, u32 hw_if_index)
982 vnet_hw_interface_t *i =
983 vnet_get_hw_interface (vnet_get_main (), hw_if_index);
984 return (i->hw_class_index ==
985 ethernet_hw_interface_class.
986 index ? pool_elt_at_index (em->interfaces, i->hw_instance) : 0);
/*
 * Add or delete a secondary MAC address on the ethernet interface behind
 * hw_if_index.
 *
 * The interface's secondary_addrs vector is searched for 'address'. On
 * the add path a new entry is appended and a pointer to its MAC is
 * returned; on the delete path the matching entry is removed.
 * NOTE(review): the add/delete selector parameter and the remaining
 * return statements are not visible here.
 */
990 ethernet_interface_add_del_address (ethernet_main_t * em,
991 u32 hw_if_index, const u8 * address,
994 ethernet_interface_t *ei = ethernet_get_interface (em, hw_if_index);
995 ethernet_interface_address_t *if_addr = 0;
998 /* return if there is not an ethernet interface for this hw interface */
1002 /* determine whether the address is configured on the interface */
1003 vec_foreach (if_addr, ei->secondary_addrs)
1005 if (ethernet_mac_address_equal (if_addr->mac.bytes, address))
1016 /* address not found yet: add it */
1017 vec_add2 (ei->secondary_addrs, if_addr, 1);
1018 ethernet_interface_address_copy (if_addr, address);
1020 return &if_addr->mac;
/* Remove the single matching element at its index in the vector. */
1025 vec_delete (ei->secondary_addrs, 1, if_addr - ei->secondary_addrs);
/*
 * Delete the loopback interface identified by sw_if_index.
 *
 * Returns VNET_API_ERROR_INVALID_SW_IF_INDEX when the index is free, when
 * the interface is not backed by the simulated ethernet device class, or
 * when its instance number cannot be released. Otherwise the instance is
 * freed and the ethernet interface is deleted.
 */
1031 vnet_delete_loopback_interface (u32 sw_if_index)
1033 vnet_main_t *vnm = vnet_get_main ();
1035 if (pool_is_free_index (vnm->interface_main.sw_interfaces, sw_if_index))
1036 return VNET_API_ERROR_INVALID_SW_IF_INDEX;
/* Only interfaces created by the simulated (loopback) device class qualify. */
1038 vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1039 if (hw == 0 || hw->dev_class_index != ethernet_simulated_device_class.index)
1040 return VNET_API_ERROR_INVALID_SW_IF_INDEX;
1042 if (loopback_instance_free (hw->dev_instance) < 0)
1043 return VNET_API_ERROR_INVALID_SW_IF_INDEX;
1045 ethernet_delete_interface (vnm, hw->hw_if_index);
/*
 * Create a sub-interface with the given id on super interface
 * sw_if_index and return its index via *sub_sw_if_index.
 *
 * The pair (sw_if_index, id) is packed into a 64-bit key and looked up
 * first; the visible duplicate path returns
 * VNET_API_ERROR_VLAN_ALREADY_EXISTS. Failure to create the software
 * interface returns VNET_API_ERROR_UNSPECIFIED. On success the new
 * interface is recorded in both the per-hardware-interface id hash and
 * the global (sup, sub) hash.
 */
1051 vnet_create_sub_interface (u32 sw_if_index, u32 id,
1052 u32 flags, u16 inner_vlan_id, u16 outer_vlan_id,
1053 u32 * sub_sw_if_index)
1055 vnet_main_t *vnm = vnet_get_main ();
1056 vnet_interface_main_t *im = &vnm->interface_main;
1057 vnet_hw_interface_t *hi;
/* Key layout: super sw_if_index in the high 32 bits, sub id in the low 32. */
1058 u64 sup_and_sub_key = ((u64) (sw_if_index) << 32) | (u64) id;
1059 vnet_sw_interface_t template;
1063 hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1065 p = hash_get_mem (im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
1068 return (VNET_API_ERROR_VLAN_ALREADY_EXISTS);
1071 clib_memset (&template, 0, sizeof (template));
1072 template.type = VNET_SW_INTERFACE_TYPE_SUB;
1073 template.flood_class = VNET_FLOOD_CLASS_NORMAL;
1074 template.sup_sw_if_index = sw_if_index;
1075 template.sub.id = id;
1076 template.sub.eth.raw_flags = flags;
1077 template.sub.eth.outer_vlan_id = outer_vlan_id;
1078 template.sub.eth.inner_vlan_id = inner_vlan_id;
1080 if (vnet_create_sw_interface (vnm, &template, sub_sw_if_index))
1081 return (VNET_API_ERROR_UNSPECIFIED);
/* The mem-keyed hash stores a pointer to the key, so the key is heap-allocated. */
1083 kp = clib_mem_alloc (sizeof (*kp));
1084 *kp = sup_and_sub_key;
1086 hash_set (hi->sub_interface_sw_if_index_by_id, id, *sub_sw_if_index);
1087 hash_set_mem (im->sw_if_index_by_sup_and_sub, kp, *sub_sw_if_index);
/*
 * Delete the sub-interface identified by sw_if_index.
 *
 * Returns VNET_API_ERROR_INVALID_SW_IF_INDEX for a free index. For
 * SUB, PIPE and P2P interfaces both hash entries that reference the
 * interface are removed and the software interface is deleted; any other
 * type yields VNET_API_ERROR_INVALID_SUB_SW_IF_INDEX.
 */
1093 vnet_delete_sub_interface (u32 sw_if_index)
1095 vnet_main_t *vnm = vnet_get_main ();
1096 vnet_sw_interface_t *si;
1099 if (pool_is_free_index (vnm->interface_main.sw_interfaces, sw_if_index))
1100 return VNET_API_ERROR_INVALID_SW_IF_INDEX;
1102 si = vnet_get_sw_interface (vnm, sw_if_index);
1103 if (si->type == VNET_SW_INTERFACE_TYPE_SUB ||
1104 si->type == VNET_SW_INTERFACE_TYPE_PIPE ||
1105 si->type == VNET_SW_INTERFACE_TYPE_P2P)
1107 vnet_interface_main_t *im = &vnm->interface_main;
1108 vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
/* Rebuild the same (sup << 32 | id) key used when the entry was created. */
1109 u64 sup_and_sub_key =
1110 ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
1111 hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
1112 hash_unset (hi->sub_interface_sw_if_index_by_id, si->sub.id);
1113 vnet_delete_sw_interface (vnm, sw_if_index);
1116 rv = VNET_API_ERROR_INVALID_SUB_SW_IF_INDEX;
/*
 * CLI handler that deletes a loopback interface given as
 * "intfc <interface>". Reports an error when no interface was supplied
 * or when vnet_delete_loopback_interface() fails.
 */
1121 static clib_error_t *
1122 delete_simulated_ethernet_interfaces (vlib_main_t * vm,
1123 unformat_input_t * input,
1124 vlib_cli_command_t * cmd)
1127 u32 sw_if_index = ~0;
1128 vnet_main_t *vnm = vnet_get_main ();
1130 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1132 if (unformat (input, "intfc %U",
1133 unformat_vnet_sw_interface, vnm, &sw_if_index))
/* ~0 is the initial value, i.e. nothing was parsed. */
1139 if (sw_if_index == ~0)
1140 return clib_error_return (0, "interface not specified");
1142 rv = vnet_delete_loopback_interface (sw_if_index);
1145 return clib_error_return (0, "vnet_delete_loopback_interface failed");
/*
 * CLI handler that deletes the sub-interface named on the command line.
 * Reports an error when no interface was parsed or when the deletion
 * fails.
 */
1150 static clib_error_t *
1151 delete_sub_interface (vlib_main_t * vm,
1152 unformat_input_t * input, vlib_cli_command_t * cmd)
1155 u32 sw_if_index = ~0;
1156 vnet_main_t *vnm = vnet_get_main ();
1158 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1161 (input, "%U", unformat_vnet_sw_interface, vnm, &sw_if_index))
/* ~0 is the initial value, i.e. nothing was parsed. */
1166 if (sw_if_index == ~0)
1167 return clib_error_return (0, "interface doesn't exist");
1169 if (pool_is_free_index (vnm->interface_main.sw_interfaces, sw_if_index))
1170 rv = VNET_API_ERROR_INVALID_SW_IF_INDEX;
1172 rv = vnet_delete_sub_interface (sw_if_index);
1174 return clib_error_return (0, "delete_subinterface_interface failed");
1179 * Delete a loopback interface.
1182 * The following two command syntaxes are equivalent:
1183 * @cliexcmd{loopback delete-interface intfc <interface>}
1184 * @cliexcmd{delete loopback interface intfc <interface>}
1185 * Example of how to delete a loopback interface:
1186 * @cliexcmd{loopback delete-interface intfc loop0}
/* Registers "loopback delete-interface", handled by delete_simulated_ethernet_interfaces. */
1188 VLIB_CLI_COMMAND (delete_simulated_ethernet_interface_command, static) = {
1189 .path = "loopback delete-interface",
1190 .short_help = "loopback delete-interface intfc <interface>",
1191 .function = delete_simulated_ethernet_interfaces,
1195 * Delete a loopback interface.
1198 * The following two command syntaxes are equivalent:
1199 * @cliexcmd{loopback delete-interface intfc <interface>}
1200 * @cliexcmd{delete loopback interface intfc <interface>}
1201 * Example of how to delete a loopback interface:
1202 * @cliexcmd{delete loopback interface intfc loop0}
/* Registers "delete loopback interface", an alias sharing the same handler. */
1204 VLIB_CLI_COMMAND (delete_loopback_interface_command, static) = {
1205 .path = "delete loopback interface",
1206 .short_help = "delete loopback interface intfc <interface>",
1207 .function = delete_simulated_ethernet_interfaces,
1211 * Delete a sub-interface.
1214 * Example of how to delete a sub-interface:
1215 * @cliexcmd{delete sub-interface GigabitEthernet0/8/0.200}
/* Registers "delete sub-interface", handled by delete_sub_interface. */
1217 VLIB_CLI_COMMAND (delete_sub_interface_command, static) = {
1218 .path = "delete sub-interface",
1219 .short_help = "delete sub-interface <interface>",
1220 .function = delete_sub_interface,
1223 /* ethernet { ... } configuration. */
1226 * @cfgcmd{default-mtu <n>}
1227 * Specify the default mtu in the range of 64-9000. The default is 9000 bytes.
/*
 * Startup configuration handler for the ethernet section.
 *
 * Recognises "default-mtu <n>", which is parsed straight into
 * em->default_mtu and must lie in the range 64..9000; any other input is
 * reported as an error.
 */
1230 static clib_error_t *
1231 ethernet_config (vlib_main_t * vm, unformat_input_t * input)
/* Fixed: '&eth' had been decoded as an HTML entity, leaving 'ðernet_main'. */
1233 ethernet_main_t *em = &ethernet_main;
1235 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1237 if (unformat (input, "default-mtu %u", &em->default_mtu))
/* NOTE(review): an out-of-range value has already been stored at this point. */
1239 if (em->default_mtu < 64 || em->default_mtu > 9000)
1240 return clib_error_return (0, "default MTU must be >=64, <=9000");
1244 return clib_error_return (0, "unknown input '%U'",
1245 format_unformat_error, input);
/* Registers ethernet_config as the handler for the "ethernet" configuration section. */
1251 VLIB_CONFIG_FUNCTION (ethernet_config, "ethernet");
1254 * fd.io coding-style-patch-verification: ON
1257 * eval: (c-set-style "gnu")