2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 * ethernet.h: types/functions for ethernet.
18 * Copyright (c) 2008 Eliot Dresselhaus
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
40 #ifndef included_ethernet_h
41 #define included_ethernet_h
43 #include <vnet/vnet.h>
44 #include <vnet/ethernet/packet.h>
45 #include <vnet/pg/pg.h>
48 ethernet_mac_address_u64 (u8 * a)
49 { return (((u64) a[0] << (u64) (5*8))
50 | ((u64) a[1] << (u64) (4*8))
51 | ((u64) a[2] << (u64) (3*8))
52 | ((u64) a[3] << (u64) (2*8))
53 | ((u64) a[4] << (u64) (1*8))
54 | ((u64) a[5] << (u64) (0*8))); }
56 static inline int ethernet_mac_address_is_multicast_u64 (u64 a)
58 return (a & (1ULL<<(5*8))) != 0;
61 /* Max. sized ethernet/vlan header for parsing. */
63 ethernet_header_t ethernet;
65 /* Allow up to 2 stacked vlan headers. */
66 ethernet_vlan_header_t vlan[2];
67 } ethernet_max_header_t;
69 struct vnet_hw_interface_t;
70 /* Ethernet flag change callback. */
71 typedef u32 (ethernet_flag_change_function_t)
72 (vnet_main_t * vnm, struct vnet_hw_interface_t * hi, u32 flags);
74 #define ETHERNET_MIN_PACKET_BYTES 64
75 #define ETHERNET_MAX_PACKET_BYTES 9216
77 /* Ethernet interface instance. */
78 typedef struct ethernet_interface {
80 /* Accept all packets (promiscuous mode). */
81 #define ETHERNET_INTERFACE_FLAG_ACCEPT_ALL (1 << 0)
82 #define ETHERNET_INTERFACE_FLAG_CONFIG_PROMISC(flags) \
83 (((flags) & ~ETHERNET_INTERFACE_FLAG_ACCEPT_ALL) == 0)
85 /* Change MTU on interface from hw interface structure */
86 #define ETHERNET_INTERFACE_FLAG_MTU (1 << 1)
87 #define ETHERNET_INTERFACE_FLAG_CONFIG_MTU(flags) \
88 ((flags) & ETHERNET_INTERFACE_FLAG_MTU)
90 /* Callback, e.g. to turn on/off promiscuous mode */
91 ethernet_flag_change_function_t * flag_change;
95 /* Ethernet (MAC) address for this interface. */
97 } ethernet_interface_t;
99 vnet_hw_interface_class_t ethernet_hw_interface_class;
102 /* Name (a c string). */
105 /* Ethernet type in host byte order. */
106 ethernet_type_t type;
108 /* Node which handles this type. */
111 /* Next index for this type. */
113 } ethernet_type_info_t;
116 #define ethernet_error(n,c,s) ETHERNET_ERROR_##n,
117 #include <vnet/ethernet/error.def>
118 #undef ethernet_error
123 // Structs used when parsing packet to find sw_if_index
128 // config entry is-valid flag
129 // exact match flags (valid if packet has 0/1/2/3 tags)
130 // L2 vs L3 forwarding mode
131 #define SUBINT_CONFIG_MATCH_0_TAG (1<<0)
132 #define SUBINT_CONFIG_MATCH_1_TAG (1<<1)
133 #define SUBINT_CONFIG_MATCH_2_TAG (1<<2)
134 #define SUBINT_CONFIG_MATCH_3_TAG (1<<3)
135 #define SUBINT_CONFIG_VALID (1<<4)
136 #define SUBINT_CONFIG_L2 (1<<5)
141 eth_create_valid_subint_match_flags (u32 num_tags) {
142 return SUBINT_CONFIG_VALID | (1 << num_tags);
147 subint_config_t untagged_subint;
148 subint_config_t default_subint;
149 u16 dot1q_vlans; // pool id for vlan table
150 u16 dot1ad_vlans; // pool id for vlan table
154 subint_config_t single_tag_subint;
155 subint_config_t inner_any_subint;
156 u32 qinqs; // pool id for qinq table
160 vlan_intf_t vlans[ETHERNET_N_VLAN];
164 subint_config_t subint;
168 qinq_intf_t vlans[ETHERNET_N_VLAN];
171 // Structure mapping to a next index based on ethertype.
172 // Common ethertypes are stored explicitly, others are
173 // stored in a sparse table.
175 /* Sparse vector mapping ethernet type in network byte order to next index. */
177 u16 * input_next_by_type;
178 u32 * sparse_index_by_input_next_index;
180 /* cached next indexes for common ethertypes */
184 } next_by_ethertype_t;
188 vlib_main_t * vlib_main;
190 /* next node index for the L3 input node of each ethertype */
191 next_by_ethertype_t l3_next;
193 /* next node index for L2 interfaces */
196 /* flag and next node index for L3 redirect */
198 u32 redirect_l3_next;
200 /* Pool of ethernet interface instances. */
201 ethernet_interface_t * interfaces;
203 ethernet_type_info_t * type_infos;
205 /* Hash tables mapping name/type to type info index. */
206 uword * type_info_by_name, * type_info_by_type;
208 // The root of the vlan parsing tables. A vector with one element
209 // for each main interface, indexed by hw_if_index.
210 main_intf_t * main_intfs;
212 // Pool of vlan tables
213 vlan_table_t * vlan_pool;
215 // Pool of qinq tables
216 qinq_table_t * qinq_pool;
218 /* Set to one to use AB.CD.EF instead of A:B:C:D:E:F as ethernet format. */
219 int format_ethernet_address_16bit;
223 ethernet_main_t ethernet_main;
225 always_inline ethernet_type_info_t *
226 ethernet_get_type_info (ethernet_main_t * em, ethernet_type_t type)
228 uword * p = hash_get (em->type_info_by_type, type);
229 return p ? vec_elt_at_index (em->type_infos, p[0]) : 0;
232 ethernet_interface_t *
233 ethernet_get_interface (ethernet_main_t * em, u32 hw_if_index);
236 ethernet_register_interface (vnet_main_t * vnm,
240 u32 * hw_if_index_return,
241 ethernet_flag_change_function_t flag_change);
243 void ethernet_delete_interface (vnet_main_t * vnm, u32 hw_if_index);
245 /* Register given node index to take input for given ethernet type. */
247 ethernet_register_input_type (vlib_main_t * vm,
248 ethernet_type_t type,
251 /* Register given node index to take input for packet from L2 interfaces. */
253 ethernet_register_l2_input (vlib_main_t * vm,
256 /* Register given node index to take redirected L3 traffic, and enable L3 redirect */
258 ethernet_register_l3_redirect (vlib_main_t * vm,
261 /* Formats ethernet address X:X:X:X:X:X */
262 u8 * format_ethernet_address (u8 * s, va_list * args);
263 u8 * format_ethernet_type (u8 * s, va_list * args);
264 u8 * format_ethernet_header (u8 * s, va_list * args);
265 u8 * format_ethernet_header_with_length (u8 * s, va_list * args);
267 /* Parse ethernet address in either X:X:X:X:X:X unix or X.X.X cisco format. */
269 unformat_ethernet_address (unformat_input_t * input, va_list * args);
271 /* Parse ethernet type as 0xXXXX or type name from ethernet/types.def.
272 In either host or network byte order. */
274 unformat_ethernet_type_host_byte_order (unformat_input_t * input,
277 unformat_ethernet_type_net_byte_order (unformat_input_t * input,
280 /* Parse ethernet header. */
282 unformat_ethernet_header (unformat_input_t * input, va_list * args);
284 /* Parse ethernet interface name; return hw_if_index. */
285 uword unformat_ethernet_interface (unformat_input_t * input, va_list * args);
287 uword unformat_pg_ethernet_header (unformat_input_t * input, va_list * args);
290 ethernet_setup_node (vlib_main_t * vm, u32 node_index)
292 vlib_node_t * n = vlib_get_node (vm, node_index);
293 pg_node_t * pn = pg_get_node (node_index);
295 n->format_buffer = format_ethernet_header_with_length;
296 n->unformat_buffer = unformat_ethernet_header;
297 pn->unformat_edit = unformat_pg_ethernet_header;
300 always_inline ethernet_header_t *
301 ethernet_buffer_get_header (vlib_buffer_t * b)
305 + vnet_buffer (b)->ethernet.start_of_ethernet_header);
308 ethernet_main_t * ethernet_get_main (vlib_main_t * vm);
309 u32 ethernet_set_flags (vnet_main_t * vnm, u32 hw_if_index, u32 flags);
310 void ethernet_sw_interface_set_l2_mode (vnet_main_t * vnm, u32 sw_if_index, u32 l2);
311 void ethernet_set_rx_redirect (vnet_main_t * vnm, vnet_hw_interface_t * hi, u32 enable);
314 vnet_arp_set_ip4_over_ethernet (vnet_main_t * vnm,
321 vnet_arp_unset_ip4_over_ethernet (vnet_main_t * vnm,
322 u32 sw_if_index, u32 fib_index,
325 int vnet_proxy_arp_fib_reset (u32 fib_id);
327 clib_error_t * next_by_ethertype_init (next_by_ethertype_t * l3_next);
328 clib_error_t * next_by_ethertype_register (next_by_ethertype_t * l3_next,
332 int vnet_create_loopback_interface (u32 * sw_if_indexp, u8 *mac_address);
333 int vnet_delete_loopback_interface (u32 sw_if_index);
335 // Perform ethernet subinterface classification table lookups given
336 // the port's sw_if_index and fields extracted from the ethernet header.
337 // The resulting tables are used by identify_subint().
339 eth_vlan_table_lookups (ethernet_main_t *em,
341 u32 port_sw_if_index0,
345 vnet_hw_interface_t ** hi,
346 main_intf_t **main_intf,
347 vlan_intf_t **vlan_intf,
348 qinq_intf_t **qinq_intf)
350 vlan_table_t *vlan_table;
351 qinq_table_t *qinq_table;
354 // Read the main, vlan, and qinq interface table entries
355 // TODO: Consider if/how to prefetch tables. Also consider
356 // single-entry cache to skip table lookups and identify_subint()
358 *hi = vnet_get_sup_hw_interface (vnm, port_sw_if_index0);
359 *main_intf = vec_elt_at_index (em->main_intfs, (*hi)->hw_if_index);
361 // Always read the vlan and qinq tables, even if there are not that
362 // many tags on the packet. This makes the lookups and comparisons
363 // easier (and less branchy).
364 vlan_table_id = (first_ethertype == ETHERNET_TYPE_DOT1AD) ?
365 (*main_intf)->dot1ad_vlans :
366 (*main_intf)->dot1q_vlans;
367 vlan_table = vec_elt_at_index (em->vlan_pool, vlan_table_id);
368 *vlan_intf = &vlan_table->vlans[outer_id];
370 qinq_table = vec_elt_at_index (em->qinq_pool, (*vlan_intf)->qinqs);
371 *qinq_intf = &qinq_table->vlans[inner_id];
375 // Determine the subinterface for this packet, given the result of the
376 // vlan table lookups and vlan header parsing. Check the most specific matches first.
378 // Returns 1 if a matching subinterface was found, otherwise returns 0.
380 eth_identify_subint (vnet_hw_interface_t * hi,
383 main_intf_t * main_intf,
384 vlan_intf_t * vlan_intf,
385 qinq_intf_t * qinq_intf,
386 u32 * new_sw_if_index,
390 subint_config_t * subint;
392 // Each comparison is checking both the valid flag and the number of tags
393 // (incorporating exact-match/non-exact-match).
395 // check for specific double tag
396 subint = &qinq_intf->subint;
397 if ((subint->flags & match_flags) == match_flags) goto matched;
399 // check for specific outer and 'any' inner
400 subint = &vlan_intf->inner_any_subint;
401 if ((subint->flags & match_flags) == match_flags) goto matched;
403 // check for specific single tag
404 subint = &vlan_intf->single_tag_subint;
405 if ((subint->flags & match_flags) == match_flags) goto matched;
407 // check for untagged interface
408 subint = &main_intf->untagged_subint;
409 if ((subint->flags & match_flags) == match_flags) goto matched;
411 // check for default interface
412 subint = &main_intf->default_subint;
413 if ((subint->flags & match_flags) == match_flags) goto matched;
415 // No matching subinterface
416 *new_sw_if_index = ~0;
417 *error0 = ETHERNET_ERROR_UNKNOWN_VLAN;
422 *new_sw_if_index = subint->sw_if_index;
423 *is_l2 = subint->flags & SUBINT_CONFIG_L2;
427 always_inline ethernet_main_t *
428 vnet_get_ethernet_main (void)
430 return ðernet_main;
433 void vnet_register_ip4_arp_resolution_event (vnet_main_t * vnm,
440 int vnet_add_del_ip4_arp_change_event (vnet_main_t * vnm,
441 void * data_callback,
446 uword data, int is_add);
448 vlib_node_registration_t ethernet_input_node;
450 #endif /* included_ethernet_h */