interface: improve MTU handling
[vpp.git] / src / vnet / interface.h
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.h: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #ifndef included_vnet_interface_h
41 #define included_vnet_interface_h
42
43 #include <vlib/vlib.h>
44 #include <vppinfra/pcap.h>
45 #include <vnet/l3_types.h>
46 #include <vppinfra/lock.h>
47 #include <vnet/hash/hash.h>
48
49 struct vnet_main_t;
50 struct vnet_hw_interface_t;
51 struct vnet_sw_interface_t;
52 union ip46_address_t_;
53
/* Receive modes selectable for a hardware interface rx queue. */
typedef enum
{
  VNET_HW_IF_RX_MODE_UNKNOWN = 0,
  VNET_HW_IF_RX_MODE_POLLING,
  VNET_HW_IF_RX_MODE_INTERRUPT,
  VNET_HW_IF_RX_MODE_ADAPTIVE,
  VNET_HW_IF_RX_MODE_DEFAULT,
  /* Number of modes listed above; must stay last. */
  VNET_HW_IF_NUM_RX_MODES,
} vnet_hw_if_rx_mode;
63
64 /* Interface up/down callback. */
65 typedef clib_error_t *(vnet_interface_function_t)
66   (struct vnet_main_t * vnm, u32 if_index, u32 flags);
67
68 /* Sub-interface add/del callback. */
69 typedef clib_error_t *(vnet_subif_add_del_function_t)
70   (struct vnet_main_t * vnm, u32 if_index,
71    struct vnet_sw_interface_t * template, int is_add);
72
73 /* Interface set mtu callback. */
74 typedef clib_error_t *(vnet_interface_set_mtu_function_t) (
75   struct vnet_main_t *vnm, struct vnet_hw_interface_t *hi, u32 mtu);
76
77 /* Interface set mac address callback. */
78 typedef clib_error_t *(vnet_interface_set_mac_address_function_t)
79   (struct vnet_hw_interface_t * hi,
80    const u8 * old_address, const u8 * new_address);
81
82 /* Interface add/del additional mac address callback */
83 typedef clib_error_t *(vnet_interface_add_del_mac_address_function_t)
84   (struct vnet_hw_interface_t * hi, const u8 * address, u8 is_add);
85
86 /* Interface set rx mode callback. */
87 typedef clib_error_t *(vnet_interface_set_rx_mode_function_t)
88   (struct vnet_main_t * vnm, u32 if_index, u32 queue_id,
89    vnet_hw_if_rx_mode mode);
90
91 /* Interface set l2 mode callback. */
92 typedef clib_error_t *(vnet_interface_set_l2_mode_function_t)
93   (struct vnet_main_t * vnm, struct vnet_hw_interface_t * hi,
94    i32 l2_if_adjust);
95
96 /* Interface to set rss queues of the interface */
97 typedef clib_error_t *(vnet_interface_rss_queues_set_t)
98   (struct vnet_main_t * vnm, struct vnet_hw_interface_t * hi,
99    clib_bitmap_t * bitmap);
100
/* Operations a device can be asked to perform on an offloaded flow. */
typedef enum
{
  VNET_FLOW_DEV_OP_ADD_FLOW = 0,
  VNET_FLOW_DEV_OP_DEL_FLOW,
  VNET_FLOW_DEV_OP_GET_COUNTER,
  VNET_FLOW_DEV_OP_RESET_COUNTER,
} vnet_flow_dev_op_t;
108
109 /* Interface flow operations callback. */
110 typedef int (vnet_flow_dev_ops_function_t) (struct vnet_main_t * vnm,
111                                             vnet_flow_dev_op_t op,
112                                             u32 hw_if_index, u32 index,
113                                             uword * private_data);
114
/* Priority classes used to index the per-tag interface callback lists. */
typedef enum vnet_interface_function_priority_t_
{
  VNET_ITF_FUNC_PRIORITY_LOW = 0,
  VNET_ITF_FUNC_PRIORITY_HIGH,
} vnet_interface_function_priority_t;

/* Number of priority classes: one past the highest enumerator. */
#define VNET_ITF_FUNC_N_PRIO                                                  \
  ((vnet_interface_function_priority_t) VNET_ITF_FUNC_PRIORITY_HIGH + 1)
121
122 typedef struct _vnet_interface_function_list_elt
123 {
124   struct _vnet_interface_function_list_elt *next_interface_function;
125   clib_error_t *(*fp) (struct vnet_main_t * vnm, u32 if_index, u32 flags);
126 } _vnet_interface_function_list_elt_t;
127
#ifndef CLIB_MARCH_VARIANT
/*
 * Register callback f on the list vnm->tag##_functions[p].
 *
 * Expands to a constructor that pushes a function-static list element
 * holding f at the head of the list, and a destructor that unlinks the first
 * element whose fp equals f.  The destructor walks the list through a
 * pointer to the link being examined, so the head and interior cases share
 * one code path and an empty list (NULL head) is simply a no-op instead of a
 * NULL dereference.
 */
#define _VNET_INTERFACE_FUNCTION_DECL_PRIO(f, tag, p)                         \
                                                                              \
  static void __vnet_interface_function_init_##tag##_##f (void)               \
    __attribute__ ((__constructor__));                                        \
                                                                              \
  static void __vnet_interface_function_init_##tag##_##f (void)               \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    static _vnet_interface_function_list_elt_t init_function;                 \
    init_function.next_interface_function = vnm->tag##_functions[p];          \
    vnm->tag##_functions[p] = &init_function;                                 \
    init_function.fp = (void *) &f;                                           \
  }                                                                           \
                                                                              \
  static void __vnet_interface_function_deinit_##tag##_##f (void)             \
    __attribute__ ((__destructor__));                                         \
                                                                              \
  static void __vnet_interface_function_deinit_##tag##_##f (void)             \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    _vnet_interface_function_list_elt_t **link = &vnm->tag##_functions[p];    \
    for (; *link; link = &(*link)->next_interface_function)                   \
      {                                                                       \
        if ((*link)->fp == f)                                                 \
          {                                                                   \
            *link = (*link)->next_interface_function;                         \
            return;                                                           \
          }                                                                   \
      }                                                                       \
  }
#else
/* create unused pointer to silence compiler warnings and get whole
   function optimized out */
#define _VNET_INTERFACE_FUNCTION_DECL_PRIO(f, tag, p)                         \
  static __clib_unused void *__clib_unused_##f = f;
#endif
173
/* Register f on the tag callback list at the default (low) priority. */
#define _VNET_INTERFACE_FUNCTION_DECL(f, tag)                                 \
  _VNET_INTERFACE_FUNCTION_DECL_PRIO (f, tag, VNET_ITF_FUNC_PRIORITY_LOW)

/*
 * Public registration macros, one per callback list.  The _PRIO variants
 * take the priority p explicitly; the others register at low priority.
 */

/* Hardware interface callbacks. */
#define VNET_HW_INTERFACE_ADD_DEL_FUNCTION(f)                                 \
  _VNET_INTERFACE_FUNCTION_DECL (f, hw_interface_add_del)
#define VNET_HW_INTERFACE_LINK_UP_DOWN_FUNCTION(f)                            \
  _VNET_INTERFACE_FUNCTION_DECL (f, hw_interface_link_up_down)
#define VNET_HW_INTERFACE_LINK_UP_DOWN_FUNCTION_PRIO(f, p)                    \
  _VNET_INTERFACE_FUNCTION_DECL_PRIO (f, hw_interface_link_up_down, p)

/* Software interface callbacks. */
#define VNET_SW_INTERFACE_MTU_CHANGE_FUNCTION(f)                              \
  _VNET_INTERFACE_FUNCTION_DECL (f, sw_interface_mtu_change)
#define VNET_SW_INTERFACE_ADD_DEL_FUNCTION(f)                                 \
  _VNET_INTERFACE_FUNCTION_DECL (f, sw_interface_add_del)
#define VNET_SW_INTERFACE_ADD_DEL_FUNCTION_PRIO(f, p)                         \
  _VNET_INTERFACE_FUNCTION_DECL_PRIO (f, sw_interface_add_del, p)
#define VNET_SW_INTERFACE_ADMIN_UP_DOWN_FUNCTION(f)                           \
  _VNET_INTERFACE_FUNCTION_DECL (f, sw_interface_admin_up_down)
#define VNET_SW_INTERFACE_ADMIN_UP_DOWN_FUNCTION_PRIO(f, p)                   \
  _VNET_INTERFACE_FUNCTION_DECL_PRIO (f, sw_interface_admin_up_down, p)
193
194 /**
195  * Tunnel description parameters
196  */
197 typedef int (*vnet_dev_class_ip_tunnel_desc_t) (u32 sw_if_index,
198                                                 union ip46_address_t_ * src,
199                                                 union ip46_address_t_ * dst,
200                                                 u8 * is_l2);
201
202 /* A class of hardware interface devices. */
203 typedef struct _vnet_device_class
204 {
205   /* Index into main vector. */
206   u32 index;
207
208   /* Device name (e.g. "FOOBAR 1234a"). */
209   char *name;
210
211   /* Function to call when hardware interface is added/deleted. */
212   vnet_interface_function_t *interface_add_del_function;
213
214   /* Function to bring device administratively up/down. */
215   vnet_interface_function_t *admin_up_down_function;
216
217   /* Function to call when sub-interface is added/deleted */
218   vnet_subif_add_del_function_t *subif_add_del_function;
219
220   /* Function to call interface rx mode is changed */
221   vnet_interface_set_rx_mode_function_t *rx_mode_change_function;
222
223   /* Function to call interface l2 mode is changed */
224   vnet_interface_set_l2_mode_function_t *set_l2_mode_function;
225
226   /* Redistribute flag changes/existence of this interface class. */
227   u32 redistribute;
228
229   /* Transmit function. */
230   vlib_node_function_t *tx_function;
231
232   /* Transmit function candidate registration with priority */
233   vlib_node_fn_registration_t *tx_fn_registrations;
234
235   /* Error strings indexed by error code for this node. */
236   char **tx_function_error_strings;
237   vlib_error_desc_t *tx_function_error_counters;
238
239   /* Number of error codes used by this node. */
240   u32 tx_function_n_errors;
241
242   /* Renumber device name [only!] support, a control-plane kludge */
243   int (*name_renumber) (struct vnet_hw_interface_t * hi,
244                         u32 new_dev_instance);
245
246   /* Interface flow offload operations */
247   vnet_flow_dev_ops_function_t *flow_ops_function;
248
249   /* Format device instance as name. */
250   format_function_t *format_device_name;
251
252   /* Parse function for device name. */
253   unformat_function_t *unformat_device_name;
254
255   /* Format device verbosely for this class. */
256   format_function_t *format_device;
257
258   /* Trace buffer format for TX function. */
259   format_function_t *format_tx_trace;
260
261   /* Format flow offload entry */
262   format_function_t *format_flow;
263
264   vnet_dev_class_ip_tunnel_desc_t ip_tun_desc;
265
266   /* Function to clear hardware counters for device. */
267   void (*clear_counters) (u32 dev_class_instance);
268
269     uword (*is_valid_class_for_interface) (struct vnet_main_t * vnm,
270                                            u32 hw_if_index,
271                                            u32 hw_class_index);
272
273   /* Called when hardware class of an interface changes. */
274   void (*hw_class_change) (struct vnet_main_t * vnm,
275                            u32 hw_if_index, u32 new_hw_class_index);
276
277   /* Called to redirect traffic from a specific interface instance */
278   void (*rx_redirect_to_node) (struct vnet_main_t * vnm,
279                                u32 hw_if_index, u32 node_index);
280
281   /* Link-list of all device classes set up by constructors created below */
282   struct _vnet_device_class *next_class_registration;
283
284   /* Function to set mac address. */
285   vnet_interface_set_mac_address_function_t *mac_addr_change_function;
286
287   /* Function to add/delete additional MAC addresses */
288   vnet_interface_add_del_mac_address_function_t *mac_addr_add_del_function;
289
290   /* Interface to set rss queues of the interface */
291   vnet_interface_rss_queues_set_t *set_rss_queues_function;
292
293 } vnet_device_class_t;
294
#ifndef CLIB_MARCH_VARIANT
/*
 * Declare device class x (optional storage specifiers in __VA_ARGS__) and
 * emit a constructor that pushes it onto vnm->device_class_registrations
 * plus a destructor that removes it again.  The expansion ends in an open
 * declaration of x so the caller can attach " = { ... };".
 */
#define VNET_DEVICE_CLASS(x, ...)                                             \
  __VA_ARGS__ vnet_device_class_t x;                                          \
                                                                              \
  static void __vnet_add_device_class_registration_##x (void)                 \
    __attribute__ ((__constructor__));                                        \
  static void __vnet_add_device_class_registration_##x (void)                 \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    x.next_class_registration = vnm->device_class_registrations;              \
    vnm->device_class_registrations = &x;                                     \
  }                                                                           \
                                                                              \
  static void __vnet_rm_device_class_registration_##x (void)                  \
    __attribute__ ((__destructor__));                                         \
  static void __vnet_rm_device_class_registration_##x (void)                  \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    VLIB_REMOVE_FROM_LINKED_LIST (vnm->device_class_registrations, &x,        \
                                  next_class_registration);                   \
  }                                                                           \
                                                                              \
  __VA_ARGS__ vnet_device_class_t x
#else
/* create unused pointer to silence compiler warnings and get whole
   function optimized out */
#define VNET_DEVICE_CLASS(x, ...)                                             \
  static __clib_unused vnet_device_class_t __clib_unused_##x
#endif
321
/*
 * Open the definition of the (march-suffixed) tx function of devclass.
 * Besides the function header, this emits a registration record for the
 * function and a constructor that stamps the record with the march variant
 * and pushes it onto devclass.tx_fn_registrations.
 */
#define VNET_DEVICE_CLASS_TX_FN(devclass)                                     \
  uword CLIB_MARCH_SFX (devclass##_tx_fn) ();                                 \
                                                                              \
  static vlib_node_fn_registration_t CLIB_MARCH_SFX (                         \
    devclass##_tx_fn_registration) = {                                        \
    .function = &CLIB_MARCH_SFX (devclass##_tx_fn),                           \
  };                                                                          \
                                                                              \
  static void __clib_constructor CLIB_MARCH_SFX (                             \
    devclass##_tx_fn_multiarch_register) (void)                               \
  {                                                                           \
    extern vnet_device_class_t devclass;                                      \
    vlib_node_fn_registration_t *reg =                                        \
      &CLIB_MARCH_SFX (devclass##_tx_fn_registration);                        \
    reg->march_variant = CLIB_MARCH_SFX (CLIB_MARCH_VARIANT_TYPE);            \
    reg->next_registration = devclass.tx_fn_registrations;                    \
    devclass.tx_fn_registrations = reg;                                       \
  }                                                                           \
                                                                              \
  uword CLIB_MARCH_SFX (devclass##_tx_fn)
340
/**
 * Link Type: describes the protocol of the packets carried on a link.
 * On an ethernet link this maps directly into the ethertype; on a GRE
 * tunnel it maps to the GRE-proto, and so on for other link types.
 *
 * The first enumerator is 1 in debug images (CLIB_DEBUG > 0) and 0
 * otherwise. NOTE(review): presumably so that a zeroed, never-initialised
 * link type is not a valid value in debug builds - confirm.
 */
typedef enum vnet_link_t_
{
#if CLIB_DEBUG > 0
  VNET_LINK_IP4 = 1,
#else
  VNET_LINK_IP4 = 0,
#endif
  VNET_LINK_IP6,
  VNET_LINK_MPLS,
  VNET_LINK_ETHERNET,
  VNET_LINK_ARP,
  VNET_LINK_NSH,
} __attribute__ ((packed)) vnet_link_t;
359
/* Initializer for an array of link type names indexed by vnet_link_t. */
#define VNET_LINKS                                                            \
  {                                                                           \
    [VNET_LINK_IP4] = "ipv4",                                                 \
    [VNET_LINK_IP6] = "ipv6",                                                 \
    [VNET_LINK_MPLS] = "mpls",                                                \
    [VNET_LINK_ETHERNET] = "ethernet",                                        \
    [VNET_LINK_ARP] = "arp",                                                  \
    [VNET_LINK_NSH] = "nsh",                                                  \
  }
368
/*
 * Loop headers iterating _link over every link type (FOR_EACH_VNET_LINK) or
 * over the IP link types only (FOR_EACH_VNET_IP_LINK).
 *
 * _link must be a modifiable lvalue. It is parenthesized at every use so
 * that expression arguments such as *p are incremented as a whole instead
 * of being re-associated with the ++ operator (*p++ would advance p).
 */
#define FOR_EACH_VNET_LINK(_link)                                             \
  for ((_link) = VNET_LINK_IP4; (_link) <= VNET_LINK_NSH; (_link)++)

#define FOR_EACH_VNET_IP_LINK(_link)                                          \
  for ((_link) = VNET_LINK_IP4; (_link) <= VNET_LINK_IP6; (_link)++)
378
/**
 * @brief Number of link types. Deliberately kept out of the enum so that
 * switch statements over vnet_link_t do not have to handle it.
 */
#define VNET_LINK_NUM (VNET_LINK_NSH + 1)

/** @brief Alias of VNET_LINK_NUM. */
#define VNET_N_LINKS VNET_LINK_NUM
385
386 /**
387  * @brief Convert a link to to an Ethertype
388  */
389 extern vnet_l3_packet_type_t vnet_link_to_l3_proto (vnet_link_t link);
390
/**
 * @brief Attributes that can be assigned to a HW interface class.
 */
typedef enum vnet_hw_interface_class_flags_t_
{
  /** @brief the class is a point-to-point interface */
  VNET_HW_INTERFACE_CLASS_FLAG_P2P = (1 << 0),

  /** @brief the class is a non-broadcast multiple access interface */
  VNET_HW_INTERFACE_CLASS_FLAG_NBMA = (1 << 1),
} vnet_hw_interface_class_flags_t;
405
406 /* Layer-2 (e.g. Ethernet) interface class. */
407 typedef struct _vnet_hw_interface_class
408 {
409   /* Index into main vector. */
410   u32 index;
411
412   /* Class name (e.g. "Ethernet"). */
413   char *name;
414
415   /* Flags */
416   vnet_hw_interface_class_flags_t flags;
417
418   /* tx hash type for interfaces of this hw class */
419   vnet_hash_fn_type_t tx_hash_fn_type;
420
421   /* Function to call when hardware interface is added/deleted. */
422   vnet_interface_function_t *interface_add_del_function;
423
424   /* Function to bring interface administratively up/down. */
425   vnet_interface_function_t *admin_up_down_function;
426
427   /* Function to call when link state changes. */
428   vnet_interface_function_t *link_up_down_function;
429
430   /* Function to call when link MAC changes. */
431   vnet_interface_set_mac_address_function_t *mac_addr_change_function;
432
433   /* Function to add/delete additional MAC addresses */
434   vnet_interface_add_del_mac_address_function_t *mac_addr_add_del_function;
435   /* Function to set mtu. */
436   vnet_interface_set_mtu_function_t *set_mtu;
437
438   /* Format function to display interface name. */
439   format_function_t *format_interface_name;
440
441   /* Format function to display interface address. */
442   format_function_t *format_address;
443
444   /* Format packet header for this interface class. */
445   format_function_t *format_header;
446
447   /* Format device verbosely for this class. */
448   format_function_t *format_device;
449
450   /* Parser for hardware (e.g. ethernet) address. */
451   unformat_function_t *unformat_hw_address;
452
453   /* Parser for packet header for e.g. rewrite string. */
454   unformat_function_t *unformat_header;
455
456   /* Builds a rewrite string for the interface to the destination
457    * for the payload/link type. */
458   u8 *(*build_rewrite) (struct vnet_main_t * vnm,
459                         u32 sw_if_index,
460                         vnet_link_t link_type, const void *dst_hw_address);
461
462   /* Update an adjacency added by FIB (as opposed to via the
463    * neighbour resolution protocol). */
464   void (*update_adjacency) (struct vnet_main_t * vnm,
465                             u32 sw_if_index, u32 adj_index);
466
467     uword (*is_valid_class_for_interface) (struct vnet_main_t * vnm,
468                                            u32 hw_if_index,
469                                            u32 hw_class_index);
470
471   /* Called when hw interface class is changed and old hardware instance
472      may want to be deleted. */
473   void (*hw_class_change) (struct vnet_main_t * vnm, u32 hw_if_index,
474                            u32 old_class_index, u32 new_class_index);
475
476   /* List of hw interface classes, built by constructors */
477   struct _vnet_hw_interface_class *next_class_registration;
478
479 } vnet_hw_interface_class_t;
480
481 /**
482  * @brief Return a complete, zero-length (aka placeholder) rewrite
483  */
484 extern u8 *default_build_rewrite (struct vnet_main_t *vnm,
485                                   u32 sw_if_index,
486                                   vnet_link_t link_type,
487                                   const void *dst_hw_address);
488
489 /**
490  * @brief Default adjacency update function
491  */
492 extern void default_update_adjacency (struct vnet_main_t *vnm,
493                                       u32 sw_if_index, u32 adj_index);
494
/*
 * Declare hw interface class x (optional storage specifiers in __VA_ARGS__)
 * and emit a constructor that pushes it onto
 * vnm->hw_interface_class_registrations plus a destructor that removes it
 * again.  The expansion ends in an open declaration of x so the caller can
 * attach " = { ... };".
 */
#define VNET_HW_INTERFACE_CLASS(x, ...)                                       \
  __VA_ARGS__ vnet_hw_interface_class_t x;                                    \
                                                                              \
  static void __vnet_add_hw_interface_class_registration_##x (void)           \
    __attribute__ ((__constructor__));                                        \
  static void __vnet_add_hw_interface_class_registration_##x (void)           \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    x.next_class_registration = vnm->hw_interface_class_registrations;        \
    vnm->hw_interface_class_registrations = &x;                               \
  }                                                                           \
                                                                              \
  static void __vnet_rm_hw_interface_class_registration_##x (void)            \
    __attribute__ ((__destructor__));                                         \
  static void __vnet_rm_hw_interface_class_registration_##x (void)            \
  {                                                                           \
    vnet_main_t *vnm = vnet_get_main ();                                      \
    VLIB_REMOVE_FROM_LINKED_LIST (vnm->hw_interface_class_registrations, &x,  \
                                  next_class_registration);                   \
  }                                                                           \
                                                                              \
  __VA_ARGS__ vnet_hw_interface_class_t x
514
/* Per hardware interface state flags. */
typedef enum vnet_hw_interface_flags_t_
{
  VNET_HW_INTERFACE_FLAG_NONE = 0,

  /* The hardware link is up. */
  VNET_HW_INTERFACE_FLAG_LINK_UP = (1 << 0),

  /* Hardware duplex state. */
  VNET_HW_INTERFACE_FLAG_HALF_DUPLEX = (1 << 1),
  VNET_HW_INTERFACE_FLAG_FULL_DUPLEX = (1 << 2),

  /* Non-broadcast multiple access interface. */
  VNET_HW_INTERFACE_FLAG_NBMA = (1 << 19),
} vnet_hw_interface_flags_t;
527
/*
 * X-macro list of hardware interface capabilities.
 * Each entry is _ (bit position, enumerator suffix, display string); the
 * user defines _ before expanding the list and undefines it afterwards.
 */
#define foreach_vnet_hw_if_caps                                               \
  /* transmit checksum offloads */                                            \
  _ (0, TX_IP4_CKSUM, "ip4-csum-tx")                                          \
  _ (1, TX_TCP_CKSUM, "tcp-csum-tx")                                          \
  _ (2, TX_UDP_CKSUM, "udp-csum-tx")                                          \
  _ (3, TX_IP4_OUTER_CKSUM, "outer-ip4-csum-tx")                              \
  _ (4, TX_UDP_OUTER_CKSUM, "outer-udp-csum-tx")                              \
  /* receive checksum offloads */                                             \
  _ (5, RX_IP4_CKSUM, "ip4-csum-rx")                                          \
  _ (6, RX_TCP_CKSUM, "tcp-csum-rx")                                          \
  _ (7, RX_UDP_CKSUM, "udp-csum-rx")                                          \
  _ (8, RX_IP4_OUTER_CKSUM, "outer-ip4-csum-rx")                              \
  _ (9, RX_UDP_OUTER_CKSUM, "outer-udp-csum-rx")                              \
  /* segmentation offloads */                                                 \
  _ (10, TCP_GSO, "tcp-tso")                                                  \
  _ (11, UDP_GSO, "udp-gso")                                                  \
  _ (12, VXLAN_TNL_GSO, "vxlan-tnl-gso")                                      \
  _ (13, IPIP_TNL_GSO, "ipip-tnl-gso")                                        \
  _ (14, GENEVE_TNL_GSO, "geneve-tnl-gso")                                    \
  _ (15, GRE_TNL_GSO, "gre-tnl-gso")                                          \
  _ (16, UDP_TNL_GSO, "udp-tnl-gso")                                          \
  _ (17, IP_TNL_GSO, "ip-tnl-gso")                                            \
  _ (18, TCP_LRO, "tcp-lro")                                                  \
  /* miscellaneous */                                                         \
  _ (30, INT_MODE, "int-mode")                                                \
  _ (31, MAC_FILTER, "mac-filter")
550
/*
 * Capability bits of a hardware interface: one VNET_HW_IF_CAP_<sfx>
 * enumerator per entry of foreach_vnet_hw_if_caps, valued 1 << bit.
 * NOTE(review): the bit 31 entry evaluates 1 << 31 on a signed int, which
 * ISO C leaves undefined; kept as is because switching to an unsigned
 * constant could change the signedness of the enum - confirm before
 * touching.
 */
typedef enum vnet_hw_if_caps_t_
{
  VNET_HW_INTERFACE_CAP_NONE = 0,
#define _(bit, sfx, str) VNET_HW_IF_CAP_##sfx = (1 << (bit)),
  foreach_vnet_hw_if_caps
#undef _
} vnet_hw_if_caps_t;
559
/* Composite capability masks built from the single-bit capabilities. */

/* Transmit: L4 (TCP + UDP) checksum offload. */
#define VNET_HW_IF_CAP_L4_TX_CKSUM                                            \
  (VNET_HW_IF_CAP_TX_TCP_CKSUM | VNET_HW_IF_CAP_TX_UDP_CKSUM)

/* Transmit: IPv4 header plus L4 checksum offload. */
#define VNET_HW_IF_CAP_TX_CKSUM                                               \
  (VNET_HW_IF_CAP_TX_IP4_CKSUM | VNET_HW_IF_CAP_L4_TX_CKSUM)

/* Transmit: outer header (IPv4 + UDP) checksum offload. */
#define VNET_HW_IF_CAP_TX_OUTER_CKSUM                                         \
  (VNET_HW_IF_CAP_TX_IP4_OUTER_CKSUM | VNET_HW_IF_CAP_TX_UDP_OUTER_CKSUM)

/* Transmit: every checksum offload bit, inner and outer. */
#define VNET_HW_IF_CAP_TX_CKSUM_MASK                                          \
  (VNET_HW_IF_CAP_TX_CKSUM | VNET_HW_IF_CAP_TX_OUTER_CKSUM)

/* Receive: L4 (TCP + UDP) checksum offload. */
#define VNET_HW_IF_CAP_L4_RX_CKSUM                                            \
  (VNET_HW_IF_CAP_RX_TCP_CKSUM | VNET_HW_IF_CAP_RX_UDP_CKSUM)

/* Receive: IPv4 header plus L4 checksum offload. */
#define VNET_HW_IF_CAP_RX_CKSUM                                               \
  (VNET_HW_IF_CAP_RX_IP4_CKSUM | VNET_HW_IF_CAP_L4_RX_CKSUM)
579
/*
 * Tunnel GSO capabilities covered by this mask (VXLAN and IPIP).
 * The expansion is parenthesized so the mask behaves as a single operand:
 * without the parentheses "caps & VNET_HW_IF_CAP_TNL_GSO_MASK" would parse
 * as "(caps & VXLAN) | IPIP", which is non-zero for every value of caps.
 */
#define VNET_HW_IF_CAP_TNL_GSO_MASK                                           \
  (VNET_HW_IF_CAP_VXLAN_TNL_GSO | VNET_HW_IF_CAP_IPIP_TNL_GSO)
582
/* Bit position of the duplex flags inside vnet_hw_interface_flags_t. */
#define VNET_HW_INTERFACE_FLAG_DUPLEX_SHIFT 1
/* Bit position named for the speed field; no enumerator visible in this
   header uses it. */
#define VNET_HW_INTERFACE_FLAG_SPEED_SHIFT 3
/* Mask selecting both duplex flags. */
#define VNET_HW_INTERFACE_FLAG_DUPLEX_MASK                                    \
  (VNET_HW_INTERFACE_FLAG_FULL_DUPLEX | VNET_HW_INTERFACE_FLAG_HALF_DUPLEX)
588
589 typedef struct
590 {
591   /* hw interface index */
592   u32 hw_if_index;
593
594   /* device instance */
595   u32 dev_instance;
596
597   /* index of thread pollling this queue */
598   u32 thread_index;
599
600   /* file index of queue interrupt line */
601   u32 file_index;
602
603   /* hardware queue identifier */
604   u32 queue_id;
605
606   /* mode */
607   vnet_hw_if_rx_mode mode : 8;
608 #define VNET_HW_IF_RXQ_THREAD_ANY      ~0
609 #define VNET_HW_IF_RXQ_NO_RX_INTERRUPT ~0
610 } vnet_hw_if_rx_queue_t;
611
612 typedef struct
613 {
614   u8 shared_queue : 1;
615   /* hw interface index */
616   u32 hw_if_index;
617
618   /* hardware queue identifier */
619   u32 queue_id;
620
621   /* bitmap of threads which use this queue */
622   clib_bitmap_t *threads;
623 } vnet_hw_if_tx_queue_t;
624
/* Hint bits that can be attached to a tx frame. */
typedef enum
{
  VNET_HW_IF_TX_FRAME_HINT_NOT_CHAINED = (1 << 0),
  VNET_HW_IF_TX_FRAME_HINT_NO_GSO = (1 << 1),
  VNET_HW_IF_TX_FRAME_HINT_NO_CKSUM_OFFLOAD = (1 << 2),
} vnet_hw_if_tx_frame_hint_t;
631
632 typedef struct
633 {
634   u8 shared_queue : 1;
635   vnet_hw_if_tx_frame_hint_t hints : 16;
636   u32 queue_id;
637 } vnet_hw_if_tx_frame_t;
638
639 typedef struct
640 {
641   CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
642   vnet_hw_if_tx_frame_t *frame;
643   u32 *lookup_table;
644   u32 n_queues;
645 } vnet_hw_if_output_node_runtime_t;
646
647 /* Hardware-interface.  This corresponds to a physical wire
648    that packets flow over. */
649 typedef struct vnet_hw_interface_t
650 {
651   CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
652   /* flags */
653   vnet_hw_interface_flags_t flags;
654
655   /* capabilities flags */
656   vnet_hw_if_caps_t caps;
657
658   /* Hardware address as vector.  Zero (e.g. zero-length vector) if no
659      address for this class (e.g. PPP). */
660   u8 *hw_address;
661
662   /* Interface is up as far as software is concerned. */
663   /* NAME.{output,tx} nodes for this interface. */
664   u32 output_node_index, tx_node_index;
665
666   /* interface-output-arc-end node next index for tx node */
667   u32 if_out_arc_end_node_next_index;
668
669   /* (dev_class, dev_instance) uniquely identifies hw interface. */
670   u32 dev_class_index;
671   u32 dev_instance;
672
673   /* (hw_class, hw_instance) uniquely identifies hw interface. */
674   u32 hw_class_index;
675   u32 hw_instance;
676
677   /* Hardware index for this hardware interface. */
678   u32 hw_if_index;
679
680   /* Software index for this hardware interface. */
681   u32 sw_if_index;
682
683   /* per thread output-node runtimes */
684   vnet_hw_if_output_node_runtime_t *output_node_thread_runtimes;
685
686   CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
687
688   /* Interface name. */
689   u8 *name;
690
691   /* link speed in kbps */
692   u32 link_speed;
693
694   /* Next index in interface-output node for this interface
695      used by node function vnet_per_buffer_interface_output() */
696   u32 output_node_next_index;
697
698   /* called when hw interface is using transmit side packet steering */
699   vnet_hash_fn_t hf;
700
701   /* Maximum transmit rate for this interface in bits/sec. */
702   f64 max_rate_bits_per_sec;
703
704   /* Smallest packet size supported by this interface. */
705   u32 min_supported_packet_bytes;
706
707   /* Largest packet size supported by this interface. */
708   u32 max_supported_packet_bytes;
709
710   /* Smallest packet size for this interface. */
711   u32 min_packet_bytes;
712
713   /* Largest packet size for this interface. */
714   u32 max_packet_bytes;
715
716   /* Hash table mapping sub interface id to sw_if_index. */
717   uword *sub_interface_sw_if_index_by_id;
718
719   /* Count of number of L2 and L3 subinterfaces */
720   u32 l2_if_count;
721   u32 l3_if_count;
722
723   /* Bonded interface info -
724      0       - not a bonded interface nor a slave
725      ~0      - slave to a bonded interface
726      others  - A bonded interface with a pointer to bitmap for all slaves */
727   uword *bond_info;
728 #define VNET_HW_INTERFACE_BOND_INFO_NONE ((uword *) 0)
729 #define VNET_HW_INTERFACE_BOND_INFO_SLAVE ((uword *) ~0)
730
731   /* Input node */
732   u32 input_node_index;
733
734   vnet_hw_if_rx_mode default_rx_mode;
735
736   /* rx queues */
737   u32 *rx_queue_indices;
738
739   /* tx queues */
740   u32 *tx_queue_indices;
741
742   /* numa node that hardware device connects to */
743   u8 numa_node;
744
745   /* rss queues bitmap */
746   clib_bitmap_t *rss_queues;
747
748   /* trace */
749   i32 n_trace;
750
751   u32 trace_classify_table_index;
752 } vnet_hw_interface_t;
753
/* Compile-time layout check: the cacheline1 marker of vnet_hw_interface_t
   is expected at offset CLIB_CACHE_LINE_BYTES from the start of the
   structure. */
STATIC_ASSERT_OFFSET_OF (vnet_hw_interface_t, cacheline1,
                         CLIB_CACHE_LINE_BYTES);
756
/* One RX queue reference: a device instance plus a queue id.
   Used as the element type of the rxq_vector_int / rxq_vector_poll members
   of vnet_hw_if_rx_node_runtime_t. */
typedef struct
{
  /* Device instance the queue belongs to. */
  u32 dev_instance;
  /* Queue id (presumably relative to that device -- TODO confirm). */
  u32 queue_id;
} vnet_hw_if_rxq_poll_vector_t;
762
/* RX node runtime data: two lists of RX queue references and an opaque
   interrupt-state pointer.
   NOTE(review): the _int / _poll suffixes presumably separate queues served
   in interrupt mode from queues served in polling mode -- confirm against
   the code that fills these in. */
typedef struct
{
  vnet_hw_if_rxq_poll_vector_t *rxq_vector_int;
  vnet_hw_if_rxq_poll_vector_t *rxq_vector_poll;
  /* Opaque pointer; its concrete type is not visible in this header. */
  void *rxq_interrupts;
} vnet_hw_if_rx_node_runtime_t;
769
/* Device class object defined outside this header
   (presumably the class of the local interface -- TODO confirm). */
extern vnet_device_class_t vnet_local_interface_device_class;
771
/* Kind of software interface; stored in the 'type' bit-field of
   vnet_sw_interface_t. */
typedef enum
{
  /* A hw interface. */
  VNET_SW_INTERFACE_TYPE_HARDWARE,

  /* A sub-interface. */
  VNET_SW_INTERFACE_TYPE_SUB,
  /* Interface described by the 'p2p' member of vnet_sw_interface_t
     (presumably a point-to-point sub-interface -- TODO confirm). */
  VNET_SW_INTERFACE_TYPE_P2P,
  /* NOTE(review): presumably a pipe interface; not described in this
     header. */
  VNET_SW_INTERFACE_TYPE_PIPE,
} vnet_sw_interface_type_t;
782
/* Sub-interface description: an id plus the Ethernet classification data
   used to associate a packet header with the sub-interface. */
typedef struct
{
  /*
   * Subinterface ID. A number 0-N to uniquely identify
   * this subinterface under the main (parent?) interface
   */
  u32 id;

  /* Classification data. Used to associate packet header with subinterface. */
  struct
  {
    u16 outer_vlan_id;
    u16 inner_vlan_id;
    /* The anonymous union lets the individual flag bits below be read or
       written as one 16-bit value through raw_flags. */
    union
    {
      u16 raw_flags;
      struct
      {
        /* Tag-count selectors (presumably: match untagged, single-tagged,
           double-tagged frames -- TODO confirm). */
        u16 no_tags:1;
        u16 one_tag:1;
        u16 two_tags:1;
        u16 dot1ad:1;           /* 0 = dot1q, 1=dot1ad */
        u16 exact_match:1;
        u16 default_sub:1;
        /* Presumably: wildcard for the outer / inner VLAN id instead of
           the specific outer_vlan_id / inner_vlan_id -- TODO confirm. */
        u16 outer_vlan_id_any:1;
        u16 inner_vlan_id_any:1;
      } flags;
    };
  } eth;
} vnet_sub_interface_t;
813
/* Data for a VNET_SW_INTERFACE_TYPE_P2P software interface (held in the
   'p2p' member of vnet_sw_interface_t). */
typedef struct
{
  /*
   * Subinterface ID. A number 0-N to uniquely identify
   * this subinterface under the main interface
   */
  u32 id;
  /* NOTE(review): index into a pool that is not visible in this header --
     confirm which pool. */
  u32 pool_index;
  /* 6-byte MAC address of the client. */
  u8 client_mac[6];
} vnet_p2p_sub_interface_t;
824
/* Flood class of a software interface (see the flood_class member of
   vnet_sw_interface_t). */
typedef enum
{
  /* The BVI interface */
  VNET_FLOOD_CLASS_BVI,
  /* Always flood */
  VNET_FLOOD_CLASS_NORMAL,
  /* Tunnel master; see VNET_FLOOD_CLASS_TUNNEL_NORMAL below */
  VNET_FLOOD_CLASS_TUNNEL_MASTER,
  /* Does not flood when tunnel master is in the same L2 BD */
  VNET_FLOOD_CLASS_TUNNEL_NORMAL,
  /* Never flood to this type */
  VNET_FLOOD_CLASS_NO_FLOOD,
} vnet_flood_class_t;
837
/* Per protocol MTU.
   The enumerators index the mtu[] array of vnet_sw_interface_t;
   VNET_N_MTU is the number of entries and must stay last. */
typedef enum
{
  VNET_MTU_L3,                  /* Default payload MTU (without L2 headers) */
  VNET_MTU_IP4,                 /* Per-protocol MTUs overriding default */
  VNET_MTU_IP6,
  VNET_MTU_MPLS,
  VNET_N_MTU                    /* Count of MTU kinds, not an MTU kind itself */
} vnet_mtu_t;
847
/* Map a link type to its vnet_mtu_t value.  Defined outside this header;
   the exact mapping is not visible here. */
extern vnet_mtu_t vnet_link_to_mtu (vnet_link_t link);
849
/* Software interface flag bits.  Each enumerator is a distinct bit so the
   values can be OR-ed together.  The enum is declared packed; all values
   defined here fit in the low 8 bits. */
typedef enum vnet_sw_interface_flags_t_
{
  VNET_SW_INTERFACE_FLAG_NONE = 0,
  /* Interface is "up" meaning administratively up.
     Up in the sense of link state being up is maintained by hardware interface. */
  VNET_SW_INTERFACE_FLAG_ADMIN_UP = (1 << 0),

  /* Interface is disabled for forwarding: punt all traffic to slow-path. */
  VNET_SW_INTERFACE_FLAG_PUNT = (1 << 1),

  /* Placeholder for bit 2 (the "UNSUED" spelling is part of the existing
     identifier and is kept as is). */
  __VNET_SW_INTERFACE_FLAG_UNSUED = (1 << 2),

  /* Interface is unnumbered; see unnumbered_sw_if_index in
     vnet_sw_interface_t. */
  VNET_SW_INTERFACE_FLAG_UNNUMBERED = (1 << 3),

  /* Placeholder for bit 4. */
  __VNET_SW_INTERFACE_FLAG_UNUSED2 = (1 << 4),

  /* Interface does not appear in CLI/API */
  VNET_SW_INTERFACE_FLAG_HIDDEN = (1 << 5),

  /* Interface in ERROR state */
  VNET_SW_INTERFACE_FLAG_ERROR = (1 << 6),

  /* Interface has IP configured directed broadcast */
  VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST = (1 << 7),

} __attribute__ ((packed)) vnet_sw_interface_flags_t;
876
/* Software-interface.  This corresponds to a Ethernet VLAN, ATM vc, a
   tunnel, etc.  Configuration (e.g. IP address) gets attached to
   software interface. */
typedef struct
{
  /* Kind of interface, stored in a 16-bit bit-field. */
  vnet_sw_interface_type_t type:16;

  /* VNET_SW_INTERFACE_FLAG_* bits. */
  vnet_sw_interface_flags_t flags;

  /* Index for this interface. */
  u32 sw_if_index;

  /* Software interface index of super-interface;
     equal to sw_if_index if this interface is not a
     sub-interface. */
  u32 sup_sw_if_index;

  /* this swif is unnumbered, use addresses on unnumbered_sw_if_index... */
  u32 unnumbered_sw_if_index;

  /* VNET_SW_INTERFACE_TYPE_HARDWARE.
     (presumably the index of the backing hardware interface -- TODO
     confirm whether it is meaningful for the other types) */
  u32 hw_if_index;

  /* MTU for network layer (not including L2 headers); one entry per
     vnet_mtu_t value. */
  u32 mtu[VNET_N_MTU];

  /* VNET_SW_INTERFACE_TYPE_SUB. */
  vnet_sub_interface_t sub;

  /* VNET_SW_INTERFACE_TYPE_P2P. */
  vnet_p2p_sub_interface_t p2p;

  /* Flood class of this interface; see vnet_flood_class_t. */
  vnet_flood_class_t flood_class;
} vnet_sw_interface_t;
911
/* Interface counter indices.
   This single enum holds two independent index spaces -- simple counters
   and combined counters -- so numeric values repeat between the two groups
   (e.g. VNET_INTERFACE_COUNTER_DROP and VNET_INTERFACE_COUNTER_RX are both
   0).  Each group ends with its own count enumerator. */
typedef enum
{
  /* Simple counters. */
  VNET_INTERFACE_COUNTER_DROP = 0,
  VNET_INTERFACE_COUNTER_PUNT = 1,
  VNET_INTERFACE_COUNTER_IP4 = 2,
  VNET_INTERFACE_COUNTER_IP6 = 3,
  VNET_INTERFACE_COUNTER_RX_NO_BUF = 4,
  VNET_INTERFACE_COUNTER_RX_MISS = 5,
  VNET_INTERFACE_COUNTER_RX_ERROR = 6,
  VNET_INTERFACE_COUNTER_TX_ERROR = 7,
  VNET_INTERFACE_COUNTER_MPLS = 8,
  /* Number of simple counters. */
  VNET_N_SIMPLE_INTERFACE_COUNTER = 9,
  /* Combined counters. */
  VNET_INTERFACE_COUNTER_RX = 0,
  VNET_INTERFACE_COUNTER_RX_UNICAST = 1,
  VNET_INTERFACE_COUNTER_RX_MULTICAST = 2,
  VNET_INTERFACE_COUNTER_RX_BROADCAST = 3,
  VNET_INTERFACE_COUNTER_TX = 4,
  VNET_INTERFACE_COUNTER_TX_UNICAST = 5,
  VNET_INTERFACE_COUNTER_TX_MULTICAST = 6,
  VNET_INTERFACE_COUNTER_TX_BROADCAST = 7,
  /* Number of combined counters. */
  VNET_N_COMBINED_INTERFACE_COUNTER = 8,
} vnet_interface_counter_type_t;
936
/* Loop header that iterates _x over the RX combined counters, from
   VNET_INTERFACE_COUNTER_RX to VNET_INTERFACE_COUNTER_RX_BROADCAST
   inclusive.  Follow it with the loop body.

   _x must be a modifiable lvalue.  It is evaluated several times, so it
   must not have side effects.  Every use is parenthesized so that an
   argument such as *p expands to (*p)++ and not to *p++ (which would
   advance the pointer instead of the counter). */
#define foreach_rx_combined_interface_counter(_x)               \
  for ((_x) = VNET_INTERFACE_COUNTER_RX;                        \
       (_x) <= VNET_INTERFACE_COUNTER_RX_BROADCAST;             \
       (_x)++)
941
/* Loop header that iterates _x over the TX combined counters, from
   VNET_INTERFACE_COUNTER_TX to VNET_INTERFACE_COUNTER_TX_BROADCAST
   inclusive.  Follow it with the loop body.

   _x must be a modifiable lvalue.  It is evaluated several times, so it
   must not have side effects.  Every use is parenthesized so that an
   argument such as *p expands to (*p)++ and not to *p++ (which would
   advance the pointer instead of the counter). */
#define foreach_tx_combined_interface_counter(_x)               \
  for ((_x) = VNET_INTERFACE_COUNTER_TX;                        \
       (_x) <= VNET_INTERFACE_COUNTER_TX_BROADCAST;             \
       (_x)++)
946
/* X-macro listing the simple interface counters.  The user defines
   _(sym, name, prefix) before expanding this list.
   Each 'sym' matches the suffix of a simple-counter enumerator
   VNET_INTERFACE_COUNTER_<sym>, and the entries are in the same order as
   those enumerators.
   NOTE(review): 'name' and 'prefix' are presumably the display name and
   name prefix of the counter -- confirm against the users of this list. */
#define foreach_simple_interface_counter_name   \
  _(DROP, drops, if)                            \
  _(PUNT, punt, if)                             \
  _(IP4, ip4, if)                               \
  _(IP6, ip6, if)                               \
  _(RX_NO_BUF, rx-no-buf, if)                   \
  _(RX_MISS, rx-miss, if)                       \
  _(RX_ERROR, rx-error, if)                     \
  _(TX_ERROR, tx-error, if)         \
  _(MPLS, mpls, if)
957
/* X-macro listing the combined interface counters.  The user defines
   _(sym, name, prefix) before expanding this list.
   Each 'sym' matches the suffix of a combined-counter enumerator
   VNET_INTERFACE_COUNTER_<sym>, and the entries are in the same order as
   those enumerators.
   NOTE(review): 'name' and 'prefix' are presumably the display name and
   name prefix of the counter -- confirm against the users of this list. */
#define foreach_combined_interface_counter_name \
  _(RX, rx, if)                                 \
  _(RX_UNICAST, rx-unicast, if)                 \
  _(RX_MULTICAST, rx-multicast, if)             \
  _(RX_BROADCAST, rx-broadcast, if)             \
  _(TX, tx, if)                                 \
  _(TX_UNICAST, tx-unicast, if)                 \
  _(TX_MULTICAST, tx-multicast, if)             \
  _(TX_BROADCAST, tx-broadcast, if)
967
/* Interface statistics collection mode: simple (0) or detailed (1). */
typedef enum
{
  COLLECT_SIMPLE_STATS = 0,
  COLLECT_DETAILED_STATS = 1,
} vnet_interface_stats_collection_mode_e;
973
/* Global flag read by collect_detailed_interface_stats (); defined outside
   this header. */
extern int collect_detailed_interface_stats_flag;

/* Return the current value of collect_detailed_interface_stats_flag.
   NOTE(review): non-zero presumably means detailed stats collection is
   enabled (cf. COLLECT_DETAILED_STATS) -- confirm against the setters. */
static inline int
collect_detailed_interface_stats (void)
{
  const int detailed = collect_detailed_interface_stats_flag;

  return detailed;
}
981
/* Setter / clearer for the detailed interface stats flag.  Both are defined
   outside this header; presumably they update
   collect_detailed_interface_stats_flag -- TODO confirm any additional side
   effects. */
void collect_detailed_interface_stats_flag_set (void);
void collect_detailed_interface_stats_flag_clear (void);
984
985
/* Pair of graph node indices -- an output node and a tx node -- kept for a
   hardware interface (element type of deleted_hw_interface_nodes in
   vnet_interface_main_t). */
typedef struct
{
  u32 output_node_index;
  u32 tx_node_index;
} vnet_hw_interface_nodes_t;
991
/* Per-thread interface data.  The structure starts with a cache-line
   alignment marker (presumably so that each thread's entry sits on its own
   cache line -- TODO confirm). */
typedef struct
{
  CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
  /* NOTE(review): presumably a vector of buffer indices -- confirm against
     its users. */
  u32 *split_buffers;
} vnet_interface_per_thread_data_t;
997
/* Buffer metadata format helper: takes a buffer and a u8 string 's' and
   returns a u8 string (presumably 's' with the formatted metadata
   appended -- TODO confirm).  The "opquae" spelling is part of the existing
   type name. */
typedef u8 *(*vnet_buffer_opquae_formatter_t) (const vlib_buffer_t * b,
                                               u8 * s);
1000
/* Top-level interface state: hardware and software interfaces, their
   classes, name lookup tables, counters and per-thread data. */
typedef struct
{
  /* Hardware interfaces. */
  vnet_hw_interface_t *hw_interfaces;

  /* Hardware interface RX queues */
  vnet_hw_if_rx_queue_t *hw_if_rx_queues;
  /* Lookup of RX queue index by (hw_if_index, queue_id), going by the
     member name. */
  uword *rxq_index_by_hw_if_index_and_queue_id;

  /* Hardware interface TX queues */
  vnet_hw_if_tx_queue_t *hw_if_tx_queues;
  /* Lookup of TX queue index by (hw_if_index, queue_id), going by the
     member name. */
  uword *txq_index_by_hw_if_index_and_queue_id;

  /* Hash table mapping HW interface name to index. */
  uword *hw_interface_by_name;

  /* Vectors of hardware interface classes and device classes. */
  vnet_hw_interface_class_t *hw_interface_classes;
  vnet_device_class_t *device_classes;

  /* Hash table mapping name to hw interface/device class. */
  uword *hw_interface_class_by_name;
  uword *device_class_by_name;

  /* Software interfaces. */
  vnet_sw_interface_t *sw_interfaces;

  /* Hash table mapping sub intfc sw_if_index by sup sw_if_index and sub id */
  uword *sw_if_index_by_sup_and_sub;

  /* Software interface counters both simple and combined
     packet and byte counters.
     sw_if_counter_lock is taken and released through
     vnet_interface_counter_lock () / vnet_interface_counter_unlock (). */
  clib_spinlock_t sw_if_counter_lock;
  vlib_simple_counter_main_t *sw_if_counters;
  vlib_combined_counter_main_t *combined_sw_if_counters;

  /* NOTE(review): presumably the node indices of deleted hardware
     interfaces, kept for later reuse -- confirm. */
  vnet_hw_interface_nodes_t *deleted_hw_interface_nodes;

  /*
   * pcap drop tracing
   * Only the drop filter hash lives here. See ../src/vlib/main.h for
   * the rest of the variables.
   */
  uword *pcap_drop_filter_hash;

  /* Buffer metadata format helper functions */
  vnet_buffer_opquae_formatter_t *buffer_opaque_format_helpers;
  vnet_buffer_opquae_formatter_t *buffer_opaque2_format_helpers;

  /* per-thread data */
  vnet_interface_per_thread_data_t *per_thread_data;

  /* feature_arc_index */
  u8 output_feature_arc_index;

  /* fast lookup tables */
  u32 *hw_if_index_by_sw_if_index;
  u16 *if_out_arc_end_next_index_by_sw_if_index;
} vnet_interface_main_t;
1060
1061 static inline void
1062 vnet_interface_counter_lock (vnet_interface_main_t * im)
1063 {
1064   if (im->sw_if_counter_lock)
1065     clib_spinlock_lock (&im->sw_if_counter_lock);
1066 }
1067
1068 static inline void
1069 vnet_interface_counter_unlock (vnet_interface_main_t * im)
1070 {
1071   if (im->sw_if_counter_lock)
1072     clib_spinlock_unlock (&im->sw_if_counter_lock);
1073 }
1074
/* Add (is_add != 0) or remove an error index to/from the pcap drop trace
   filter.  NOTE(review): presumably backed by pcap_drop_filter_hash in
   vnet_interface_main_t -- confirm in the implementation. */
void vnet_pcap_drop_trace_filter_add_del (u32 error_index, int is_add);

/* Renumber the interface name of sw_if_index using new_show_dev_instance.
   Returns an int status; the meaning of the values is not visible in this
   header. */
int vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance);

/* Register a buffer metadata format helper (presumably stored in
   buffer_opaque_format_helpers of vnet_interface_main_t -- TODO confirm). */
void vnet_register_format_buffer_opaque_helper
  (vnet_buffer_opquae_formatter_t fn);

/* Register a buffer metadata format helper for the second opaque area
   (presumably stored in buffer_opaque2_format_helpers -- TODO confirm). */
void vnet_register_format_buffer_opaque2_helper
  (vnet_buffer_opquae_formatter_t fn);
1084
/* Argument block passed to vnet_pcap_dispatch_trace_configure ().
   NOTE(review): the per-field notes below are inferred from the field names
   only; confirm against the implementation before relying on them. */
typedef struct
{
  /* Capture file name (u8 string). */
  u8 *filename;
  /* Presumably: non-zero to enable capture, zero to disable. */
  int enable;
  /* Presumably: non-zero to request a status report. */
  int status;
  /* Presumably: number of packets to capture. */
  u32 packets_to_capture;
  /* Presumably: per-packet capture size limit in bytes. */
  u32 max_bytes_per_pkt;
  /* Presumably: select capture of rx / tx / dropped packets. */
  u8 rx_enable;
  u8 tx_enable;
  u8 drop_enable;
  u8 preallocate_data;
  u8 free_data;
  /* Presumably: restrict capture to this software interface. */
  u32 sw_if_index;
  int filter;
  vlib_error_t drop_err;
} vnet_pcap_dispatch_trace_args_t;
1101
/* Configure pcap dispatch tracing from the given argument block.  Returns
   an int status; the meaning of the values is not visible in this header. */
int vnet_pcap_dispatch_trace_configure (vnet_pcap_dispatch_trace_args_t *);
1103
/* Graph node registrations defined outside this header. */
extern vlib_node_registration_t vnet_interface_output_node;
extern vlib_node_registration_t vnet_interface_output_arc_end_node;
1106
1107 #endif /* included_vnet_interface_h */
1108
1109 /*
1110  * fd.io coding-style-patch-verification: ON
1111  *
1112  * Local Variables:
1113  * eval: (c-set-style "gnu")
1114  * End:
1115  */