0ee3093f383977155b5c957c72bef3b797215a99
[vpp.git] / src / vnet / interface.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.c: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #include <vnet/vnet.h>
41 #include <vnet/plugin/plugin.h>
42 #include <vnet/fib/ip6_fib.h>
43 #include <vnet/adj/adj.h>
44 #include <vnet/adj/adj_mcast.h>
45 #include <vnet/l2/l2_input.h>
46
/*
 * Modifier bits passed to the *_set_flags_helper functions in this file.
 */
typedef enum vnet_interface_helper_flags_t_
{
  /* The interface is being created: the helpers run the add/del
     callbacks with is_create set. */
  VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE = 1 << 0,
  /* Passed by the public set-flags entry points; cleared by the sw helper
     when the underlying device class does not redistribute. */
  VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE = 1 << 1,
} vnet_interface_helper_flags_t;
52
53 static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
54                                                          u32 hw_if_index,
55                                                          vnet_hw_interface_flags_t
56                                                          flags,
57                                                          vnet_interface_helper_flags_t
58                                                          helper_flags);
59
60 static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
61                                                          u32 sw_if_index,
62                                                          vnet_sw_interface_flags_t
63                                                          flags,
64                                                          vnet_interface_helper_flags_t
65                                                          helper_flags);
66
67 static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
68                                                          u32 hw_if_index,
69                                                          u32 hw_class_index,
70                                                          u32 redistribute);
71
72 typedef struct
73 {
74   /* Either sw or hw interface index. */
75   u32 sw_hw_if_index;
76
77   /* Flags. */
78   u32 flags;
79 } vnet_sw_hw_interface_state_t;
80
81 static void
82 serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
83 {
84   vnet_sw_hw_interface_state_t *s =
85     va_arg (*va, vnet_sw_hw_interface_state_t *);
86   u32 n = va_arg (*va, u32);
87   u32 i;
88   for (i = 0; i < n; i++)
89     {
90       serialize_integer (m, s[i].sw_hw_if_index,
91                          sizeof (s[i].sw_hw_if_index));
92       serialize_integer (m, s[i].flags, sizeof (s[i].flags));
93     }
94 }
95
96 static void
97 unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
98                                             va_list * va)
99 {
100   vnet_sw_hw_interface_state_t *s =
101     va_arg (*va, vnet_sw_hw_interface_state_t *);
102   u32 n = va_arg (*va, u32);
103   u32 i;
104   for (i = 0; i < n; i++)
105     {
106       unserialize_integer (m, &s[i].sw_hw_if_index,
107                            sizeof (s[i].sw_hw_if_index));
108       unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
109     }
110 }
111
112 static vnet_sw_interface_flags_t
113 vnet_hw_interface_flags_to_sw (vnet_hw_interface_flags_t hwf)
114 {
115   vnet_sw_interface_flags_t swf = VNET_SW_INTERFACE_FLAG_NONE;
116
117   if (hwf & VNET_HW_INTERFACE_FLAG_LINK_UP)
118     swf |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
119
120   return (swf);
121 }
122
123 void
124 serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
125 {
126   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
127   vnet_sw_hw_interface_state_t *sts = 0, *st;
128   vnet_sw_interface_t *sif;
129   vnet_hw_interface_t *hif;
130   vnet_interface_main_t *im = &vnm->interface_main;
131
132   /* Serialize hardware interface classes since they may have changed.
133      Must do this before sending up/down flags. */
134   /* *INDENT-OFF* */
135   pool_foreach (hif, im->hw_interfaces, ({
136     vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
137     serialize_cstring (m, hw_class->name);
138   }));
139   /* *INDENT-ON* */
140
141   /* Send sw/hw interface state when non-zero. */
142   /* *INDENT-OFF* */
143   pool_foreach (sif, im->sw_interfaces, ({
144     if (sif->flags != 0)
145       {
146         vec_add2 (sts, st, 1);
147         st->sw_hw_if_index = sif->sw_if_index;
148         st->flags = sif->flags;
149       }
150   }));
151   /* *INDENT-ON* */
152
153   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
154
155   if (sts)
156     _vec_len (sts) = 0;
157
158   /* *INDENT-OFF* */
159   pool_foreach (hif, im->hw_interfaces, ({
160     if (hif->flags != 0)
161       {
162         vec_add2 (sts, st, 1);
163         st->sw_hw_if_index = hif->hw_if_index;
164         st->flags = vnet_hw_interface_flags_to_sw(hif->flags);
165       }
166   }));
167   /* *INDENT-ON* */
168
169   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
170
171   vec_free (sts);
172 }
173
174 static vnet_hw_interface_flags_t
175 vnet_sw_interface_flags_to_hw (vnet_sw_interface_flags_t swf)
176 {
177   vnet_hw_interface_flags_t hwf = VNET_HW_INTERFACE_FLAG_NONE;
178
179   if (swf & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
180     hwf |= VNET_HW_INTERFACE_FLAG_LINK_UP;
181
182   return (hwf);
183 }
184
185 void
186 unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
187 {
188   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
189   vnet_sw_hw_interface_state_t *sts = 0, *st;
190
191   /* First set interface hardware class. */
192   {
193     vnet_interface_main_t *im = &vnm->interface_main;
194     vnet_hw_interface_t *hif;
195     char *class_name;
196     uword *p;
197     clib_error_t *error;
198
199     /* *INDENT-OFF* */
200     pool_foreach (hif, im->hw_interfaces, ({
201       unserialize_cstring (m, &class_name);
202       p = hash_get_mem (im->hw_interface_class_by_name, class_name);
203       ASSERT (p != 0);
204       error = vnet_hw_interface_set_class_helper (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
205       if (error)
206         clib_error_report (error);
207       vec_free (class_name);
208     }));
209     /* *INDENT-ON* */
210   }
211
212   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
213   vec_foreach (st, sts)
214     vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
215                                         /* no distribute */ 0);
216   vec_free (sts);
217
218   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
219   vec_foreach (st, sts)
220   {
221     vnet_hw_interface_set_flags_helper
222       (vnm, st->sw_hw_if_index, vnet_sw_interface_flags_to_hw (st->flags),
223        /* no distribute */ 0);
224   }
225   vec_free (sts);
226 }
227
228 static clib_error_t *
229 call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
230                                       u32 flags,
231                                       _vnet_interface_function_list_elt_t **
232                                       elts)
233 {
234   _vnet_interface_function_list_elt_t *elt;
235   vnet_interface_function_priority_t prio;
236   clib_error_t *error = 0;
237
238   for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
239        prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
240     {
241       elt = elts[prio];
242
243       while (elt)
244         {
245           error = elt->fp (vnm, if_index, flags);
246           if (error)
247             return error;
248           elt = elt->next_interface_function;
249         }
250     }
251   return error;
252 }
253
254 static clib_error_t *
255 call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
256                                      u32 is_create)
257 {
258   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
259   vnet_hw_interface_class_t *hw_class =
260     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
261   vnet_device_class_t *dev_class =
262     vnet_get_device_class (vnm, hi->dev_class_index);
263   clib_error_t *error = 0;
264
265   if (hw_class->interface_add_del_function
266       && (error =
267           hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
268     return error;
269
270   if (dev_class->interface_add_del_function
271       && (error =
272           dev_class->interface_add_del_function (vnm, hw_if_index,
273                                                  is_create)))
274     return error;
275
276   error = call_elf_section_interface_callbacks
277     (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
278
279   return error;
280 }
281
282 static clib_error_t *
283 call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
284                                      u32 is_create)
285 {
286   return call_elf_section_interface_callbacks
287     (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
288 }
289
/* VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE and
   VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE are enumerators of
   vnet_interface_helper_flags_t (declared near the top of this file).
   They are intentionally not re-defined as macros here. */
292
293 static clib_error_t *
294 vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
295                                     vnet_hw_interface_flags_t flags,
296                                     vnet_interface_helper_flags_t
297                                     helper_flags)
298 {
299   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
300   vnet_hw_interface_class_t *hw_class =
301     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
302   u32 mask;
303   clib_error_t *error = 0;
304   u32 is_create =
305     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
306
307   mask =
308     (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK |
309      VNET_HW_INTERFACE_FLAG_SPEED_MASK);
310   flags &= mask;
311
312   /* Call hardware interface add/del callbacks. */
313   if (is_create)
314     call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
315
316   /* Already in the desired state? */
317   if (!is_create && (hi->flags & mask) == flags)
318     goto done;
319
320   if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
321       (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
322     {
323       /* Do hardware class (e.g. ethernet). */
324       if (hw_class->link_up_down_function
325           && (error = hw_class->link_up_down_function (vnm, hw_if_index,
326                                                        flags)))
327         goto done;
328
329       error = call_elf_section_interface_callbacks
330         (vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
331
332       if (error)
333         goto done;
334     }
335
336   hi->flags &= ~mask;
337   hi->flags |= flags;
338
339 done:
340   return error;
341 }
342
343 static clib_error_t *
344 vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
345                                     vnet_sw_interface_flags_t flags,
346                                     vnet_interface_helper_flags_t
347                                     helper_flags)
348 {
349   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
350   u32 mask;
351   clib_error_t *error = 0;
352   u32 is_create =
353     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
354   u32 old_flags;
355
356   mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
357   flags &= mask;
358
359   if (is_create)
360     {
361       error =
362         call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
363       if (error)
364         goto done;
365
366       if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
367         {
368           /* Notify everyone when the interface is created as admin up */
369           error = call_elf_section_interface_callbacks (vnm, sw_if_index,
370                                                         flags,
371                                                         vnm->
372                                                         sw_interface_admin_up_down_functions);
373           if (error)
374             goto done;
375         }
376     }
377   else
378     {
379       vnet_sw_interface_t *si_sup = si;
380
381       /* Check that super interface is in correct state. */
382       if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
383         {
384           si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);
385
386           /* Check to see if we're bringing down the soft interface and if it's parent is up */
387           if ((flags != (si_sup->flags & mask)) &&
388               (!((flags == 0)
389                  && ((si_sup->flags & mask) ==
390                      VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
391             {
392               error = clib_error_return (0, "super-interface %U must be %U",
393                                          format_vnet_sw_interface_name, vnm,
394                                          si_sup,
395                                          format_vnet_sw_interface_flags,
396                                          flags);
397               goto done;
398             }
399         }
400
401       /* Do not change state for slave link of bonded interfaces */
402       if (si->flags & VNET_SW_INTERFACE_FLAG_BOND_SLAVE)
403         {
404           error = clib_error_return
405             (0, "not allowed as %U belong to a BondEthernet interface",
406              format_vnet_sw_interface_name, vnm, si);
407           goto done;
408         }
409
410       /* Already in the desired state? */
411       if ((si->flags & mask) == flags)
412         goto done;
413
414       /* Sub-interfaces of hardware interfaces that do no redistribute,
415          do not redistribute themselves. */
416       if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
417         {
418           vnet_hw_interface_t *hi =
419             vnet_get_hw_interface (vnm, si_sup->hw_if_index);
420           vnet_device_class_t *dev_class =
421             vnet_get_device_class (vnm, hi->dev_class_index);
422           if (!dev_class->redistribute)
423             helper_flags &=
424               ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
425         }
426
427       /* set the flags now before invoking the registered clients
428        * so that the state they query is consistent with the state here notified */
429       old_flags = si->flags;
430       si->flags &= ~mask;
431       si->flags |= flags;
432       if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
433         error = call_elf_section_interface_callbacks
434           (vnm, sw_if_index, flags,
435            vnm->sw_interface_admin_up_down_functions);
436
437       if (error)
438         {
439           /* restore flags on error */
440           si->flags = old_flags;
441           goto done;
442         }
443
444       if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
445         {
446           vnet_hw_interface_t *hi =
447             vnet_get_hw_interface (vnm, si->hw_if_index);
448           vnet_hw_interface_class_t *hw_class =
449             vnet_get_hw_interface_class (vnm, hi->hw_class_index);
450           vnet_device_class_t *dev_class =
451             vnet_get_device_class (vnm, hi->dev_class_index);
452
453           if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
454               (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
455             {
456               error = clib_error_return (0, "Interface in the error state");
457               goto done;
458             }
459
460           /* save the si admin up flag */
461           old_flags = si->flags;
462
463           /* update si admin up flag in advance if we are going admin down */
464           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
465             si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;
466
467           if (dev_class->admin_up_down_function
468               && (error = dev_class->admin_up_down_function (vnm,
469                                                              si->hw_if_index,
470                                                              flags)))
471             {
472               /* restore si admin up flag to it's original state on errors */
473               si->flags = old_flags;
474               goto done;
475             }
476
477           if (hw_class->admin_up_down_function
478               && (error = hw_class->admin_up_down_function (vnm,
479                                                             si->hw_if_index,
480                                                             flags)))
481             {
482               /* restore si admin up flag to it's original state on errors */
483               si->flags = old_flags;
484               goto done;
485             }
486
487           /* Admin down implies link down. */
488           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
489               && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
490             vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
491                                                 hi->flags &
492                                                 ~VNET_HW_INTERFACE_FLAG_LINK_UP,
493                                                 helper_flags);
494         }
495     }
496
497   si->flags &= ~mask;
498   si->flags |= flags;
499
500 done:
501   return error;
502 }
503
504 clib_error_t *
505 vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index,
506                              vnet_hw_interface_flags_t flags)
507 {
508   return vnet_hw_interface_set_flags_helper
509     (vnm, hw_if_index, flags,
510      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
511 }
512
513 clib_error_t *
514 vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index,
515                              vnet_sw_interface_flags_t flags)
516 {
517   return vnet_sw_interface_set_flags_helper
518     (vnm, sw_if_index, flags,
519      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
520 }
521
522 static u32
523 vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
524                                        vnet_sw_interface_t * template)
525 {
526   vnet_interface_main_t *im = &vnm->interface_main;
527   vnet_sw_interface_t *sw;
528   u32 sw_if_index;
529
530   pool_get (im->sw_interfaces, sw);
531   sw_if_index = sw - im->sw_interfaces;
532
533   sw[0] = template[0];
534
535   sw->flags = 0;
536   sw->sw_if_index = sw_if_index;
537   if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
538     sw->sup_sw_if_index = sw->sw_if_index;
539
540   /* Allocate counters for this interface. */
541   {
542     u32 i;
543
544     vnet_interface_counter_lock (im);
545
546     for (i = 0; i < vec_len (im->sw_if_counters); i++)
547       {
548         vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
549         vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
550       }
551
552     for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
553       {
554         vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
555                                         sw_if_index);
556         vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
557                                     sw_if_index);
558       }
559
560     vnet_interface_counter_unlock (im);
561   }
562
563   return sw_if_index;
564 }
565
566 clib_error_t *
567 vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
568                           u32 * sw_if_index)
569 {
570   clib_error_t *error;
571   vnet_hw_interface_t *hi;
572   vnet_device_class_t *dev_class;
573
574   hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
575   dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
576
577   if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
578       dev_class->subif_add_del_function)
579     {
580       error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
581                                                  (struct vnet_sw_interface_t
582                                                   *) template, 1);
583       if (error)
584         return error;
585     }
586
587   *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
588   error = vnet_sw_interface_set_flags_helper
589     (vnm, *sw_if_index, template->flags,
590      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
591
592   if (error)
593     {
594       /* undo the work done by vnet_create_sw_interface_no_callbacks() */
595       vnet_interface_main_t *im = &vnm->interface_main;
596       vnet_sw_interface_t *sw =
597         pool_elt_at_index (im->sw_interfaces, *sw_if_index);
598       pool_put (im->sw_interfaces, sw);
599     }
600
601   return error;
602 }
603
604 void
605 vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
606 {
607   vnet_interface_main_t *im = &vnm->interface_main;
608   vnet_sw_interface_t *sw =
609     pool_elt_at_index (im->sw_interfaces, sw_if_index);
610
611   /* Check if the interface has config and is removed from L2 BD or XConnect */
612   vlib_main_t *vm = vlib_get_main ();
613   l2_input_config_t *config;
614   if (sw_if_index < vec_len (l2input_main.configs))
615     {
616       config = vec_elt_at_index (l2input_main.configs, sw_if_index);
617       if (config->xconnect)
618         set_int_l2_mode (vm, vnm, MODE_L3, config->output_sw_if_index, 0,
619                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
620       if (config->xconnect || config->bridge)
621         set_int_l2_mode (vm, vnm, MODE_L3, sw_if_index, 0,
622                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
623     }
624   vnet_clear_sw_interface_tag (vnm, sw_if_index);
625
626   /* Bring down interface in case it is up. */
627   if (sw->flags != 0)
628     vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
629
630   call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
631
632   pool_put (im->sw_interfaces, sw);
633 }
634
635 static clib_error_t *
636 call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
637 {
638   return call_elf_section_interface_callbacks
639     (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
640 }
641
642 void
643 vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
644 {
645   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
646
647   if (si->mtu[VNET_MTU_L3] != mtu)
648     {
649       si->mtu[VNET_MTU_L3] = mtu;
650       call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
651     }
652 }
653
654 void
655 vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
656                                     u32 mtu[])
657 {
658   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
659   bool changed = false;
660   int i;
661
662   for (i = 0; i < VNET_N_MTU; i++)
663     {
664       if (si->mtu[i] != mtu[i])
665         {
666           si->mtu[i] = mtu[i];
667           changed = true;
668         }
669     }
670   /* Notify interested parties */
671   if (changed)
672     call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
673 }
674
675 void
676 vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
677                                          u32 sw_if_index, u8 enable)
678 {
679   vnet_sw_interface_t *si;
680
681   si = vnet_get_sw_interface (vnm, sw_if_index);
682
683   if (enable)
684     si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
685   else
686     si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
687
688   ip4_directed_broadcast (sw_if_index, enable);
689 }
690
691 /*
692  * Reflect a change in hardware MTU on protocol MTUs
693  */
694 static walk_rc_t
695 sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
696 {
697   u32 *link_mtu = ctx;
698   vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
699   return WALK_CONTINUE;
700 }
701
702 void
703 vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
704 {
705   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
706
707   if (hi->max_packet_bytes != mtu)
708     {
709       hi->max_packet_bytes = mtu;
710       ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
711       vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
712                                  &mtu);
713     }
714 }
715
716 static void
717 setup_tx_node (vlib_main_t * vm,
718                u32 node_index, vnet_device_class_t * dev_class)
719 {
720   vlib_node_t *n = vlib_get_node (vm, node_index);
721
722   n->function = dev_class->tx_function;
723   n->format_trace = dev_class->format_tx_trace;
724
725   vlib_register_errors (vm, node_index,
726                         dev_class->tx_function_n_errors,
727                         dev_class->tx_function_error_strings);
728 }
729
730 static void
731 setup_output_node (vlib_main_t * vm,
732                    u32 node_index, vnet_hw_interface_class_t * hw_class)
733 {
734   vlib_node_t *n = vlib_get_node (vm, node_index);
735   n->format_buffer = hw_class->format_header;
736   n->unformat_buffer = hw_class->unformat_header;
737 }
738
739 /* Register an interface instance. */
740 u32
741 vnet_register_interface (vnet_main_t * vnm,
742                          u32 dev_class_index,
743                          u32 dev_instance,
744                          u32 hw_class_index, u32 hw_instance)
745 {
746   vnet_interface_main_t *im = &vnm->interface_main;
747   vnet_hw_interface_t *hw;
748   vnet_device_class_t *dev_class =
749     vnet_get_device_class (vnm, dev_class_index);
750   vnet_hw_interface_class_t *hw_class =
751     vnet_get_hw_interface_class (vnm, hw_class_index);
752   vlib_main_t *vm = vnm->vlib_main;
753   vnet_feature_config_main_t *fcm;
754   vnet_config_main_t *cm;
755   u32 hw_index, i;
756   char *tx_node_name = NULL, *output_node_name = NULL;
757
758   pool_get (im->hw_interfaces, hw);
759   clib_memset (hw, 0, sizeof (*hw));
760
761   hw_index = hw - im->hw_interfaces;
762   hw->hw_if_index = hw_index;
763   hw->default_rx_mode = VNET_HW_INTERFACE_RX_MODE_POLLING;
764
765   if (dev_class->format_device_name)
766     hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
767   else if (hw_class->format_interface_name)
768     hw->name = format (0, "%U", hw_class->format_interface_name,
769                        dev_instance);
770   else
771     hw->name = format (0, "%s%x", hw_class->name, dev_instance);
772
773   if (!im->hw_interface_by_name)
774     im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
775                                                 sizeof (hw->name[0]),
776                                                 sizeof (uword));
777
778   hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);
779
780   /* Make hardware interface point to software interface. */
781   {
782     vnet_sw_interface_t sw = {
783       .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
784       .flood_class = VNET_FLOOD_CLASS_NORMAL,
785       .hw_if_index = hw_index
786     };
787     hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
788   }
789
790   hw->dev_class_index = dev_class_index;
791   hw->dev_instance = dev_instance;
792   hw->hw_class_index = hw_class_index;
793   hw->hw_instance = hw_instance;
794
795   hw->max_rate_bits_per_sec = 0;
796   hw->min_packet_bytes = 0;
797   vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);
798
799   if (dev_class->tx_function == 0)
800     goto no_output_nodes;       /* No output/tx nodes to create */
801
802   tx_node_name = (char *) format (0, "%v-tx", hw->name);
803   output_node_name = (char *) format (0, "%v-output", hw->name);
804
805   /* If we have previously deleted interface nodes, re-use them. */
806   if (vec_len (im->deleted_hw_interface_nodes) > 0)
807     {
808       vnet_hw_interface_nodes_t *hn;
809       vlib_node_t *node;
810       vlib_node_runtime_t *nrt;
811
812       hn = vec_end (im->deleted_hw_interface_nodes) - 1;
813
814       hw->tx_node_index = hn->tx_node_index;
815       hw->output_node_index = hn->output_node_index;
816
817       vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
818       vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);
819
820       /* *INDENT-OFF* */
821       foreach_vlib_main ({
822         vnet_interface_output_runtime_t *rt;
823
824         rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
825         ASSERT (rt->is_deleted == 1);
826         rt->is_deleted = 0;
827         rt->hw_if_index = hw_index;
828         rt->sw_if_index = hw->sw_if_index;
829         rt->dev_instance = hw->dev_instance;
830
831         rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
832         rt->hw_if_index = hw_index;
833         rt->sw_if_index = hw->sw_if_index;
834         rt->dev_instance = hw->dev_instance;
835       });
836       /* *INDENT-ON* */
837
838       /* The new class may differ from the old one.
839        * Functions have to be updated. */
840       node = vlib_get_node (vm, hw->output_node_index);
841       node->function = vnet_interface_output_node_multiarch_select ();
842       node->format_trace = format_vnet_interface_output_trace;
843       /* *INDENT-OFF* */
844       foreach_vlib_main ({
845         nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
846         nrt->function = node->function;
847       });
848       /* *INDENT-ON* */
849
850       node = vlib_get_node (vm, hw->tx_node_index);
851       node->function = dev_class->tx_function;
852       node->format_trace = dev_class->format_tx_trace;
853       /* *INDENT-OFF* */
854       foreach_vlib_main ({
855         nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
856         nrt->function = node->function;
857       });
858       /* *INDENT-ON* */
859
860       _vec_len (im->deleted_hw_interface_nodes) -= 1;
861     }
862   else
863     {
864       vlib_node_registration_t r;
865       vnet_interface_output_runtime_t rt = {
866         .hw_if_index = hw_index,
867         .sw_if_index = hw->sw_if_index,
868         .dev_instance = hw->dev_instance,
869         .is_deleted = 0,
870       };
871
872       clib_memset (&r, 0, sizeof (r));
873       r.type = VLIB_NODE_TYPE_INTERNAL;
874       r.runtime_data = &rt;
875       r.runtime_data_bytes = sizeof (rt);
876       r.scalar_size = 0;
877       r.vector_size = sizeof (u32);
878
879       r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
880       r.name = tx_node_name;
881       r.function = dev_class->tx_function;
882
883       hw->tx_node_index = vlib_register_node (vm, &r);
884
885       vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
886                                           "error-drop",
887                                           VNET_INTERFACE_TX_NEXT_DROP);
888
889       r.flags = 0;
890       r.name = output_node_name;
891       r.function = vnet_interface_output_node_multiarch_select ();
892       r.format_trace = format_vnet_interface_output_trace;
893
894       {
895         static char *e[] = {
896           "interface is down",
897           "interface is deleted",
898         };
899
900         r.n_errors = ARRAY_LEN (e);
901         r.error_strings = e;
902       }
903       hw->output_node_index = vlib_register_node (vm, &r);
904
905       vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
906                                           "error-drop",
907                                           VNET_INTERFACE_OUTPUT_NEXT_DROP);
908       vlib_node_add_next_with_slot (vm, hw->output_node_index,
909                                     hw->tx_node_index,
910                                     VNET_INTERFACE_OUTPUT_NEXT_TX);
911
912       /* add interface to the list of "output-interface" feature arc start nodes
913          and clone nexts from 1st interface if it exists */
914       fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
915       cm = &fcm->config_main;
916       i = vec_len (cm->start_node_indices);
917       vec_validate (cm->start_node_indices, i);
918       cm->start_node_indices[i] = hw->output_node_index;
919       if (hw_index)
920         {
921           /* copy nexts from 1st interface */
922           vnet_hw_interface_t *first_hw;
923           vlib_node_t *first_node;
924
925           first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
926           first_node = vlib_get_node (vm, first_hw->output_node_index);
927
928           /* 1st 2 nexts are already added above */
929           for (i = 2; i < vec_len (first_node->next_nodes); i++)
930             vlib_node_add_next_with_slot (vm, hw->output_node_index,
931                                           first_node->next_nodes[i], i);
932         }
933     }
934
935   setup_output_node (vm, hw->output_node_index, hw_class);
936   setup_tx_node (vm, hw->tx_node_index, dev_class);
937
938 no_output_nodes:
939   /* Call all up/down callbacks with zero flags when interface is created. */
940   vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
941                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
942   vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
943                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
944   vec_free (tx_node_name);
945   vec_free (output_node_name);
946
947   return hw_index;
948 }
949
950 void
951 vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
952 {
953   vnet_interface_main_t *im = &vnm->interface_main;
954   vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
955   vlib_main_t *vm = vnm->vlib_main;
956   vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
957                                                           hw->dev_class_index);
958   /* If it is up, mark it down. */
959   if (hw->flags != 0)
960     vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);
961
962   /* Call delete callbacks. */
963   call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);
964
965   /* Delete any sub-interfaces. */
966   {
967     u32 id, sw_if_index;
968     /* *INDENT-OFF* */
969     hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
970     ({
971       vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
972       u64 sup_and_sub_key =
973         ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
974       hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
975       vnet_delete_sw_interface (vnm, sw_if_index);
976     }));
977     hash_free (hw->sub_interface_sw_if_index_by_id);
978     /* *INDENT-ON* */
979   }
980
981   /* Delete software interface corresponding to hardware interface. */
982   vnet_delete_sw_interface (vnm, hw->sw_if_index);
983
984   if (dev_class->tx_function)
985     {
986       /* Put output/tx nodes into recycle pool */
987       vnet_hw_interface_nodes_t *dn;
988
989       /* *INDENT-OFF* */
990       foreach_vlib_main
991         ({
992           vnet_interface_output_runtime_t *rt =
993             vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
994
995           /* Mark node runtime as deleted so output node (if called)
996            * will drop packets. */
997           rt->is_deleted = 1;
998         });
999       /* *INDENT-ON* */
1000
1001       vlib_node_rename (vm, hw->output_node_index,
1002                         "interface-%d-output-deleted", hw_if_index);
1003       vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
1004                         hw_if_index);
1005       vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
1006       dn->tx_node_index = hw->tx_node_index;
1007       dn->output_node_index = hw->output_node_index;
1008     }
1009
1010   hash_unset_mem (im->hw_interface_by_name, hw->name);
1011   vec_free (hw->name);
1012   vec_free (hw->hw_address);
1013   vec_free (hw->input_node_thread_index_by_queue);
1014   vec_free (hw->dq_runtime_index_by_queue);
1015
1016   pool_put (im->hw_interfaces, hw);
1017 }
1018
1019 void
1020 vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1021                            u32 hw_if_index,
1022                            vnet_hw_sw_interface_walk_t fn, void *ctx)
1023 {
1024   vnet_hw_interface_t *hi;
1025   u32 id, sw_if_index;
1026
1027   hi = vnet_get_hw_interface (vnm, hw_if_index);
1028   /* the super first, then the sub interfaces */
1029   if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1030     return;
1031
1032   /* *INDENT-OFF* */
1033   hash_foreach (id, sw_if_index,
1034                 hi->sub_interface_sw_if_index_by_id,
1035   ({
1036     if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1037       break;
1038   }));
1039   /* *INDENT-ON* */
1040 }
1041
1042 void
1043 vnet_hw_interface_walk (vnet_main_t * vnm,
1044                         vnet_hw_interface_walk_t fn, void *ctx)
1045 {
1046   vnet_interface_main_t *im;
1047   vnet_hw_interface_t *hi;
1048
1049   im = &vnm->interface_main;
1050
1051   /* *INDENT-OFF* */
1052   pool_foreach (hi, im->hw_interfaces,
1053   ({
1054     if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1055       break;
1056   }));
1057   /* *INDENT-ON* */
1058 }
1059
1060 void
1061 vnet_sw_interface_walk (vnet_main_t * vnm,
1062                         vnet_sw_interface_walk_t fn, void *ctx)
1063 {
1064   vnet_interface_main_t *im;
1065   vnet_sw_interface_t *si;
1066
1067   im = &vnm->interface_main;
1068
1069   /* *INDENT-OFF* */
1070   pool_foreach (si, im->sw_interfaces,
1071   {
1072     if (WALK_STOP == fn (vnm, si, ctx))
1073       break;
1074   });
1075   /* *INDENT-ON* */
1076 }
1077
1078 void
1079 vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1080                                   u32 hw_class_index, u32 hw_instance)
1081 {
1082   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1083   vnet_hw_interface_class_t *hc =
1084     vnet_get_hw_interface_class (vnm, hw_class_index);
1085
1086   hi->hw_class_index = hw_class_index;
1087   hi->hw_instance = hw_instance;
1088   setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1089 }
1090
1091 static clib_error_t *
1092 vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1093                                     u32 hw_class_index, u32 redistribute)
1094 {
1095   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1096   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1097   vnet_hw_interface_class_t *old_class =
1098     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1099   vnet_hw_interface_class_t *new_class =
1100     vnet_get_hw_interface_class (vnm, hw_class_index);
1101   vnet_device_class_t *dev_class =
1102     vnet_get_device_class (vnm, hi->dev_class_index);
1103   clib_error_t *error = 0;
1104
1105   /* New class equals old class?  Nothing to do. */
1106   if (hi->hw_class_index == hw_class_index)
1107     return 0;
1108
1109   /* No need (and incorrect since admin up flag may be set) to do error checking when
1110      receiving unserialize message. */
1111   if (redistribute)
1112     {
1113       if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1114         return clib_error_return (0,
1115                                   "%v must be admin down to change class from %s to %s",
1116                                   hi->name, old_class->name, new_class->name);
1117
1118       /* Make sure interface supports given class. */
1119       if ((new_class->is_valid_class_for_interface
1120            && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1121                                                         hw_class_index))
1122           || (dev_class->is_valid_class_for_interface
1123               && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1124                                                            hw_class_index)))
1125         return clib_error_return (0,
1126                                   "%v class cannot be changed from %s to %s",
1127                                   hi->name, old_class->name, new_class->name);
1128
1129     }
1130
1131   if (old_class->hw_class_change)
1132     old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1133                                 new_class->index);
1134
1135   vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1136                                     /* instance */ ~0);
1137
1138   if (new_class->hw_class_change)
1139     new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1140                                 new_class->index);
1141
1142   if (dev_class->hw_class_change)
1143     dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1144
1145   return error;
1146 }
1147
1148 clib_error_t *
1149 vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1150                              u32 hw_class_index)
1151 {
1152   return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1153                                              /* redistribute */ 1);
1154 }
1155
1156 static int
1157 vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1158                                               u32 hw_if_index,
1159                                               u32 node_index,
1160                                               u32 redistribute)
1161 {
1162   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1163   vnet_device_class_t *dev_class = vnet_get_device_class
1164     (vnm, hi->dev_class_index);
1165
1166   if (dev_class->rx_redirect_to_node)
1167     {
1168       dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1169       return 0;
1170     }
1171
1172   return VNET_API_ERROR_UNIMPLEMENTED;
1173 }
1174
1175 int
1176 vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1177                                        u32 node_index)
1178 {
1179   return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1180                                                        node_index,
1181                                                        1 /* redistribute */ );
1182 }
1183
1184 word
1185 vnet_sw_interface_compare (vnet_main_t * vnm,
1186                            uword sw_if_index0, uword sw_if_index1)
1187 {
1188   vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1189   vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1190   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1191   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1192
1193   if (h0 != h1)
1194     return vec_cmp (h0->name, h1->name);
1195   return (word) h0->hw_instance - (word) h1->hw_instance;
1196 }
1197
1198 word
1199 vnet_hw_interface_compare (vnet_main_t * vnm,
1200                            uword hw_if_index0, uword hw_if_index1)
1201 {
1202   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1203   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1204
1205   if (h0 != h1)
1206     return vec_cmp (h0->name, h1->name);
1207   return (word) h0->hw_instance - (word) h1->hw_instance;
1208 }
1209
1210 int
1211 vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1212 {
1213   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1214   if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1215       (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1216     return 1;
1217
1218   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1219   vnet_hw_interface_class_t *hc =
1220     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1221
1222   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1223 }
1224
/*
 * One-time initialisation of the vnet interface layer.
 *
 * Checks that the vnet buffer opaque matches the size of the vlib buffer
 * opaque, allocates the counter lock, names the simple and combined
 * per-interface counters, builds the device-class and hw-interface-class
 * tables from their registration lists, then runs the interface CLI init
 * (and, when enabled at compile time, trajectory trace init).
 *
 * Returns 0 on success or the first error encountered.
 */
clib_error_t *
vnet_interface_init (vlib_main_t * vm)
{
  vnet_main_t *vnm = vnet_get_main ();
  vnet_interface_main_t *im = &vnm->interface_main;
  /* b and o are never dereferenced; they only feed sizeof expressions. */
  vlib_buffer_t *b = 0;
  vnet_buffer_opaque_t *o = 0;
  clib_error_t *error;

  /*
   * Keep people from shooting themselves in the foot.
   * On a size mismatch, warn about every opaque union subtype that is
   * larger than the 'unused' member, then fail initialisation.
   */
  if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
    {
#define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
      clib_warning                                                      \
        ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
         #a, sizeof(o->a), sizeof (o->unused));
      foreach_buffer_opaque_union_subtype;
#undef _

      return clib_error_return
        (0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
         sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
    }

  /* The lock word gets a cache line of its own; it is held (1) while the
     counter vectors are set up and released (0) afterwards. */
  im->sw_if_counter_lock = clib_mem_alloc_aligned (CLIB_CACHE_LINE_BYTES,
                                                   CLIB_CACHE_LINE_BYTES);
  im->sw_if_counter_lock[0] = 1;        /* should be no need */

  /* Name each simple counter and derive its stat segment path "/p/n". */
  vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
#define _(E,n,p)                                                        \
  im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;             \
  im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
  foreach_simple_interface_counter_name
#undef _
    /* Same again for the combined counters. */
    vec_validate (im->combined_sw_if_counters,
                  VNET_N_COMBINED_INTERFACE_COUNTER - 1);
#define _(E,n,p)                                                        \
  im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;    \
  im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
  foreach_combined_interface_counter_name
#undef _
    im->sw_if_counter_lock[0] = 0;

  im->device_class_by_name = hash_create_string ( /* size */ 0,
                                                 sizeof (uword));
  /* Walk the device class registration list: assign each class its index,
     make it findable by name and copy it into im->device_classes. */
  {
    vnet_device_class_t *c;

    c = vnm->device_class_registrations;

    while (c)
      {
        c->index = vec_len (im->device_classes);
        hash_set_mem (im->device_class_by_name, c->name, c->index);

        /* With tx function candidates registered, the one with the
           highest priority becomes the class tx function. */
        if (c->tx_fn_registrations)
          {
            vlib_node_fn_registration_t *fnr = c->tx_fn_registrations;
            int priority = -1;

            /* to avoid confusion, please remove ".tx_function" statement
               from VNET_DEVICE_CLASS() if using function candidates */
            ASSERT (c->tx_function == 0);

            while (fnr)
              {
                if (fnr->priority > priority)
                  {
                    priority = fnr->priority;
                    c->tx_function = fnr->function;
                  }
                fnr = fnr->next_registration;
              }
          }

        vec_add1 (im->device_classes, c[0]);
        c = c->next_class_registration;
      }
  }

  im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
                                                       sizeof (uword));

  /* Keyed by a u64; see users of sw_if_index_by_sup_and_sub for the
     key layout. */
  im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
                                                    sizeof (uword));
  /* Walk the hw interface class registration list the same way, filling
     in default rewrite/adjacency handlers where a class supplies none. */
  {
    vnet_hw_interface_class_t *c;

    c = vnm->hw_interface_class_registrations;

    while (c)
      {
        c->index = vec_len (im->hw_interface_classes);
        hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);

        if (NULL == c->build_rewrite)
          c->build_rewrite = default_build_rewrite;
        if (NULL == c->update_adjacency)
          c->update_adjacency = default_update_adjacency;

        vec_add1 (im->hw_interface_classes, c[0]);
        c = c->next_class_registration;
      }
  }

  if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
    return error;

  vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));

#if VLIB_BUFFER_TRACE_TRAJECTORY > 0
  if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
    return error;
#endif

  return 0;
}

/* Register vnet_interface_init as a vlib init function. */
VLIB_INIT_FUNCTION (vnet_interface_init);
1346
1347 /* Kludge to renumber interface names [only!] */
1348 int
1349 vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1350 {
1351   int rv;
1352   vnet_main_t *vnm = vnet_get_main ();
1353   vnet_interface_main_t *im = &vnm->interface_main;
1354   vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1355
1356   vnet_device_class_t *dev_class = vnet_get_device_class
1357     (vnm, hi->dev_class_index);
1358
1359   if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1360     return VNET_API_ERROR_UNIMPLEMENTED;
1361
1362   rv = dev_class->name_renumber (hi, new_show_dev_instance);
1363
1364   if (rv)
1365     return rv;
1366
1367   hash_unset_mem (im->hw_interface_by_name, hi->name);
1368   vec_free (hi->name);
1369   /* Use the mapping we set up to call it Ishmael */
1370   hi->name = format (0, "%U", dev_class->format_device_name,
1371                      hi->dev_instance);
1372
1373   hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1374   return rv;
1375 }
1376
1377 clib_error_t *
1378 vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1379 {
1380   vnet_interface_main_t *im = &vnm->interface_main;
1381   vlib_main_t *vm = vnm->vlib_main;
1382   vnet_hw_interface_t *hw;
1383   u8 *old_name;
1384   clib_error_t *error = 0;
1385
1386   hw = vnet_get_hw_interface (vnm, hw_if_index);
1387   if (!hw)
1388     {
1389       return clib_error_return (0,
1390                                 "unable to find hw interface for index %u",
1391                                 hw_if_index);
1392     }
1393
1394   old_name = hw->name;
1395
1396   /* set new hw->name */
1397   hw->name = format (0, "%s", new_name);
1398
1399   /* remove the old name to hw_if_index mapping and install the new one */
1400   hash_unset_mem (im->hw_interface_by_name, old_name);
1401   hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1402
1403   /* rename tx/output nodes */
1404   vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1405   vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1406
1407   /* free the old name vector */
1408   vec_free (old_name);
1409
1410   return error;
1411 }
1412
1413 static clib_error_t *
1414 vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1415                                              u32 hw_if_index,
1416                                              const u8 * mac_address)
1417 {
1418   clib_error_t *error = 0;
1419   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1420
1421   if (hi->hw_address)
1422     {
1423       u8 *old_address = vec_dup (hi->hw_address);
1424       vnet_device_class_t *dev_class =
1425         vnet_get_device_class (vnm, hi->dev_class_index);
1426       if (dev_class->mac_addr_change_function)
1427         {
1428           error =
1429             dev_class->mac_addr_change_function (hi, old_address,
1430                                                  mac_address);
1431         }
1432       if (!error)
1433         {
1434           vnet_hw_interface_class_t *hw_class;
1435
1436           hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1437
1438           if (NULL != hw_class->mac_addr_change_function)
1439             hw_class->mac_addr_change_function (hi, old_address, mac_address);
1440         }
1441       else
1442         {
1443           error =
1444             clib_error_return (0,
1445                                "MAC Address Change is not supported on this interface");
1446         }
1447       vec_free (old_address);
1448     }
1449   else
1450     {
1451       error =
1452         clib_error_return (0,
1453                            "mac address change is not supported for interface index %u",
1454                            hw_if_index);
1455     }
1456   return error;
1457 }
1458
1459 clib_error_t *
1460 vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1461                                       const u8 * mac_address)
1462 {
1463   return vnet_hw_interface_change_mac_address_helper
1464     (vnm, hw_if_index, mac_address);
1465 }
1466
1467 /* update the unnumbered state of an interface*/
1468 void
1469 vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1470                                      u32 ip_sw_if_index, u8 enable)
1471 {
1472   vnet_main_t *vnm = vnet_get_main ();
1473   vnet_sw_interface_t *si;
1474   u32 was_unnum;
1475
1476   si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1477   was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1478
1479   if (enable)
1480     {
1481       si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1482       si->unnumbered_sw_if_index = ip_sw_if_index;
1483
1484       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1485         [unnumbered_sw_if_index] =
1486         ip4_main.
1487         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1488       ip6_main.
1489         lookup_main.if_address_pool_index_by_sw_if_index
1490         [unnumbered_sw_if_index] =
1491         ip6_main.
1492         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1493     }
1494   else
1495     {
1496       si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1497       si->unnumbered_sw_if_index = (u32) ~ 0;
1498
1499       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1500         [unnumbered_sw_if_index] = ~0;
1501       ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1502         [unnumbered_sw_if_index] = ~0;
1503     }
1504
1505   if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1506     {
1507       ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1508       ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1509     }
1510 }
1511
1512 vnet_l3_packet_type_t
1513 vnet_link_to_l3_proto (vnet_link_t link)
1514 {
1515   switch (link)
1516     {
1517     case VNET_LINK_IP4:
1518       return (VNET_L3_PACKET_TYPE_IP4);
1519     case VNET_LINK_IP6:
1520       return (VNET_L3_PACKET_TYPE_IP6);
1521     case VNET_LINK_MPLS:
1522       return (VNET_L3_PACKET_TYPE_MPLS);
1523     case VNET_LINK_ARP:
1524       return (VNET_L3_PACKET_TYPE_ARP);
1525     case VNET_LINK_ETHERNET:
1526     case VNET_LINK_NSH:
1527       ASSERT (0);
1528       break;
1529     }
1530   ASSERT (0);
1531   return (0);
1532 }
1533
1534 vnet_mtu_t
1535 vnet_link_to_mtu (vnet_link_t link)
1536 {
1537   switch (link)
1538     {
1539     case VNET_LINK_IP4:
1540       return (VNET_MTU_IP4);
1541     case VNET_LINK_IP6:
1542       return (VNET_MTU_IP6);
1543     case VNET_LINK_MPLS:
1544       return (VNET_MTU_MPLS);
1545     default:
1546       return (VNET_MTU_L3);
1547     }
1548 }
1549
1550 u8 *
1551 default_build_rewrite (vnet_main_t * vnm,
1552                        u32 sw_if_index,
1553                        vnet_link_t link_type, const void *dst_address)
1554 {
1555   return (NULL);
1556 }
1557
1558 void
1559 default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1560 {
1561   ip_adjacency_t *adj;
1562
1563   adj = adj_get (ai);
1564
1565   switch (adj->lookup_next_index)
1566     {
1567     case IP_LOOKUP_NEXT_GLEAN:
1568       adj_glean_update_rewrite (ai);
1569       break;
1570     case IP_LOOKUP_NEXT_ARP:
1571     case IP_LOOKUP_NEXT_BCAST:
1572       /*
1573        * default rewrite in neighbour adj
1574        */
1575       adj_nbr_update_rewrite
1576         (ai,
1577          ADJ_NBR_REWRITE_FLAG_COMPLETE,
1578          vnet_build_rewrite_for_sw_interface (vnm,
1579                                               sw_if_index,
1580                                               adj_get_link_type (ai), NULL));
1581       break;
1582     case IP_LOOKUP_NEXT_MCAST:
1583       /*
1584        * mcast traffic also uses default rewrite string with no mcast
1585        * switch time updates.
1586        */
1587       adj_mcast_update_rewrite
1588         (ai,
1589          vnet_build_rewrite_for_sw_interface (vnm,
1590                                               sw_if_index,
1591                                               adj_get_link_type (ai),
1592                                               NULL), 0);
1593       break;
1594     case IP_LOOKUP_NEXT_DROP:
1595     case IP_LOOKUP_NEXT_PUNT:
1596     case IP_LOOKUP_NEXT_LOCAL:
1597     case IP_LOOKUP_NEXT_REWRITE:
1598     case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1599     case IP_LOOKUP_NEXT_MIDCHAIN:
1600     case IP_LOOKUP_NEXT_ICMP_ERROR:
1601     case IP_LOOKUP_N_NEXT:
1602       ASSERT (0);
1603       break;
1604     }
1605 }
1606
/* Global on/off switch for detailed interface stats collection:
 * 1 after ..._flag_set (), 0 after ..._flag_clear (); starts at 0. */
int collect_detailed_interface_stats_flag = 0;

/* Store the requested switch state. */
static void
collect_detailed_interface_stats_flag_store (int state)
{
  collect_detailed_interface_stats_flag = state;
}

/* Turn detailed interface stats collection on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_store (1);
}

/* Turn detailed interface stats collection off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_store (0);
}
1620
1621 static clib_error_t *
1622 collect_detailed_interface_stats_cli (vlib_main_t * vm,
1623                                       unformat_input_t * input,
1624                                       vlib_cli_command_t * cmd)
1625 {
1626   unformat_input_t _line_input, *line_input = &_line_input;
1627   clib_error_t *error = NULL;
1628
1629   /* Get a line of input. */
1630   if (!unformat_user (input, unformat_line_input, line_input))
1631     return clib_error_return (0, "expected enable | disable");
1632
1633   while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1634     {
1635       if (unformat (line_input, "enable") || unformat (line_input, "on"))
1636         collect_detailed_interface_stats_flag_set ();
1637       else if (unformat (line_input, "disable")
1638                || unformat (line_input, "off"))
1639         collect_detailed_interface_stats_flag_clear ();
1640       else
1641         {
1642           error = clib_error_return (0, "unknown input `%U'",
1643                                      format_unformat_error, line_input);
1644           goto done;
1645         }
1646     }
1647
1648 done:
1649   unformat_free (line_input);
1650   return error;
1651 }
1652
/* CLI registration: binds the "interface collect detailed-stats" command
 * path to collect_detailed_interface_stats_cli. */
/* *INDENT-OFF* */
VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
  .path = "interface collect detailed-stats",
  .short_help = "interface collect detailed-stats <enable|disable>",
  .function = collect_detailed_interface_stats_cli,
};
/* *INDENT-ON* */
1660
1661 /*
1662  * fd.io coding-style-patch-verification: ON
1663  *
1664  * Local Variables:
1665  * eval: (c-set-style "gnu")
1666  * End:
1667  */