L2 BD: introduce a BD interface on which to send UU packets
[vpp.git] / src / vnet / interface.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.c: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #include <vnet/vnet.h>
41 #include <vnet/plugin/plugin.h>
42 #include <vnet/fib/ip6_fib.h>
43 #include <vnet/adj/adj.h>
44 #include <vnet/adj/adj_mcast.h>
45 #include <vnet/l2/l2_input.h>
46
47 #define VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE (1 << 0)
48 #define VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE (1 << 1)
49
50 static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
51                                                          u32 hw_if_index,
52                                                          u32 flags,
53                                                          u32 helper_flags);
54
55 static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
56                                                          u32 sw_if_index,
57                                                          u32 flags,
58                                                          u32 helper_flags);
59
60 static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
61                                                          u32 hw_if_index,
62                                                          u32 hw_class_index,
63                                                          u32 redistribute);
64
65 typedef struct
66 {
67   /* Either sw or hw interface index. */
68   u32 sw_hw_if_index;
69
70   /* Flags. */
71   u32 flags;
72 } vnet_sw_hw_interface_state_t;
73
74 static void
75 serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
76 {
77   vnet_sw_hw_interface_state_t *s =
78     va_arg (*va, vnet_sw_hw_interface_state_t *);
79   u32 n = va_arg (*va, u32);
80   u32 i;
81   for (i = 0; i < n; i++)
82     {
83       serialize_integer (m, s[i].sw_hw_if_index,
84                          sizeof (s[i].sw_hw_if_index));
85       serialize_integer (m, s[i].flags, sizeof (s[i].flags));
86     }
87 }
88
89 static void
90 unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
91                                             va_list * va)
92 {
93   vnet_sw_hw_interface_state_t *s =
94     va_arg (*va, vnet_sw_hw_interface_state_t *);
95   u32 n = va_arg (*va, u32);
96   u32 i;
97   for (i = 0; i < n; i++)
98     {
99       unserialize_integer (m, &s[i].sw_hw_if_index,
100                            sizeof (s[i].sw_hw_if_index));
101       unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
102     }
103 }
104
105 static void
106 serialize_vnet_sw_hw_interface_set_flags (serialize_main_t * m, va_list * va)
107 {
108   vnet_sw_hw_interface_state_t *s =
109     va_arg (*va, vnet_sw_hw_interface_state_t *);
110   serialize (m, serialize_vec_vnet_sw_hw_interface_state, s, 1);
111 }
112
113 static void
114 unserialize_vnet_sw_interface_set_flags (serialize_main_t * m, va_list * va)
115 {
116   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
117   vnet_sw_hw_interface_state_t s;
118
119   unserialize (m, unserialize_vec_vnet_sw_hw_interface_state, &s, 1);
120
121   vnet_sw_interface_set_flags_helper
122     (vnet_get_main (), s.sw_hw_if_index, s.flags,
123      /* helper_flags no redistribution */ 0);
124 }
125
126 static void
127 unserialize_vnet_hw_interface_set_flags (serialize_main_t * m, va_list * va)
128 {
129   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
130   vnet_sw_hw_interface_state_t s;
131
132   unserialize (m, unserialize_vec_vnet_sw_hw_interface_state, &s, 1);
133
134   vnet_hw_interface_set_flags_helper
135     (vnet_get_main (), s.sw_hw_if_index, s.flags,
136      /* helper_flags no redistribution */ 0);
137 }
138
139 MC_SERIALIZE_MSG (vnet_sw_interface_set_flags_msg, static) =
140 {
141 .name = "vnet_sw_interface_set_flags",.serialize =
142     serialize_vnet_sw_hw_interface_set_flags,.unserialize =
143     unserialize_vnet_sw_interface_set_flags,};
144
145 MC_SERIALIZE_MSG (vnet_hw_interface_set_flags_msg, static) =
146 {
147 .name = "vnet_hw_interface_set_flags",.serialize =
148     serialize_vnet_sw_hw_interface_set_flags,.unserialize =
149     unserialize_vnet_hw_interface_set_flags,};
150
151 void
152 serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
153 {
154   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
155   vnet_sw_hw_interface_state_t *sts = 0, *st;
156   vnet_sw_interface_t *sif;
157   vnet_hw_interface_t *hif;
158   vnet_interface_main_t *im = &vnm->interface_main;
159
160   /* Serialize hardware interface classes since they may have changed.
161      Must do this before sending up/down flags. */
162   /* *INDENT-OFF* */
163   pool_foreach (hif, im->hw_interfaces, ({
164     vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
165     serialize_cstring (m, hw_class->name);
166   }));
167   /* *INDENT-ON* */
168
169   /* Send sw/hw interface state when non-zero. */
170   /* *INDENT-OFF* */
171   pool_foreach (sif, im->sw_interfaces, ({
172     if (sif->flags != 0)
173       {
174         vec_add2 (sts, st, 1);
175         st->sw_hw_if_index = sif->sw_if_index;
176         st->flags = sif->flags;
177       }
178   }));
179   /* *INDENT-ON* */
180
181   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
182
183   if (sts)
184     _vec_len (sts) = 0;
185
186   /* *INDENT-OFF* */
187   pool_foreach (hif, im->hw_interfaces, ({
188     if (hif->flags != 0)
189       {
190         vec_add2 (sts, st, 1);
191         st->sw_hw_if_index = hif->hw_if_index;
192         st->flags = hif->flags;
193       }
194   }));
195   /* *INDENT-ON* */
196
197   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
198
199   vec_free (sts);
200 }
201
202 void
203 unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
204 {
205   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
206   vnet_sw_hw_interface_state_t *sts = 0, *st;
207
208   /* First set interface hardware class. */
209   {
210     vnet_interface_main_t *im = &vnm->interface_main;
211     vnet_hw_interface_t *hif;
212     char *class_name;
213     uword *p;
214     clib_error_t *error;
215
216     /* *INDENT-OFF* */
217     pool_foreach (hif, im->hw_interfaces, ({
218       unserialize_cstring (m, &class_name);
219       p = hash_get_mem (im->hw_interface_class_by_name, class_name);
220       ASSERT (p != 0);
221       error = vnet_hw_interface_set_class_helper (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
222       if (error)
223         clib_error_report (error);
224       vec_free (class_name);
225     }));
226     /* *INDENT-ON* */
227   }
228
229   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
230   vec_foreach (st, sts)
231     vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
232                                         /* no distribute */ 0);
233   vec_free (sts);
234
235   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
236   vec_foreach (st, sts)
237     vnet_hw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
238                                         /* no distribute */ 0);
239   vec_free (sts);
240 }
241
242 static clib_error_t *
243 call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
244                                       u32 flags,
245                                       _vnet_interface_function_list_elt_t **
246                                       elts)
247 {
248   _vnet_interface_function_list_elt_t *elt;
249   vnet_interface_function_priority_t prio;
250   clib_error_t *error = 0;
251
252   for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
253        prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
254     {
255       elt = elts[prio];
256
257       while (elt)
258         {
259           error = elt->fp (vnm, if_index, flags);
260           if (error)
261             return error;
262           elt = elt->next_interface_function;
263         }
264     }
265   return error;
266 }
267
268 static clib_error_t *
269 call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
270                                      u32 is_create)
271 {
272   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
273   vnet_hw_interface_class_t *hw_class =
274     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
275   vnet_device_class_t *dev_class =
276     vnet_get_device_class (vnm, hi->dev_class_index);
277   clib_error_t *error = 0;
278
279   if (hw_class->interface_add_del_function
280       && (error =
281           hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
282     return error;
283
284   if (dev_class->interface_add_del_function
285       && (error =
286           dev_class->interface_add_del_function (vnm, hw_if_index,
287                                                  is_create)))
288     return error;
289
290   error = call_elf_section_interface_callbacks
291     (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
292
293   return error;
294 }
295
296 static clib_error_t *
297 call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
298                                      u32 is_create)
299 {
300   return call_elf_section_interface_callbacks
301     (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
302 }
303
304 #define VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE (1 << 0)
305 #define VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE (1 << 1)
306
307 static clib_error_t *
308 vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
309                                     u32 flags, u32 helper_flags)
310 {
311   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
312   vnet_hw_interface_class_t *hw_class =
313     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
314   vnet_device_class_t *dev_class =
315     vnet_get_device_class (vnm, hi->dev_class_index);
316   vlib_main_t *vm = vnm->vlib_main;
317   u32 mask;
318   clib_error_t *error = 0;
319   u32 is_create =
320     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
321
322   mask =
323     (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK |
324      VNET_HW_INTERFACE_FLAG_SPEED_MASK);
325   flags &= mask;
326
327   /* Call hardware interface add/del callbacks. */
328   if (is_create)
329     call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
330
331   /* Already in the desired state? */
332   if (!is_create && (hi->flags & mask) == flags)
333     goto done;
334
335   /* Some interface classes do not redistribute (e.g. are local). */
336   if (!dev_class->redistribute)
337     helper_flags &= ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
338
339   if (vm->mc_main
340       && (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE))
341     {
342       vnet_sw_hw_interface_state_t s;
343       s.sw_hw_if_index = hw_if_index;
344       s.flags = flags;
345       mc_serialize (vm->mc_main, &vnet_hw_interface_set_flags_msg, &s);
346     }
347
348   if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
349       (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
350     {
351       /* Do hardware class (e.g. ethernet). */
352       if (hw_class->link_up_down_function
353           && (error = hw_class->link_up_down_function (vnm, hw_if_index,
354                                                        flags)))
355         goto done;
356
357       error = call_elf_section_interface_callbacks
358         (vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
359
360       if (error)
361         goto done;
362     }
363
364   hi->flags &= ~mask;
365   hi->flags |= flags;
366
367 done:
368   return error;
369 }
370
371 static clib_error_t *
372 vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
373                                     u32 flags, u32 helper_flags)
374 {
375   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
376   vlib_main_t *vm = vnm->vlib_main;
377   u32 mask;
378   clib_error_t *error = 0;
379   u32 is_create =
380     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
381   u32 old_flags;
382
383   mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
384   flags &= mask;
385
386   if (is_create)
387     {
388       error =
389         call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
390       if (error)
391         goto done;
392
393       if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
394         {
395           /* Notify everyone when the interface is created as admin up */
396           error = call_elf_section_interface_callbacks (vnm, sw_if_index,
397                                                         flags,
398                                                         vnm->
399                                                         sw_interface_admin_up_down_functions);
400           if (error)
401             goto done;
402         }
403     }
404   else
405     {
406       vnet_sw_interface_t *si_sup = si;
407
408       /* Check that super interface is in correct state. */
409       if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
410         {
411           si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);
412
413           /* Check to see if we're bringing down the soft interface and if it's parent is up */
414           if ((flags != (si_sup->flags & mask)) &&
415               (!((flags == 0)
416                  && ((si_sup->flags & mask) ==
417                      VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
418             {
419               error = clib_error_return (0, "super-interface %U must be %U",
420                                          format_vnet_sw_interface_name, vnm,
421                                          si_sup,
422                                          format_vnet_sw_interface_flags,
423                                          flags);
424               goto done;
425             }
426         }
427
428       /* Do not change state for slave link of bonded interfaces */
429       if (si->flags & VNET_SW_INTERFACE_FLAG_BOND_SLAVE)
430         {
431           error = clib_error_return
432             (0, "not allowed as %U belong to a BondEthernet interface",
433              format_vnet_sw_interface_name, vnm, si);
434           goto done;
435         }
436
437       /* Already in the desired state? */
438       if ((si->flags & mask) == flags)
439         goto done;
440
441       /* Sub-interfaces of hardware interfaces that do no redistribute,
442          do not redistribute themselves. */
443       if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
444         {
445           vnet_hw_interface_t *hi =
446             vnet_get_hw_interface (vnm, si_sup->hw_if_index);
447           vnet_device_class_t *dev_class =
448             vnet_get_device_class (vnm, hi->dev_class_index);
449           if (!dev_class->redistribute)
450             helper_flags &=
451               ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
452         }
453
454       if (vm->mc_main
455           && (helper_flags &
456               VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE))
457         {
458           vnet_sw_hw_interface_state_t s;
459           s.sw_hw_if_index = sw_if_index;
460           s.flags = flags;
461           mc_serialize (vm->mc_main, &vnet_sw_interface_set_flags_msg, &s);
462         }
463
464       /* set the flags now before invoking the registered clients
465        * so that the state they query is consistent with the state here notified */
466       old_flags = si->flags;
467       si->flags &= ~mask;
468       si->flags |= flags;
469       if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
470         error = call_elf_section_interface_callbacks
471           (vnm, sw_if_index, flags,
472            vnm->sw_interface_admin_up_down_functions);
473
474       if (error)
475         {
476           /* restore flags on error */
477           si->flags = old_flags;
478           goto done;
479         }
480
481       if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
482         {
483           vnet_hw_interface_t *hi =
484             vnet_get_hw_interface (vnm, si->hw_if_index);
485           vnet_hw_interface_class_t *hw_class =
486             vnet_get_hw_interface_class (vnm, hi->hw_class_index);
487           vnet_device_class_t *dev_class =
488             vnet_get_device_class (vnm, hi->dev_class_index);
489
490           if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
491               (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
492             {
493               error = clib_error_return (0, "Interface in the error state");
494               goto done;
495             }
496
497           /* save the si admin up flag */
498           old_flags = si->flags;
499
500           /* update si admin up flag in advance if we are going admin down */
501           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
502             si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;
503
504           if (dev_class->admin_up_down_function
505               && (error = dev_class->admin_up_down_function (vnm,
506                                                              si->hw_if_index,
507                                                              flags)))
508             {
509               /* restore si admin up flag to it's original state on errors */
510               si->flags = old_flags;
511               goto done;
512             }
513
514           if (hw_class->admin_up_down_function
515               && (error = hw_class->admin_up_down_function (vnm,
516                                                             si->hw_if_index,
517                                                             flags)))
518             {
519               /* restore si admin up flag to it's original state on errors */
520               si->flags = old_flags;
521               goto done;
522             }
523
524           /* Admin down implies link down. */
525           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
526               && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
527             vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
528                                                 hi->flags &
529                                                 ~VNET_HW_INTERFACE_FLAG_LINK_UP,
530                                                 helper_flags);
531         }
532     }
533
534   si->flags &= ~mask;
535   si->flags |= flags;
536
537 done:
538   return error;
539 }
540
541 clib_error_t *
542 vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index, u32 flags)
543 {
544   return vnet_hw_interface_set_flags_helper
545     (vnm, hw_if_index, flags,
546      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
547 }
548
549 clib_error_t *
550 vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index, u32 flags)
551 {
552   return vnet_sw_interface_set_flags_helper
553     (vnm, sw_if_index, flags,
554      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
555 }
556
557 static u32
558 vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
559                                        vnet_sw_interface_t * template)
560 {
561   vnet_interface_main_t *im = &vnm->interface_main;
562   vnet_sw_interface_t *sw;
563   u32 sw_if_index;
564
565   pool_get (im->sw_interfaces, sw);
566   sw_if_index = sw - im->sw_interfaces;
567
568   sw[0] = template[0];
569
570   sw->flags = 0;
571   sw->sw_if_index = sw_if_index;
572   if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
573     sw->sup_sw_if_index = sw->sw_if_index;
574
575   /* Allocate counters for this interface. */
576   {
577     u32 i;
578
579     vnet_interface_counter_lock (im);
580
581     for (i = 0; i < vec_len (im->sw_if_counters); i++)
582       {
583         vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
584         vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
585       }
586
587     for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
588       {
589         vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
590                                         sw_if_index);
591         vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
592                                     sw_if_index);
593       }
594
595     vnet_interface_counter_unlock (im);
596   }
597
598   return sw_if_index;
599 }
600
601 clib_error_t *
602 vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
603                           u32 * sw_if_index)
604 {
605   clib_error_t *error;
606   vnet_hw_interface_t *hi;
607   vnet_device_class_t *dev_class;
608
609   hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
610   dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
611
612   if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
613       dev_class->subif_add_del_function)
614     {
615       error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
616                                                  (struct vnet_sw_interface_t
617                                                   *) template, 1);
618       if (error)
619         return error;
620     }
621
622   *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
623   error = vnet_sw_interface_set_flags_helper
624     (vnm, *sw_if_index, template->flags,
625      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
626
627   if (error)
628     {
629       /* undo the work done by vnet_create_sw_interface_no_callbacks() */
630       vnet_interface_main_t *im = &vnm->interface_main;
631       vnet_sw_interface_t *sw =
632         pool_elt_at_index (im->sw_interfaces, *sw_if_index);
633       pool_put (im->sw_interfaces, sw);
634     }
635
636   return error;
637 }
638
639 void
640 vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
641 {
642   vnet_interface_main_t *im = &vnm->interface_main;
643   vnet_sw_interface_t *sw =
644     pool_elt_at_index (im->sw_interfaces, sw_if_index);
645
646   /* Check if the interface has config and is removed from L2 BD or XConnect */
647   vlib_main_t *vm = vlib_get_main ();
648   l2_input_config_t *config;
649   if (sw_if_index < vec_len (l2input_main.configs))
650     {
651       config = vec_elt_at_index (l2input_main.configs, sw_if_index);
652       if (config->xconnect)
653         set_int_l2_mode (vm, vnm, MODE_L3, config->output_sw_if_index, 0,
654                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
655       if (config->xconnect || config->bridge)
656         set_int_l2_mode (vm, vnm, MODE_L3, sw_if_index, 0,
657                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
658     }
659   vnet_clear_sw_interface_tag (vnm, sw_if_index);
660
661   /* Bring down interface in case it is up. */
662   if (sw->flags != 0)
663     vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
664
665   call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
666
667   pool_put (im->sw_interfaces, sw);
668 }
669
670 static clib_error_t *
671 call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
672 {
673   return call_elf_section_interface_callbacks
674     (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
675 }
676
677 void
678 vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
679 {
680   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
681
682   if (si->mtu[VNET_MTU_L3] != mtu)
683     {
684       si->mtu[VNET_MTU_L3] = mtu;
685       call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
686     }
687 }
688
689 void
690 vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
691                                     u32 mtu[])
692 {
693   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
694   bool changed = false;
695   int i;
696
697   for (i = 0; i < VNET_N_MTU; i++)
698     {
699       if (si->mtu[i] != mtu[i])
700         {
701           si->mtu[i] = mtu[i];
702           changed = true;
703         }
704     }
705   /* Notify interested parties */
706   if (changed)
707     call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
708 }
709
710 void
711 vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
712                                          u32 sw_if_index, u8 enable)
713 {
714   vnet_sw_interface_t *si;
715
716   si = vnet_get_sw_interface (vnm, sw_if_index);
717
718   if (enable)
719     si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
720   else
721     si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
722
723   ip4_directed_broadcast (sw_if_index, enable);
724 }
725
726 /*
727  * Reflect a change in hardware MTU on protocol MTUs
728  */
729 static walk_rc_t
730 sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
731 {
732   u32 *link_mtu = ctx;
733   vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
734   return WALK_CONTINUE;
735 }
736
737 void
738 vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
739 {
740   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
741
742   if (hi->max_packet_bytes != mtu)
743     {
744       hi->max_packet_bytes = mtu;
745       ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
746       vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
747                                  &mtu);
748     }
749 }
750
751 static void
752 setup_tx_node (vlib_main_t * vm,
753                u32 node_index, vnet_device_class_t * dev_class)
754 {
755   vlib_node_t *n = vlib_get_node (vm, node_index);
756
757   n->function = dev_class->tx_function;
758   n->format_trace = dev_class->format_tx_trace;
759
760   vlib_register_errors (vm, node_index,
761                         dev_class->tx_function_n_errors,
762                         dev_class->tx_function_error_strings);
763 }
764
765 static void
766 setup_output_node (vlib_main_t * vm,
767                    u32 node_index, vnet_hw_interface_class_t * hw_class)
768 {
769   vlib_node_t *n = vlib_get_node (vm, node_index);
770   n->format_buffer = hw_class->format_header;
771   n->unformat_buffer = hw_class->unformat_header;
772 }
773
774 /* Register an interface instance. */
775 u32
776 vnet_register_interface (vnet_main_t * vnm,
777                          u32 dev_class_index,
778                          u32 dev_instance,
779                          u32 hw_class_index, u32 hw_instance)
780 {
781   vnet_interface_main_t *im = &vnm->interface_main;
782   vnet_hw_interface_t *hw;
783   vnet_device_class_t *dev_class =
784     vnet_get_device_class (vnm, dev_class_index);
785   vnet_hw_interface_class_t *hw_class =
786     vnet_get_hw_interface_class (vnm, hw_class_index);
787   vlib_main_t *vm = vnm->vlib_main;
788   vnet_feature_config_main_t *fcm;
789   vnet_config_main_t *cm;
790   u32 hw_index, i;
791   char *tx_node_name = NULL, *output_node_name = NULL;
792
793   pool_get (im->hw_interfaces, hw);
794   memset (hw, 0, sizeof (*hw));
795
796   hw_index = hw - im->hw_interfaces;
797   hw->hw_if_index = hw_index;
798   hw->default_rx_mode = VNET_HW_INTERFACE_RX_MODE_POLLING;
799
800   if (dev_class->format_device_name)
801     hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
802   else if (hw_class->format_interface_name)
803     hw->name = format (0, "%U", hw_class->format_interface_name,
804                        dev_instance);
805   else
806     hw->name = format (0, "%s%x", hw_class->name, dev_instance);
807
808   if (!im->hw_interface_by_name)
809     im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
810                                                 sizeof (hw->name[0]),
811                                                 sizeof (uword));
812
813   hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);
814
815   /* Make hardware interface point to software interface. */
816   {
817     vnet_sw_interface_t sw = {
818       .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
819       .flood_class = VNET_FLOOD_CLASS_NORMAL,
820       .hw_if_index = hw_index
821     };
822     hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
823   }
824
825   hw->dev_class_index = dev_class_index;
826   hw->dev_instance = dev_instance;
827   hw->hw_class_index = hw_class_index;
828   hw->hw_instance = hw_instance;
829
830   hw->max_rate_bits_per_sec = 0;
831   hw->min_packet_bytes = 0;
832   vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);
833
834   if (dev_class->tx_function == 0)
835     goto no_output_nodes;       /* No output/tx nodes to create */
836
837   tx_node_name = (char *) format (0, "%v-tx", hw->name);
838   output_node_name = (char *) format (0, "%v-output", hw->name);
839
840   /* If we have previously deleted interface nodes, re-use them. */
841   if (vec_len (im->deleted_hw_interface_nodes) > 0)
842     {
843       vnet_hw_interface_nodes_t *hn;
844       vlib_node_t *node;
845       vlib_node_runtime_t *nrt;
846
847       hn = vec_end (im->deleted_hw_interface_nodes) - 1;
848
849       hw->tx_node_index = hn->tx_node_index;
850       hw->output_node_index = hn->output_node_index;
851
852       vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
853       vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);
854
855       /* *INDENT-OFF* */
856       foreach_vlib_main ({
857         vnet_interface_output_runtime_t *rt;
858
859         rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
860         ASSERT (rt->is_deleted == 1);
861         rt->is_deleted = 0;
862         rt->hw_if_index = hw_index;
863         rt->sw_if_index = hw->sw_if_index;
864         rt->dev_instance = hw->dev_instance;
865
866         rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
867         rt->hw_if_index = hw_index;
868         rt->sw_if_index = hw->sw_if_index;
869         rt->dev_instance = hw->dev_instance;
870       });
871       /* *INDENT-ON* */
872
873       /* The new class may differ from the old one.
874        * Functions have to be updated. */
875       node = vlib_get_node (vm, hw->output_node_index);
876       node->function = vnet_interface_output_node_multiarch_select ();
877       node->format_trace = format_vnet_interface_output_trace;
878       /* *INDENT-OFF* */
879       foreach_vlib_main ({
880         nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
881         nrt->function = node->function;
882       });
883       /* *INDENT-ON* */
884
885       node = vlib_get_node (vm, hw->tx_node_index);
886       node->function = dev_class->tx_function;
887       node->format_trace = dev_class->format_tx_trace;
888       /* *INDENT-OFF* */
889       foreach_vlib_main ({
890         nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
891         nrt->function = node->function;
892       });
893       /* *INDENT-ON* */
894
895       _vec_len (im->deleted_hw_interface_nodes) -= 1;
896     }
897   else
898     {
899       vlib_node_registration_t r;
900       vnet_interface_output_runtime_t rt = {
901         .hw_if_index = hw_index,
902         .sw_if_index = hw->sw_if_index,
903         .dev_instance = hw->dev_instance,
904         .is_deleted = 0,
905       };
906
907       memset (&r, 0, sizeof (r));
908       r.type = VLIB_NODE_TYPE_INTERNAL;
909       r.runtime_data = &rt;
910       r.runtime_data_bytes = sizeof (rt);
911       r.scalar_size = 0;
912       r.vector_size = sizeof (u32);
913
914       r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
915       r.name = tx_node_name;
916       r.function = dev_class->tx_function;
917
918       hw->tx_node_index = vlib_register_node (vm, &r);
919
920       vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
921                                           "error-drop",
922                                           VNET_INTERFACE_TX_NEXT_DROP);
923
924       r.flags = 0;
925       r.name = output_node_name;
926       r.function = vnet_interface_output_node_multiarch_select ();
927       r.format_trace = format_vnet_interface_output_trace;
928
929       {
930         static char *e[] = {
931           "interface is down",
932           "interface is deleted",
933         };
934
935         r.n_errors = ARRAY_LEN (e);
936         r.error_strings = e;
937       }
938       hw->output_node_index = vlib_register_node (vm, &r);
939
940       vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
941                                           "error-drop",
942                                           VNET_INTERFACE_OUTPUT_NEXT_DROP);
943       vlib_node_add_next_with_slot (vm, hw->output_node_index,
944                                     hw->tx_node_index,
945                                     VNET_INTERFACE_OUTPUT_NEXT_TX);
946
947       /* add interface to the list of "output-interface" feature arc start nodes
948          and clone nexts from 1st interface if it exists */
949       fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
950       cm = &fcm->config_main;
951       i = vec_len (cm->start_node_indices);
952       vec_validate (cm->start_node_indices, i);
953       cm->start_node_indices[i] = hw->output_node_index;
954       if (hw_index)
955         {
956           /* copy nexts from 1st interface */
957           vnet_hw_interface_t *first_hw;
958           vlib_node_t *first_node;
959
960           first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
961           first_node = vlib_get_node (vm, first_hw->output_node_index);
962
963           /* 1st 2 nexts are already added above */
964           for (i = 2; i < vec_len (first_node->next_nodes); i++)
965             vlib_node_add_next_with_slot (vm, hw->output_node_index,
966                                           first_node->next_nodes[i], i);
967         }
968     }
969
970   setup_output_node (vm, hw->output_node_index, hw_class);
971   setup_tx_node (vm, hw->tx_node_index, dev_class);
972
973 no_output_nodes:
974   /* Call all up/down callbacks with zero flags when interface is created. */
975   vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
976                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
977   vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
978                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
979   vec_free (tx_node_name);
980   vec_free (output_node_name);
981
982   return hw_index;
983 }
984
985 void
986 vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
987 {
988   vnet_interface_main_t *im = &vnm->interface_main;
989   vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
990   vlib_main_t *vm = vnm->vlib_main;
991   vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
992                                                           hw->dev_class_index);
993   /* If it is up, mark it down. */
994   if (hw->flags != 0)
995     vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);
996
997   /* Call delete callbacks. */
998   call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);
999
1000   /* Delete any sub-interfaces. */
1001   {
1002     u32 id, sw_if_index;
1003     /* *INDENT-OFF* */
1004     hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
1005     ({
1006       vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1007       u64 sup_and_sub_key =
1008         ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
1009       hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
1010       vnet_delete_sw_interface (vnm, sw_if_index);
1011     }));
1012     hash_free (hw->sub_interface_sw_if_index_by_id);
1013     /* *INDENT-ON* */
1014   }
1015
1016   /* Delete software interface corresponding to hardware interface. */
1017   vnet_delete_sw_interface (vnm, hw->sw_if_index);
1018
1019   if (dev_class->tx_function)
1020     {
1021       /* Put output/tx nodes into recycle pool */
1022       vnet_hw_interface_nodes_t *dn;
1023
1024       /* *INDENT-OFF* */
1025       foreach_vlib_main
1026         ({
1027           vnet_interface_output_runtime_t *rt =
1028             vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
1029
1030           /* Mark node runtime as deleted so output node (if called)
1031            * will drop packets. */
1032           rt->is_deleted = 1;
1033         });
1034       /* *INDENT-ON* */
1035
1036       vlib_node_rename (vm, hw->output_node_index,
1037                         "interface-%d-output-deleted", hw_if_index);
1038       vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
1039                         hw_if_index);
1040       vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
1041       dn->tx_node_index = hw->tx_node_index;
1042       dn->output_node_index = hw->output_node_index;
1043     }
1044
1045   hash_unset_mem (im->hw_interface_by_name, hw->name);
1046   vec_free (hw->name);
1047   vec_free (hw->hw_address);
1048   vec_free (hw->input_node_thread_index_by_queue);
1049   vec_free (hw->dq_runtime_index_by_queue);
1050
1051   pool_put (im->hw_interfaces, hw);
1052 }
1053
1054 void
1055 vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1056                            u32 hw_if_index,
1057                            vnet_hw_sw_interface_walk_t fn, void *ctx)
1058 {
1059   vnet_hw_interface_t *hi;
1060   u32 id, sw_if_index;
1061
1062   hi = vnet_get_hw_interface (vnm, hw_if_index);
1063   /* the super first, then the sub interfaces */
1064   if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1065     return;
1066
1067   /* *INDENT-OFF* */
1068   hash_foreach (id, sw_if_index,
1069                 hi->sub_interface_sw_if_index_by_id,
1070   ({
1071     if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1072       break;
1073   }));
1074   /* *INDENT-ON* */
1075 }
1076
1077 void
1078 vnet_hw_interface_walk (vnet_main_t * vnm,
1079                         vnet_hw_interface_walk_t fn, void *ctx)
1080 {
1081   vnet_interface_main_t *im;
1082   vnet_hw_interface_t *hi;
1083
1084   im = &vnm->interface_main;
1085
1086   /* *INDENT-OFF* */
1087   pool_foreach (hi, im->hw_interfaces,
1088   ({
1089     if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1090       break;
1091   }));
1092   /* *INDENT-ON* */
1093 }
1094
1095 void
1096 vnet_sw_interface_walk (vnet_main_t * vnm,
1097                         vnet_sw_interface_walk_t fn, void *ctx)
1098 {
1099   vnet_interface_main_t *im;
1100   vnet_sw_interface_t *si;
1101
1102   im = &vnm->interface_main;
1103
1104   /* *INDENT-OFF* */
1105   pool_foreach (si, im->sw_interfaces,
1106   {
1107     if (WALK_STOP == fn (vnm, si, ctx))
1108       break;
1109   });
1110   /* *INDENT-ON* */
1111 }
1112
1113 static void
1114 serialize_vnet_hw_interface_set_class (serialize_main_t * m, va_list * va)
1115 {
1116   u32 hw_if_index = va_arg (*va, u32);
1117   char *hw_class_name = va_arg (*va, char *);
1118   serialize_integer (m, hw_if_index, sizeof (hw_if_index));
1119   serialize_cstring (m, hw_class_name);
1120 }
1121
1122 static void
1123 unserialize_vnet_hw_interface_set_class (serialize_main_t * m, va_list * va)
1124 {
1125   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
1126   vnet_main_t *vnm = vnet_get_main ();
1127   u32 hw_if_index;
1128   char *hw_class_name;
1129   uword *p;
1130   clib_error_t *error;
1131
1132   unserialize_integer (m, &hw_if_index, sizeof (hw_if_index));
1133   unserialize_cstring (m, &hw_class_name);
1134   p =
1135     hash_get (vnm->interface_main.hw_interface_class_by_name, hw_class_name);
1136   ASSERT (p != 0);
1137   error = vnet_hw_interface_set_class_helper (vnm, hw_if_index, p[0],
1138                                               /* redistribute */ 0);
1139   if (error)
1140     clib_error_report (error);
1141 }
1142
1143 MC_SERIALIZE_MSG (vnet_hw_interface_set_class_msg, static) =
1144 {
1145 .name = "vnet_hw_interface_set_class",.serialize =
1146     serialize_vnet_hw_interface_set_class,.unserialize =
1147     unserialize_vnet_hw_interface_set_class,};
1148
1149 void
1150 vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1151                                   u32 hw_class_index, u32 hw_instance)
1152 {
1153   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1154   vnet_hw_interface_class_t *hc =
1155     vnet_get_hw_interface_class (vnm, hw_class_index);
1156
1157   hi->hw_class_index = hw_class_index;
1158   hi->hw_instance = hw_instance;
1159   setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1160 }
1161
1162 static clib_error_t *
1163 vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1164                                     u32 hw_class_index, u32 redistribute)
1165 {
1166   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1167   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1168   vnet_hw_interface_class_t *old_class =
1169     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1170   vnet_hw_interface_class_t *new_class =
1171     vnet_get_hw_interface_class (vnm, hw_class_index);
1172   vnet_device_class_t *dev_class =
1173     vnet_get_device_class (vnm, hi->dev_class_index);
1174   clib_error_t *error = 0;
1175
1176   /* New class equals old class?  Nothing to do. */
1177   if (hi->hw_class_index == hw_class_index)
1178     return 0;
1179
1180   /* No need (and incorrect since admin up flag may be set) to do error checking when
1181      receiving unserialize message. */
1182   if (redistribute)
1183     {
1184       if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1185         return clib_error_return (0,
1186                                   "%v must be admin down to change class from %s to %s",
1187                                   hi->name, old_class->name, new_class->name);
1188
1189       /* Make sure interface supports given class. */
1190       if ((new_class->is_valid_class_for_interface
1191            && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1192                                                         hw_class_index))
1193           || (dev_class->is_valid_class_for_interface
1194               && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1195                                                            hw_class_index)))
1196         return clib_error_return (0,
1197                                   "%v class cannot be changed from %s to %s",
1198                                   hi->name, old_class->name, new_class->name);
1199
1200       if (vnm->vlib_main->mc_main)
1201         {
1202           mc_serialize (vnm->vlib_main->mc_main,
1203                         &vnet_hw_interface_set_class_msg, hw_if_index,
1204                         new_class->name);
1205           return 0;
1206         }
1207     }
1208
1209   if (old_class->hw_class_change)
1210     old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1211                                 new_class->index);
1212
1213   vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1214                                     /* instance */ ~0);
1215
1216   if (new_class->hw_class_change)
1217     new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1218                                 new_class->index);
1219
1220   if (dev_class->hw_class_change)
1221     dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1222
1223   return error;
1224 }
1225
1226 clib_error_t *
1227 vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1228                              u32 hw_class_index)
1229 {
1230   return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1231                                              /* redistribute */ 1);
1232 }
1233
1234 static int
1235 vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1236                                               u32 hw_if_index,
1237                                               u32 node_index,
1238                                               u32 redistribute)
1239 {
1240   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1241   vnet_device_class_t *dev_class = vnet_get_device_class
1242     (vnm, hi->dev_class_index);
1243
1244   if (redistribute)
1245     {
1246       /* $$$$ fixme someday maybe */
1247       ASSERT (vnm->vlib_main->mc_main == 0);
1248     }
1249   if (dev_class->rx_redirect_to_node)
1250     {
1251       dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1252       return 0;
1253     }
1254
1255   return VNET_API_ERROR_UNIMPLEMENTED;
1256 }
1257
1258 int
1259 vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1260                                        u32 node_index)
1261 {
1262   return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1263                                                        node_index,
1264                                                        1 /* redistribute */ );
1265 }
1266
1267 word
1268 vnet_sw_interface_compare (vnet_main_t * vnm,
1269                            uword sw_if_index0, uword sw_if_index1)
1270 {
1271   vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1272   vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1273   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1274   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1275
1276   if (h0 != h1)
1277     return vec_cmp (h0->name, h1->name);
1278   return (word) h0->hw_instance - (word) h1->hw_instance;
1279 }
1280
1281 word
1282 vnet_hw_interface_compare (vnet_main_t * vnm,
1283                            uword hw_if_index0, uword hw_if_index1)
1284 {
1285   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1286   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1287
1288   if (h0 != h1)
1289     return vec_cmp (h0->name, h1->name);
1290   return (word) h0->hw_instance - (word) h1->hw_instance;
1291 }
1292
1293 int
1294 vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1295 {
1296   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1297   if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1298       (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1299     return 1;
1300
1301   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1302   vnet_hw_interface_class_t *hc =
1303     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1304
1305   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1306 }
1307
1308 clib_error_t *
1309 vnet_interface_init (vlib_main_t * vm)
1310 {
1311   vnet_main_t *vnm = vnet_get_main ();
1312   vnet_interface_main_t *im = &vnm->interface_main;
1313   vlib_buffer_t *b = 0;
1314   vnet_buffer_opaque_t *o = 0;
1315   clib_error_t *error;
1316
1317   /*
1318    * Keep people from shooting themselves in the foot.
1319    */
1320   if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
1321     {
1322 #define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
1323       clib_warning                                                      \
1324         ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
1325          #a, sizeof(o->a), sizeof (o->unused));
1326       foreach_buffer_opaque_union_subtype;
1327 #undef _
1328
1329       return clib_error_return
1330         (0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
1331          sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
1332     }
1333
1334   im->sw_if_counter_lock = clib_mem_alloc_aligned (CLIB_CACHE_LINE_BYTES,
1335                                                    CLIB_CACHE_LINE_BYTES);
1336   im->sw_if_counter_lock[0] = 1;        /* should be no need */
1337
1338   vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
1339 #define _(E,n,p)                                                        \
1340   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;             \
1341   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1342   foreach_simple_interface_counter_name
1343 #undef _
1344     vec_validate (im->combined_sw_if_counters,
1345                   VNET_N_COMBINED_INTERFACE_COUNTER - 1);
1346 #define _(E,n,p)                                                        \
1347   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;    \
1348   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1349   foreach_combined_interface_counter_name
1350 #undef _
1351     im->sw_if_counter_lock[0] = 0;
1352
1353   im->device_class_by_name = hash_create_string ( /* size */ 0,
1354                                                  sizeof (uword));
1355   {
1356     vnet_device_class_t *c;
1357
1358     c = vnm->device_class_registrations;
1359
1360     while (c)
1361       {
1362         c->index = vec_len (im->device_classes);
1363         hash_set_mem (im->device_class_by_name, c->name, c->index);
1364
1365         if (c->tx_fn_registrations)
1366           {
1367             vlib_node_fn_registration_t *fnr = c->tx_fn_registrations;
1368             int priority = -1;
1369
1370             /* to avoid confusion, please remove ".tx_function" statement
1371                from VNET_DEVICE_CLASS() if using function candidates */
1372             ASSERT (c->tx_function == 0);
1373
1374             while (fnr)
1375               {
1376                 if (fnr->priority > priority)
1377                   {
1378                     priority = fnr->priority;
1379                     c->tx_function = fnr->function;
1380                   }
1381                 fnr = fnr->next_registration;
1382               }
1383           }
1384
1385         vec_add1 (im->device_classes, c[0]);
1386         c = c->next_class_registration;
1387       }
1388   }
1389
1390   im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
1391                                                        sizeof (uword));
1392
1393   im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
1394                                                     sizeof (uword));
1395   {
1396     vnet_hw_interface_class_t *c;
1397
1398     c = vnm->hw_interface_class_registrations;
1399
1400     while (c)
1401       {
1402         c->index = vec_len (im->hw_interface_classes);
1403         hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);
1404
1405         if (NULL == c->build_rewrite)
1406           c->build_rewrite = default_build_rewrite;
1407         if (NULL == c->update_adjacency)
1408           c->update_adjacency = default_update_adjacency;
1409
1410         vec_add1 (im->hw_interface_classes, c[0]);
1411         c = c->next_class_registration;
1412       }
1413   }
1414
1415   if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
1416     return error;
1417
1418   vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));
1419
1420 #if VLIB_BUFFER_TRACE_TRAJECTORY > 0
1421   if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
1422     return error;
1423 #endif
1424
1425   return 0;
1426 }
1427
1428 VLIB_INIT_FUNCTION (vnet_interface_init);
1429
1430 /* Kludge to renumber interface names [only!] */
1431 int
1432 vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1433 {
1434   int rv;
1435   vnet_main_t *vnm = vnet_get_main ();
1436   vnet_interface_main_t *im = &vnm->interface_main;
1437   vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1438
1439   vnet_device_class_t *dev_class = vnet_get_device_class
1440     (vnm, hi->dev_class_index);
1441
1442   if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1443     return VNET_API_ERROR_UNIMPLEMENTED;
1444
1445   rv = dev_class->name_renumber (hi, new_show_dev_instance);
1446
1447   if (rv)
1448     return rv;
1449
1450   hash_unset_mem (im->hw_interface_by_name, hi->name);
1451   vec_free (hi->name);
1452   /* Use the mapping we set up to call it Ishmael */
1453   hi->name = format (0, "%U", dev_class->format_device_name,
1454                      hi->dev_instance);
1455
1456   hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1457   return rv;
1458 }
1459
1460 clib_error_t *
1461 vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1462 {
1463   vnet_interface_main_t *im = &vnm->interface_main;
1464   vlib_main_t *vm = vnm->vlib_main;
1465   vnet_hw_interface_t *hw;
1466   u8 *old_name;
1467   clib_error_t *error = 0;
1468
1469   hw = vnet_get_hw_interface (vnm, hw_if_index);
1470   if (!hw)
1471     {
1472       return clib_error_return (0,
1473                                 "unable to find hw interface for index %u",
1474                                 hw_if_index);
1475     }
1476
1477   old_name = hw->name;
1478
1479   /* set new hw->name */
1480   hw->name = format (0, "%s", new_name);
1481
1482   /* remove the old name to hw_if_index mapping and install the new one */
1483   hash_unset_mem (im->hw_interface_by_name, old_name);
1484   hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1485
1486   /* rename tx/output nodes */
1487   vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1488   vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1489
1490   /* free the old name vector */
1491   vec_free (old_name);
1492
1493   return error;
1494 }
1495
1496 static clib_error_t *
1497 vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1498                                              u32 hw_if_index,
1499                                              u8 * mac_address)
1500 {
1501   clib_error_t *error = 0;
1502   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1503
1504   if (hi->hw_address)
1505     {
1506       u8 *old_address = vec_dup (hi->hw_address);
1507       vnet_device_class_t *dev_class =
1508         vnet_get_device_class (vnm, hi->dev_class_index);
1509       if (dev_class->mac_addr_change_function)
1510         {
1511           error =
1512             dev_class->mac_addr_change_function (hi, old_address,
1513                                                  mac_address);
1514         }
1515       if (!error)
1516         {
1517           vnet_hw_interface_class_t *hw_class;
1518
1519           hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1520
1521           if (NULL != hw_class->mac_addr_change_function)
1522             hw_class->mac_addr_change_function (hi, old_address, mac_address);
1523         }
1524       else
1525         {
1526           error =
1527             clib_error_return (0,
1528                                "MAC Address Change is not supported on this interface");
1529         }
1530       vec_free (old_address);
1531     }
1532   else
1533     {
1534       error =
1535         clib_error_return (0,
1536                            "mac address change is not supported for interface index %u",
1537                            hw_if_index);
1538     }
1539   return error;
1540 }
1541
1542 clib_error_t *
1543 vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1544                                       u8 * mac_address)
1545 {
1546   return vnet_hw_interface_change_mac_address_helper
1547     (vnm, hw_if_index, mac_address);
1548 }
1549
1550 /* update the unnumbered state of an interface*/
1551 void
1552 vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1553                                      u32 ip_sw_if_index, u8 enable)
1554 {
1555   vnet_main_t *vnm = vnet_get_main ();
1556   vnet_sw_interface_t *si;
1557   u32 was_unnum;
1558
1559   si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1560   was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1561
1562   if (enable)
1563     {
1564       si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1565       si->unnumbered_sw_if_index = ip_sw_if_index;
1566
1567       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1568         [unnumbered_sw_if_index] =
1569         ip4_main.
1570         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1571       ip6_main.
1572         lookup_main.if_address_pool_index_by_sw_if_index
1573         [unnumbered_sw_if_index] =
1574         ip6_main.
1575         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1576     }
1577   else
1578     {
1579       si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1580       si->unnumbered_sw_if_index = (u32) ~ 0;
1581
1582       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1583         [unnumbered_sw_if_index] = ~0;
1584       ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1585         [unnumbered_sw_if_index] = ~0;
1586     }
1587
1588   if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1589     {
1590       ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1591       ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1592     }
1593 }
1594
1595 vnet_l3_packet_type_t
1596 vnet_link_to_l3_proto (vnet_link_t link)
1597 {
1598   switch (link)
1599     {
1600     case VNET_LINK_IP4:
1601       return (VNET_L3_PACKET_TYPE_IP4);
1602     case VNET_LINK_IP6:
1603       return (VNET_L3_PACKET_TYPE_IP6);
1604     case VNET_LINK_MPLS:
1605       return (VNET_L3_PACKET_TYPE_MPLS);
1606     case VNET_LINK_ARP:
1607       return (VNET_L3_PACKET_TYPE_ARP);
1608     case VNET_LINK_ETHERNET:
1609     case VNET_LINK_NSH:
1610       ASSERT (0);
1611       break;
1612     }
1613   ASSERT (0);
1614   return (0);
1615 }
1616
1617 vnet_mtu_t
1618 vnet_link_to_mtu (vnet_link_t link)
1619 {
1620   switch (link)
1621     {
1622     case VNET_LINK_IP4:
1623       return (VNET_MTU_IP4);
1624     case VNET_LINK_IP6:
1625       return (VNET_MTU_IP6);
1626     case VNET_LINK_MPLS:
1627       return (VNET_MTU_MPLS);
1628     default:
1629       return (VNET_MTU_L3);
1630     }
1631 }
1632
1633 u8 *
1634 default_build_rewrite (vnet_main_t * vnm,
1635                        u32 sw_if_index,
1636                        vnet_link_t link_type, const void *dst_address)
1637 {
1638   return (NULL);
1639 }
1640
1641 void
1642 default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1643 {
1644   ip_adjacency_t *adj;
1645
1646   adj = adj_get (ai);
1647
1648   switch (adj->lookup_next_index)
1649     {
1650     case IP_LOOKUP_NEXT_GLEAN:
1651       adj_glean_update_rewrite (ai);
1652       break;
1653     case IP_LOOKUP_NEXT_ARP:
1654     case IP_LOOKUP_NEXT_BCAST:
1655       /*
1656        * default rewrite in neighbour adj
1657        */
1658       adj_nbr_update_rewrite
1659         (ai,
1660          ADJ_NBR_REWRITE_FLAG_COMPLETE,
1661          vnet_build_rewrite_for_sw_interface (vnm,
1662                                               sw_if_index,
1663                                               adj_get_link_type (ai), NULL));
1664       break;
1665     case IP_LOOKUP_NEXT_MCAST:
1666       /*
1667        * mcast traffic also uses default rewrite string with no mcast
1668        * switch time updates.
1669        */
1670       adj_mcast_update_rewrite
1671         (ai,
1672          vnet_build_rewrite_for_sw_interface (vnm,
1673                                               sw_if_index,
1674                                               adj_get_link_type (ai),
1675                                               NULL), 0);
1676       break;
1677     case IP_LOOKUP_NEXT_DROP:
1678     case IP_LOOKUP_NEXT_PUNT:
1679     case IP_LOOKUP_NEXT_LOCAL:
1680     case IP_LOOKUP_NEXT_REWRITE:
1681     case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1682     case IP_LOOKUP_NEXT_MIDCHAIN:
1683     case IP_LOOKUP_NEXT_ICMP_ERROR:
1684     case IP_LOOKUP_N_NEXT:
1685       ASSERT (0);
1686       break;
1687     }
1688 }
1689
/* Global switch for detailed interface statistics: 1 when enabled, 0
   when disabled.  Starts disabled. */
int collect_detailed_interface_stats_flag = 0;

/* Store the requested state in the global switch. */
static inline void
collect_detailed_interface_stats_flag_store (int enabled)
{
  collect_detailed_interface_stats_flag = enabled;
}

/* Turn detailed interface statistics on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_store (1);
}

/* Turn detailed interface statistics off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_store (0);
}
1703
1704 static clib_error_t *
1705 collect_detailed_interface_stats_cli (vlib_main_t * vm,
1706                                       unformat_input_t * input,
1707                                       vlib_cli_command_t * cmd)
1708 {
1709   unformat_input_t _line_input, *line_input = &_line_input;
1710   clib_error_t *error = NULL;
1711
1712   /* Get a line of input. */
1713   if (!unformat_user (input, unformat_line_input, line_input))
1714     return clib_error_return (0, "expected enable | disable");
1715
1716   while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1717     {
1718       if (unformat (line_input, "enable") || unformat (line_input, "on"))
1719         collect_detailed_interface_stats_flag_set ();
1720       else if (unformat (line_input, "disable")
1721                || unformat (line_input, "off"))
1722         collect_detailed_interface_stats_flag_clear ();
1723       else
1724         {
1725           error = clib_error_return (0, "unknown input `%U'",
1726                                      format_unformat_error, line_input);
1727           goto done;
1728         }
1729     }
1730
1731 done:
1732   unformat_free (line_input);
1733   return error;
1734 }
1735
1736 /* *INDENT-OFF* */
1737 VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
1738   .path = "interface collect detailed-stats",
1739   .short_help = "interface collect detailed-stats <enable|disable>",
1740   .function = collect_detailed_interface_stats_cli,
1741 };
1742 /* *INDENT-ON* */
1743
1744 /*
1745  * fd.io coding-style-patch-verification: ON
1746  *
1747  * Local Variables:
1748  * eval: (c-set-style "gnu")
1749  * End:
1750  */