IP directed broadcast
[vpp.git] / src / vnet / interface.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.c: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #include <vnet/vnet.h>
41 #include <vnet/plugin/plugin.h>
42 #include <vnet/fib/ip6_fib.h>
43 #include <vnet/adj/adj.h>
44 #include <vnet/adj/adj_mcast.h>
45
/* Bits accepted in the helper_flags argument of the *_set_flags_helper
   routines declared below. */

/* The interface is being created: the helpers run the add/del callbacks
   and do not take the "already in the desired state" shortcut. */
#define VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE (1 << 0)
/* The caller wants the change forwarded with mc_serialize; the helpers
   only do so when vm->mc_main is set and the device class redistributes. */
#define VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE (1 << 1)

/* Forward declarations: the unserialize handlers in this file call these
   helpers before their definitions appear. */
static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
                                                         u32 hw_if_index,
                                                         u32 flags,
                                                         u32 helper_flags);

static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
                                                         u32 sw_if_index,
                                                         u32 flags,
                                                         u32 helper_flags);

static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
                                                         u32 hw_if_index,
                                                         u32 hw_class_index,
                                                         u32 redistribute);
63
/* One (interface index, flags) record.  It is the payload of the
   set-flags messages and the element type of the state vectors that are
   serialized / unserialized in this file. */
typedef struct
{
  /* Either sw or hw interface index; which of the two depends on the
     message or vector the record travels in. */
  u32 sw_hw_if_index;

  /* Interface flags that go with the index above. */
  u32 flags;
} vnet_sw_hw_interface_state_t;
72
73 static void
74 serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
75 {
76   vnet_sw_hw_interface_state_t *s =
77     va_arg (*va, vnet_sw_hw_interface_state_t *);
78   u32 n = va_arg (*va, u32);
79   u32 i;
80   for (i = 0; i < n; i++)
81     {
82       serialize_integer (m, s[i].sw_hw_if_index,
83                          sizeof (s[i].sw_hw_if_index));
84       serialize_integer (m, s[i].flags, sizeof (s[i].flags));
85     }
86 }
87
88 static void
89 unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
90                                             va_list * va)
91 {
92   vnet_sw_hw_interface_state_t *s =
93     va_arg (*va, vnet_sw_hw_interface_state_t *);
94   u32 n = va_arg (*va, u32);
95   u32 i;
96   for (i = 0; i < n; i++)
97     {
98       unserialize_integer (m, &s[i].sw_hw_if_index,
99                            sizeof (s[i].sw_hw_if_index));
100       unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
101     }
102 }
103
104 static void
105 serialize_vnet_sw_hw_interface_set_flags (serialize_main_t * m, va_list * va)
106 {
107   vnet_sw_hw_interface_state_t *s =
108     va_arg (*va, vnet_sw_hw_interface_state_t *);
109   serialize (m, serialize_vec_vnet_sw_hw_interface_state, s, 1);
110 }
111
112 static void
113 unserialize_vnet_sw_interface_set_flags (serialize_main_t * m, va_list * va)
114 {
115   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
116   vnet_sw_hw_interface_state_t s;
117
118   unserialize (m, unserialize_vec_vnet_sw_hw_interface_state, &s, 1);
119
120   vnet_sw_interface_set_flags_helper
121     (vnet_get_main (), s.sw_hw_if_index, s.flags,
122      /* helper_flags no redistribution */ 0);
123 }
124
125 static void
126 unserialize_vnet_hw_interface_set_flags (serialize_main_t * m, va_list * va)
127 {
128   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
129   vnet_sw_hw_interface_state_t s;
130
131   unserialize (m, unserialize_vec_vnet_sw_hw_interface_state, &s, 1);
132
133   vnet_hw_interface_set_flags_helper
134     (vnet_get_main (), s.sw_hw_if_index, s.flags,
135      /* helper_flags no redistribution */ 0);
136 }
137
138 MC_SERIALIZE_MSG (vnet_sw_interface_set_flags_msg, static) =
139 {
140 .name = "vnet_sw_interface_set_flags",.serialize =
141     serialize_vnet_sw_hw_interface_set_flags,.unserialize =
142     unserialize_vnet_sw_interface_set_flags,};
143
144 MC_SERIALIZE_MSG (vnet_hw_interface_set_flags_msg, static) =
145 {
146 .name = "vnet_hw_interface_set_flags",.serialize =
147     serialize_vnet_sw_hw_interface_set_flags,.unserialize =
148     unserialize_vnet_hw_interface_set_flags,};
149
150 void
151 serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
152 {
153   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
154   vnet_sw_hw_interface_state_t *sts = 0, *st;
155   vnet_sw_interface_t *sif;
156   vnet_hw_interface_t *hif;
157   vnet_interface_main_t *im = &vnm->interface_main;
158
159   /* Serialize hardware interface classes since they may have changed.
160      Must do this before sending up/down flags. */
161   /* *INDENT-OFF* */
162   pool_foreach (hif, im->hw_interfaces, ({
163     vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
164     serialize_cstring (m, hw_class->name);
165   }));
166   /* *INDENT-ON* */
167
168   /* Send sw/hw interface state when non-zero. */
169   /* *INDENT-OFF* */
170   pool_foreach (sif, im->sw_interfaces, ({
171     if (sif->flags != 0)
172       {
173         vec_add2 (sts, st, 1);
174         st->sw_hw_if_index = sif->sw_if_index;
175         st->flags = sif->flags;
176       }
177   }));
178   /* *INDENT-ON* */
179
180   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
181
182   if (sts)
183     _vec_len (sts) = 0;
184
185   /* *INDENT-OFF* */
186   pool_foreach (hif, im->hw_interfaces, ({
187     if (hif->flags != 0)
188       {
189         vec_add2 (sts, st, 1);
190         st->sw_hw_if_index = hif->hw_if_index;
191         st->flags = hif->flags;
192       }
193   }));
194   /* *INDENT-ON* */
195
196   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
197
198   vec_free (sts);
199 }
200
201 void
202 unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
203 {
204   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
205   vnet_sw_hw_interface_state_t *sts = 0, *st;
206
207   /* First set interface hardware class. */
208   {
209     vnet_interface_main_t *im = &vnm->interface_main;
210     vnet_hw_interface_t *hif;
211     char *class_name;
212     uword *p;
213     clib_error_t *error;
214
215     /* *INDENT-OFF* */
216     pool_foreach (hif, im->hw_interfaces, ({
217       unserialize_cstring (m, &class_name);
218       p = hash_get_mem (im->hw_interface_class_by_name, class_name);
219       ASSERT (p != 0);
220       error = vnet_hw_interface_set_class_helper (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
221       if (error)
222         clib_error_report (error);
223       vec_free (class_name);
224     }));
225     /* *INDENT-ON* */
226   }
227
228   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
229   vec_foreach (st, sts)
230     vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
231                                         /* no distribute */ 0);
232   vec_free (sts);
233
234   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
235   vec_foreach (st, sts)
236     vnet_hw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
237                                         /* no distribute */ 0);
238   vec_free (sts);
239 }
240
241 static clib_error_t *
242 call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
243                                       u32 flags,
244                                       _vnet_interface_function_list_elt_t **
245                                       elts)
246 {
247   _vnet_interface_function_list_elt_t *elt;
248   vnet_interface_function_priority_t prio;
249   clib_error_t *error = 0;
250
251   for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
252        prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
253     {
254       elt = elts[prio];
255
256       while (elt)
257         {
258           error = elt->fp (vnm, if_index, flags);
259           if (error)
260             return error;
261           elt = elt->next_interface_function;
262         }
263     }
264   return error;
265 }
266
267 static clib_error_t *
268 call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
269                                      u32 is_create)
270 {
271   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
272   vnet_hw_interface_class_t *hw_class =
273     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
274   vnet_device_class_t *dev_class =
275     vnet_get_device_class (vnm, hi->dev_class_index);
276   clib_error_t *error = 0;
277
278   if (hw_class->interface_add_del_function
279       && (error =
280           hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
281     return error;
282
283   if (dev_class->interface_add_del_function
284       && (error =
285           dev_class->interface_add_del_function (vnm, hw_if_index,
286                                                  is_create)))
287     return error;
288
289   error = call_elf_section_interface_callbacks
290     (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
291
292   return error;
293 }
294
295 static clib_error_t *
296 call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
297                                      u32 is_create)
298 {
299   return call_elf_section_interface_callbacks
300     (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
301 }
302
/* NOTE(review): these two macros repeat, token for token, the definitions
   that already appear after the #include block at the top of this file.
   An identical redefinition is legal C, but the copy is redundant and
   both sites must be kept in sync if a value ever changes. */
#define VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE (1 << 0)
#define VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE (1 << 1)
305
306 static clib_error_t *
307 vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
308                                     u32 flags, u32 helper_flags)
309 {
310   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
311   vnet_hw_interface_class_t *hw_class =
312     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
313   vnet_device_class_t *dev_class =
314     vnet_get_device_class (vnm, hi->dev_class_index);
315   vlib_main_t *vm = vnm->vlib_main;
316   u32 mask;
317   clib_error_t *error = 0;
318   u32 is_create =
319     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
320
321   mask =
322     (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK |
323      VNET_HW_INTERFACE_FLAG_SPEED_MASK);
324   flags &= mask;
325
326   /* Call hardware interface add/del callbacks. */
327   if (is_create)
328     call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
329
330   /* Already in the desired state? */
331   if (!is_create && (hi->flags & mask) == flags)
332     goto done;
333
334   /* Some interface classes do not redistribute (e.g. are local). */
335   if (!dev_class->redistribute)
336     helper_flags &= ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
337
338   if (vm->mc_main
339       && (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE))
340     {
341       vnet_sw_hw_interface_state_t s;
342       s.sw_hw_if_index = hw_if_index;
343       s.flags = flags;
344       mc_serialize (vm->mc_main, &vnet_hw_interface_set_flags_msg, &s);
345     }
346
347   if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
348       (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
349     {
350       /* Do hardware class (e.g. ethernet). */
351       if (hw_class->link_up_down_function
352           && (error = hw_class->link_up_down_function (vnm, hw_if_index,
353                                                        flags)))
354         goto done;
355
356       error = call_elf_section_interface_callbacks
357         (vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
358
359       if (error)
360         goto done;
361     }
362
363   hi->flags &= ~mask;
364   hi->flags |= flags;
365
366 done:
367   return error;
368 }
369
/* Apply admin-up / punt flags to a software interface and run the
 * callbacks that go with the change.
 *
 * Only the ADMIN_UP and PUNT bits of flags are honored (see mask below).
 * helper_flags is a combination of VNET_INTERFACE_SET_FLAGS_HELPER_*:
 *   IS_CREATE          run the sw add/del callbacks and, if the interface
 *                      is created admin up, the admin up/down callbacks;
 *   WANT_REDISTRIBUTE  forward the change with mc_serialize when
 *                      vm->mc_main is set (cleared below when the
 *                      underlying device class does not redistribute).
 *
 * Returns 0 on success, otherwise the clib_error_t produced by a callback
 * or by one of the checks below.
 */
static clib_error_t *
vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
                                    u32 flags, u32 helper_flags)
{
  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
  vlib_main_t *vm = vnm->vlib_main;
  u32 mask;
  clib_error_t *error = 0;
  u32 is_create =
    (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
  u32 old_flags;

  /* Bits this routine is allowed to change; everything else is dropped. */
  mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
  flags &= mask;

  if (is_create)
    {
      /* Creation path: announce the interface, then fall through to the
         final flag store at the bottom of the function. */
      error =
        call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
      if (error)
        goto done;

      if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
        {
          /* Notify everyone when the interface is created as admin up */
          error = call_elf_section_interface_callbacks (vnm, sw_if_index,
                                                        flags,
                                                        vnm->
                                                        sw_interface_admin_up_down_functions);
          if (error)
            goto done;
        }
    }
  else
    {
      /* For a non-sub interface si_sup stays equal to si. */
      vnet_sw_interface_t *si_sup = si;

      /* Check that super interface is in correct state. */
      if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
        {
          si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);

          /* A sub-interface may only take the same masked state as its
             parent; the one exception is bringing the sub-interface fully
             down (flags == 0) while the parent's masked state is exactly
             ADMIN_UP. */
          if ((flags != (si_sup->flags & mask)) &&
              (!((flags == 0)
                 && ((si_sup->flags & mask) ==
                     VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
            {
              error = clib_error_return (0, "super-interface %U must be %U",
                                         format_vnet_sw_interface_name, vnm,
                                         si_sup,
                                         format_vnet_sw_interface_flags,
                                         flags);
              goto done;
            }
        }

      /* Do not change state for slave links of bonded interfaces. */
      if (si->flags & VNET_SW_INTERFACE_FLAG_BOND_SLAVE)
        {
          error = clib_error_return
            (0, "not allowed as %U belong to a BondEthernet interface",
             format_vnet_sw_interface_name, vnm, si);
          goto done;
        }

      /* Already in the desired state? */
      if ((si->flags & mask) == flags)
        goto done;

      /* Sub-interfaces of hardware interfaces that do not redistribute
         do not redistribute themselves. */
      if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
        {
          vnet_hw_interface_t *hi =
            vnet_get_hw_interface (vnm, si_sup->hw_if_index);
          vnet_device_class_t *dev_class =
            vnet_get_device_class (vnm, hi->dev_class_index);
          if (!dev_class->redistribute)
            helper_flags &=
              ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
        }

      if (vm->mc_main
          && (helper_flags &
              VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE))
        {
          vnet_sw_hw_interface_state_t s;
          s.sw_hw_if_index = sw_if_index;
          s.flags = flags;
          mc_serialize (vm->mc_main, &vnet_sw_interface_set_flags_msg, &s);
        }

      /* Set the flags now, before invoking the registered clients, so that
       * the state they query is consistent with the state notified here. */
      old_flags = si->flags;
      si->flags &= ~mask;
      si->flags |= flags;
      /* Callbacks run only when ADMIN_UP is set in the old or new state. */
      if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
        error = call_elf_section_interface_callbacks
          (vnm, sw_if_index, flags,
           vnm->sw_interface_admin_up_down_functions);

      if (error)
        {
          /* restore flags on error */
          si->flags = old_flags;
          goto done;
        }

      if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
        {
          vnet_hw_interface_t *hi =
            vnet_get_hw_interface (vnm, si->hw_if_index);
          vnet_hw_interface_class_t *hw_class =
            vnet_get_hw_interface_class (vnm, hi->hw_class_index);
          vnet_device_class_t *dev_class =
            vnet_get_device_class (vnm, hi->dev_class_index);

          /* NOTE(review): this returns after si->flags was already updated
             above and after the admin up/down callbacks ran; the flags are
             not rolled back on this path - confirm that is intended. */
          if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
              (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
            {
              error = clib_error_return (0, "Interface in the error state");
              goto done;
            }

          /* Save the si flags.
             NOTE(review): at this point si->flags already contains the new
             masked bits, so the restores below only undo the "advance
             admin down" clear that follows, not the earlier update -
             confirm that is intended. */
          old_flags = si->flags;

          /* update si admin up flag in advance if we are going admin down */
          if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
            si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;

          /* Device class hook first, then the hw class hook. */
          if (dev_class->admin_up_down_function
              && (error = dev_class->admin_up_down_function (vnm,
                                                             si->hw_if_index,
                                                             flags)))
            {
              /* restore si flags to the value saved above on errors */
              si->flags = old_flags;
              goto done;
            }

          if (hw_class->admin_up_down_function
              && (error = hw_class->admin_up_down_function (vnm,
                                                            si->hw_if_index,
                                                            flags)))
            {
              /* restore si flags to the value saved above on errors */
              si->flags = old_flags;
              goto done;
            }

          /* Admin down implies link down.  The helper's return value is
             not examined here. */
          if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
              && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
            vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
                                                hi->flags &
                                                ~VNET_HW_INTERFACE_FLAG_LINK_UP,
                                                helper_flags);
        }
    }

  /* Final store of the masked flags; reached on both the create and the
     non-create success paths. */
  si->flags &= ~mask;
  si->flags |= flags;

done:
  return error;
}
539
540 clib_error_t *
541 vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index, u32 flags)
542 {
543   return vnet_hw_interface_set_flags_helper
544     (vnm, hw_if_index, flags,
545      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
546 }
547
548 clib_error_t *
549 vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index, u32 flags)
550 {
551   return vnet_sw_interface_set_flags_helper
552     (vnm, sw_if_index, flags,
553      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
554 }
555
556 static u32
557 vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
558                                        vnet_sw_interface_t * template)
559 {
560   vnet_interface_main_t *im = &vnm->interface_main;
561   vnet_sw_interface_t *sw;
562   u32 sw_if_index;
563
564   pool_get (im->sw_interfaces, sw);
565   sw_if_index = sw - im->sw_interfaces;
566
567   sw[0] = template[0];
568
569   sw->flags = 0;
570   sw->sw_if_index = sw_if_index;
571   if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
572     sw->sup_sw_if_index = sw->sw_if_index;
573
574   /* Allocate counters for this interface. */
575   {
576     u32 i;
577
578     vnet_interface_counter_lock (im);
579
580     for (i = 0; i < vec_len (im->sw_if_counters); i++)
581       {
582         vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
583         vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
584       }
585
586     for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
587       {
588         vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
589                                         sw_if_index);
590         vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
591                                     sw_if_index);
592       }
593
594     vnet_interface_counter_unlock (im);
595   }
596
597   return sw_if_index;
598 }
599
600 clib_error_t *
601 vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
602                           u32 * sw_if_index)
603 {
604   clib_error_t *error;
605   vnet_hw_interface_t *hi;
606   vnet_device_class_t *dev_class;
607
608   hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
609   dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
610
611   if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
612       dev_class->subif_add_del_function)
613     {
614       error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
615                                                  (struct vnet_sw_interface_t
616                                                   *) template, 1);
617       if (error)
618         return error;
619     }
620
621   *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
622   error = vnet_sw_interface_set_flags_helper
623     (vnm, *sw_if_index, template->flags,
624      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
625
626   if (error)
627     {
628       /* undo the work done by vnet_create_sw_interface_no_callbacks() */
629       vnet_interface_main_t *im = &vnm->interface_main;
630       vnet_sw_interface_t *sw =
631         pool_elt_at_index (im->sw_interfaces, *sw_if_index);
632       pool_put (im->sw_interfaces, sw);
633     }
634
635   return error;
636 }
637
638 void
639 vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
640 {
641   vnet_interface_main_t *im = &vnm->interface_main;
642   vnet_sw_interface_t *sw =
643     pool_elt_at_index (im->sw_interfaces, sw_if_index);
644
645   /* Check if the interface has config and is removed from L2 BD or XConnect */
646   vlib_main_t *vm = vlib_get_main ();
647   l2_input_config_t *config;
648   if (sw_if_index < vec_len (l2input_main.configs))
649     {
650       config = vec_elt_at_index (l2input_main.configs, sw_if_index);
651       if (config->xconnect)
652         set_int_l2_mode (vm, vnm, MODE_L3, config->output_sw_if_index, 0, 0,
653                          0, 0);
654       if (config->xconnect || config->bridge)
655         set_int_l2_mode (vm, vnm, MODE_L3, sw_if_index, 0, 0, 0, 0);
656     }
657   vnet_clear_sw_interface_tag (vnm, sw_if_index);
658
659   /* Bring down interface in case it is up. */
660   if (sw->flags != 0)
661     vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
662
663   call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
664
665   pool_put (im->sw_interfaces, sw);
666 }
667
668 static clib_error_t *
669 call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
670 {
671   return call_elf_section_interface_callbacks
672     (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
673 }
674
675 void
676 vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
677 {
678   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
679
680   if (si->mtu[VNET_MTU_L3] != mtu)
681     {
682       si->mtu[VNET_MTU_L3] = mtu;
683       call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
684     }
685 }
686
687 void
688 vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
689                                     u32 mtu[])
690 {
691   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
692   bool changed = false;
693   int i;
694
695   for (i = 0; i < VNET_N_MTU; i++)
696     {
697       if (si->mtu[i] != mtu[i])
698         {
699           si->mtu[i] = mtu[i];
700           changed = true;
701         }
702     }
703   /* Notify interested parties */
704   if (changed)
705     call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
706 }
707
708 void
709 vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
710                                          u32 sw_if_index, u8 enable)
711 {
712   vnet_sw_interface_t *si;
713
714   si = vnet_get_sw_interface (vnm, sw_if_index);
715
716   if (enable)
717     si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
718   else
719     si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
720
721   ip4_directed_broadcast (sw_if_index, enable);
722 }
723
724 /*
725  * Reflect a change in hardware MTU on protocol MTUs
726  */
727 static walk_rc_t
728 sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
729 {
730   u32 *link_mtu = ctx;
731   vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
732   return WALK_CONTINUE;
733 }
734
735 void
736 vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
737 {
738   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
739
740   if (hi->max_packet_bytes != mtu)
741     {
742       hi->max_packet_bytes = mtu;
743       ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
744       vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
745                                  &mtu);
746     }
747 }
748
749 static void
750 setup_tx_node (vlib_main_t * vm,
751                u32 node_index, vnet_device_class_t * dev_class)
752 {
753   vlib_node_t *n = vlib_get_node (vm, node_index);
754
755   n->function = dev_class->tx_function;
756   n->format_trace = dev_class->format_tx_trace;
757
758   vlib_register_errors (vm, node_index,
759                         dev_class->tx_function_n_errors,
760                         dev_class->tx_function_error_strings);
761 }
762
763 static void
764 setup_output_node (vlib_main_t * vm,
765                    u32 node_index, vnet_hw_interface_class_t * hw_class)
766 {
767   vlib_node_t *n = vlib_get_node (vm, node_index);
768   n->format_buffer = hw_class->format_header;
769   n->unformat_buffer = hw_class->unformat_header;
770 }
771
772 /* Register an interface instance. */
773 u32
774 vnet_register_interface (vnet_main_t * vnm,
775                          u32 dev_class_index,
776                          u32 dev_instance,
777                          u32 hw_class_index, u32 hw_instance)
778 {
779   vnet_interface_main_t *im = &vnm->interface_main;
780   vnet_hw_interface_t *hw;
781   vnet_device_class_t *dev_class =
782     vnet_get_device_class (vnm, dev_class_index);
783   vnet_hw_interface_class_t *hw_class =
784     vnet_get_hw_interface_class (vnm, hw_class_index);
785   vlib_main_t *vm = vnm->vlib_main;
786   vnet_feature_config_main_t *fcm;
787   vnet_config_main_t *cm;
788   u32 hw_index, i;
789   char *tx_node_name = NULL, *output_node_name = NULL;
790
791   pool_get (im->hw_interfaces, hw);
792   memset (hw, 0, sizeof (*hw));
793
794   hw_index = hw - im->hw_interfaces;
795   hw->hw_if_index = hw_index;
796   hw->default_rx_mode = VNET_HW_INTERFACE_RX_MODE_POLLING;
797
798   if (dev_class->format_device_name)
799     hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
800   else if (hw_class->format_interface_name)
801     hw->name = format (0, "%U", hw_class->format_interface_name,
802                        dev_instance);
803   else
804     hw->name = format (0, "%s%x", hw_class->name, dev_instance);
805
806   if (!im->hw_interface_by_name)
807     im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
808                                                 sizeof (hw->name[0]),
809                                                 sizeof (uword));
810
811   hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);
812
813   /* Make hardware interface point to software interface. */
814   {
815     vnet_sw_interface_t sw = {
816       .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
817       .flood_class = VNET_FLOOD_CLASS_NORMAL,
818       .hw_if_index = hw_index
819     };
820     hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
821   }
822
823   hw->dev_class_index = dev_class_index;
824   hw->dev_instance = dev_instance;
825   hw->hw_class_index = hw_class_index;
826   hw->hw_instance = hw_instance;
827
828   hw->max_rate_bits_per_sec = 0;
829   hw->min_packet_bytes = 0;
830   vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);
831
832   if (dev_class->tx_function == 0)
833     goto no_output_nodes;       /* No output/tx nodes to create */
834
835   tx_node_name = (char *) format (0, "%v-tx", hw->name);
836   output_node_name = (char *) format (0, "%v-output", hw->name);
837
838   /* If we have previously deleted interface nodes, re-use them. */
839   if (vec_len (im->deleted_hw_interface_nodes) > 0)
840     {
841       vnet_hw_interface_nodes_t *hn;
842       vlib_node_t *node;
843       vlib_node_runtime_t *nrt;
844
845       hn = vec_end (im->deleted_hw_interface_nodes) - 1;
846
847       hw->tx_node_index = hn->tx_node_index;
848       hw->output_node_index = hn->output_node_index;
849
850       vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
851       vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);
852
853       /* *INDENT-OFF* */
854       foreach_vlib_main ({
855         vnet_interface_output_runtime_t *rt;
856
857         rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
858         ASSERT (rt->is_deleted == 1);
859         rt->is_deleted = 0;
860         rt->hw_if_index = hw_index;
861         rt->sw_if_index = hw->sw_if_index;
862         rt->dev_instance = hw->dev_instance;
863
864         rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
865         rt->hw_if_index = hw_index;
866         rt->sw_if_index = hw->sw_if_index;
867         rt->dev_instance = hw->dev_instance;
868       });
869       /* *INDENT-ON* */
870
871       /* The new class may differ from the old one.
872        * Functions have to be updated. */
873       node = vlib_get_node (vm, hw->output_node_index);
874       node->function = vnet_interface_output_node_multiarch_select ();
875       node->format_trace = format_vnet_interface_output_trace;
876       /* *INDENT-OFF* */
877       foreach_vlib_main ({
878         nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
879         nrt->function = node->function;
880       });
881       /* *INDENT-ON* */
882
883       node = vlib_get_node (vm, hw->tx_node_index);
884       node->function = dev_class->tx_function;
885       node->format_trace = dev_class->format_tx_trace;
886       /* *INDENT-OFF* */
887       foreach_vlib_main ({
888         nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
889         nrt->function = node->function;
890       });
891       /* *INDENT-ON* */
892
893       _vec_len (im->deleted_hw_interface_nodes) -= 1;
894     }
895   else
896     {
897       vlib_node_registration_t r;
898       vnet_interface_output_runtime_t rt = {
899         .hw_if_index = hw_index,
900         .sw_if_index = hw->sw_if_index,
901         .dev_instance = hw->dev_instance,
902         .is_deleted = 0,
903       };
904
905       memset (&r, 0, sizeof (r));
906       r.type = VLIB_NODE_TYPE_INTERNAL;
907       r.runtime_data = &rt;
908       r.runtime_data_bytes = sizeof (rt);
909       r.scalar_size = 0;
910       r.vector_size = sizeof (u32);
911
912       r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
913       r.name = tx_node_name;
914       r.function = dev_class->tx_function;
915
916       hw->tx_node_index = vlib_register_node (vm, &r);
917
918       vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
919                                           "error-drop",
920                                           VNET_INTERFACE_TX_NEXT_DROP);
921
922       r.flags = 0;
923       r.name = output_node_name;
924       r.function = vnet_interface_output_node_multiarch_select ();
925       r.format_trace = format_vnet_interface_output_trace;
926
927       {
928         static char *e[] = {
929           "interface is down",
930           "interface is deleted",
931         };
932
933         r.n_errors = ARRAY_LEN (e);
934         r.error_strings = e;
935       }
936       hw->output_node_index = vlib_register_node (vm, &r);
937
938       vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
939                                           "error-drop",
940                                           VNET_INTERFACE_OUTPUT_NEXT_DROP);
941       vlib_node_add_next_with_slot (vm, hw->output_node_index,
942                                     hw->tx_node_index,
943                                     VNET_INTERFACE_OUTPUT_NEXT_TX);
944
945       /* add interface to the list of "output-interface" feature arc start nodes
946          and clone nexts from 1st interface if it exists */
947       fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
948       cm = &fcm->config_main;
949       i = vec_len (cm->start_node_indices);
950       vec_validate (cm->start_node_indices, i);
951       cm->start_node_indices[i] = hw->output_node_index;
952       if (hw_index)
953         {
954           /* copy nexts from 1st interface */
955           vnet_hw_interface_t *first_hw;
956           vlib_node_t *first_node;
957
958           first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
959           first_node = vlib_get_node (vm, first_hw->output_node_index);
960
961           /* 1st 2 nexts are already added above */
962           for (i = 2; i < vec_len (first_node->next_nodes); i++)
963             vlib_node_add_next_with_slot (vm, hw->output_node_index,
964                                           first_node->next_nodes[i], i);
965         }
966     }
967
968   setup_output_node (vm, hw->output_node_index, hw_class);
969   setup_tx_node (vm, hw->tx_node_index, dev_class);
970
971 no_output_nodes:
972   /* Call all up/down callbacks with zero flags when interface is created. */
973   vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
974                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
975   vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
976                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
977   vec_free (tx_node_name);
978   vec_free (output_node_name);
979
980   return hw_index;
981 }
982
983 void
984 vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
985 {
986   vnet_interface_main_t *im = &vnm->interface_main;
987   vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
988   vlib_main_t *vm = vnm->vlib_main;
989   vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
990                                                           hw->dev_class_index);
991   /* If it is up, mark it down. */
992   if (hw->flags != 0)
993     vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);
994
995   /* Call delete callbacks. */
996   call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);
997
998   /* Delete any sub-interfaces. */
999   {
1000     u32 id, sw_if_index;
1001     /* *INDENT-OFF* */
1002     hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
1003     ({
1004       vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1005       u64 sup_and_sub_key =
1006         ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
1007       hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
1008       vnet_delete_sw_interface (vnm, sw_if_index);
1009     }));
1010     hash_free (hw->sub_interface_sw_if_index_by_id);
1011     /* *INDENT-ON* */
1012   }
1013
1014   /* Delete software interface corresponding to hardware interface. */
1015   vnet_delete_sw_interface (vnm, hw->sw_if_index);
1016
1017   if (dev_class->tx_function)
1018     {
1019       /* Put output/tx nodes into recycle pool */
1020       vnet_hw_interface_nodes_t *dn;
1021
1022       /* *INDENT-OFF* */
1023       foreach_vlib_main
1024         ({
1025           vnet_interface_output_runtime_t *rt =
1026             vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
1027
1028           /* Mark node runtime as deleted so output node (if called)
1029            * will drop packets. */
1030           rt->is_deleted = 1;
1031         });
1032       /* *INDENT-ON* */
1033
1034       vlib_node_rename (vm, hw->output_node_index,
1035                         "interface-%d-output-deleted", hw_if_index);
1036       vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
1037                         hw_if_index);
1038       vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
1039       dn->tx_node_index = hw->tx_node_index;
1040       dn->output_node_index = hw->output_node_index;
1041     }
1042
1043   hash_unset_mem (im->hw_interface_by_name, hw->name);
1044   vec_free (hw->name);
1045   vec_free (hw->hw_address);
1046   vec_free (hw->input_node_thread_index_by_queue);
1047   vec_free (hw->dq_runtime_index_by_queue);
1048
1049   pool_put (im->hw_interfaces, hw);
1050 }
1051
1052 void
1053 vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1054                            u32 hw_if_index,
1055                            vnet_hw_sw_interface_walk_t fn, void *ctx)
1056 {
1057   vnet_hw_interface_t *hi;
1058   u32 id, sw_if_index;
1059
1060   hi = vnet_get_hw_interface (vnm, hw_if_index);
1061   /* the super first, then the sub interfaces */
1062   if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1063     return;
1064
1065   /* *INDENT-OFF* */
1066   hash_foreach (id, sw_if_index,
1067                 hi->sub_interface_sw_if_index_by_id,
1068   ({
1069     if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1070       break;
1071   }));
1072   /* *INDENT-ON* */
1073 }
1074
1075 void
1076 vnet_hw_interface_walk (vnet_main_t * vnm,
1077                         vnet_hw_interface_walk_t fn, void *ctx)
1078 {
1079   vnet_interface_main_t *im;
1080   vnet_hw_interface_t *hi;
1081
1082   im = &vnm->interface_main;
1083
1084   /* *INDENT-OFF* */
1085   pool_foreach (hi, im->hw_interfaces,
1086   ({
1087     if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1088       break;
1089   }));
1090   /* *INDENT-ON* */
1091 }
1092
1093 void
1094 vnet_sw_interface_walk (vnet_main_t * vnm,
1095                         vnet_sw_interface_walk_t fn, void *ctx)
1096 {
1097   vnet_interface_main_t *im;
1098   vnet_sw_interface_t *si;
1099
1100   im = &vnm->interface_main;
1101
1102   /* *INDENT-OFF* */
1103   pool_foreach (si, im->sw_interfaces,
1104   {
1105     if (WALK_STOP == fn (vnm, si, ctx))
1106       break;
1107   });
1108   /* *INDENT-ON* */
1109 }
1110
1111 static void
1112 serialize_vnet_hw_interface_set_class (serialize_main_t * m, va_list * va)
1113 {
1114   u32 hw_if_index = va_arg (*va, u32);
1115   char *hw_class_name = va_arg (*va, char *);
1116   serialize_integer (m, hw_if_index, sizeof (hw_if_index));
1117   serialize_cstring (m, hw_class_name);
1118 }
1119
1120 static void
1121 unserialize_vnet_hw_interface_set_class (serialize_main_t * m, va_list * va)
1122 {
1123   CLIB_UNUSED (mc_main_t * mc) = va_arg (*va, mc_main_t *);
1124   vnet_main_t *vnm = vnet_get_main ();
1125   u32 hw_if_index;
1126   char *hw_class_name;
1127   uword *p;
1128   clib_error_t *error;
1129
1130   unserialize_integer (m, &hw_if_index, sizeof (hw_if_index));
1131   unserialize_cstring (m, &hw_class_name);
1132   p =
1133     hash_get (vnm->interface_main.hw_interface_class_by_name, hw_class_name);
1134   ASSERT (p != 0);
1135   error = vnet_hw_interface_set_class_helper (vnm, hw_if_index, p[0],
1136                                               /* redistribute */ 0);
1137   if (error)
1138     clib_error_report (error);
1139 }
1140
1141 MC_SERIALIZE_MSG (vnet_hw_interface_set_class_msg, static) =
1142 {
1143 .name = "vnet_hw_interface_set_class",.serialize =
1144     serialize_vnet_hw_interface_set_class,.unserialize =
1145     unserialize_vnet_hw_interface_set_class,};
1146
1147 void
1148 vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1149                                   u32 hw_class_index, u32 hw_instance)
1150 {
1151   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1152   vnet_hw_interface_class_t *hc =
1153     vnet_get_hw_interface_class (vnm, hw_class_index);
1154
1155   hi->hw_class_index = hw_class_index;
1156   hi->hw_instance = hw_instance;
1157   setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1158 }
1159
1160 static clib_error_t *
1161 vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1162                                     u32 hw_class_index, u32 redistribute)
1163 {
1164   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1165   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1166   vnet_hw_interface_class_t *old_class =
1167     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1168   vnet_hw_interface_class_t *new_class =
1169     vnet_get_hw_interface_class (vnm, hw_class_index);
1170   vnet_device_class_t *dev_class =
1171     vnet_get_device_class (vnm, hi->dev_class_index);
1172   clib_error_t *error = 0;
1173
1174   /* New class equals old class?  Nothing to do. */
1175   if (hi->hw_class_index == hw_class_index)
1176     return 0;
1177
1178   /* No need (and incorrect since admin up flag may be set) to do error checking when
1179      receiving unserialize message. */
1180   if (redistribute)
1181     {
1182       if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1183         return clib_error_return (0,
1184                                   "%v must be admin down to change class from %s to %s",
1185                                   hi->name, old_class->name, new_class->name);
1186
1187       /* Make sure interface supports given class. */
1188       if ((new_class->is_valid_class_for_interface
1189            && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1190                                                         hw_class_index))
1191           || (dev_class->is_valid_class_for_interface
1192               && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1193                                                            hw_class_index)))
1194         return clib_error_return (0,
1195                                   "%v class cannot be changed from %s to %s",
1196                                   hi->name, old_class->name, new_class->name);
1197
1198       if (vnm->vlib_main->mc_main)
1199         {
1200           mc_serialize (vnm->vlib_main->mc_main,
1201                         &vnet_hw_interface_set_class_msg, hw_if_index,
1202                         new_class->name);
1203           return 0;
1204         }
1205     }
1206
1207   if (old_class->hw_class_change)
1208     old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1209                                 new_class->index);
1210
1211   vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1212                                     /* instance */ ~0);
1213
1214   if (new_class->hw_class_change)
1215     new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1216                                 new_class->index);
1217
1218   if (dev_class->hw_class_change)
1219     dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1220
1221   return error;
1222 }
1223
1224 clib_error_t *
1225 vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1226                              u32 hw_class_index)
1227 {
1228   return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1229                                              /* redistribute */ 1);
1230 }
1231
1232 static int
1233 vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1234                                               u32 hw_if_index,
1235                                               u32 node_index,
1236                                               u32 redistribute)
1237 {
1238   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1239   vnet_device_class_t *dev_class = vnet_get_device_class
1240     (vnm, hi->dev_class_index);
1241
1242   if (redistribute)
1243     {
1244       /* $$$$ fixme someday maybe */
1245       ASSERT (vnm->vlib_main->mc_main == 0);
1246     }
1247   if (dev_class->rx_redirect_to_node)
1248     {
1249       dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1250       return 0;
1251     }
1252
1253   return VNET_API_ERROR_UNIMPLEMENTED;
1254 }
1255
1256 int
1257 vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1258                                        u32 node_index)
1259 {
1260   return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1261                                                        node_index,
1262                                                        1 /* redistribute */ );
1263 }
1264
1265 word
1266 vnet_sw_interface_compare (vnet_main_t * vnm,
1267                            uword sw_if_index0, uword sw_if_index1)
1268 {
1269   vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1270   vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1271   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1272   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1273
1274   if (h0 != h1)
1275     return vec_cmp (h0->name, h1->name);
1276   return (word) h0->hw_instance - (word) h1->hw_instance;
1277 }
1278
1279 word
1280 vnet_hw_interface_compare (vnet_main_t * vnm,
1281                            uword hw_if_index0, uword hw_if_index1)
1282 {
1283   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1284   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1285
1286   if (h0 != h1)
1287     return vec_cmp (h0->name, h1->name);
1288   return (word) h0->hw_instance - (word) h1->hw_instance;
1289 }
1290
1291 int
1292 vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1293 {
1294   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1295   if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1296       (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1297     return 1;
1298
1299   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1300   vnet_hw_interface_class_t *hc =
1301     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1302
1303   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1304 }
1305
1306 clib_error_t *
1307 vnet_interface_init (vlib_main_t * vm)
1308 {
1309   vnet_main_t *vnm = vnet_get_main ();
1310   vnet_interface_main_t *im = &vnm->interface_main;
1311   vlib_buffer_t *b = 0;
1312   vnet_buffer_opaque_t *o = 0;
1313   clib_error_t *error;
1314
1315   /*
1316    * Keep people from shooting themselves in the foot.
1317    */
1318   if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
1319     {
1320 #define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
1321       clib_warning                                                      \
1322         ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
1323          #a, sizeof(o->a), sizeof (o->unused));
1324       foreach_buffer_opaque_union_subtype;
1325 #undef _
1326
1327       return clib_error_return
1328         (0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
1329          sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
1330     }
1331
1332   im->sw_if_counter_lock = clib_mem_alloc_aligned (CLIB_CACHE_LINE_BYTES,
1333                                                    CLIB_CACHE_LINE_BYTES);
1334   im->sw_if_counter_lock[0] = 1;        /* should be no need */
1335
1336   vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
1337 #define _(E,n,p)                                                        \
1338   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;             \
1339   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1340   foreach_simple_interface_counter_name
1341 #undef _
1342     vec_validate (im->combined_sw_if_counters,
1343                   VNET_N_COMBINED_INTERFACE_COUNTER - 1);
1344 #define _(E,n,p)                                                        \
1345   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;    \
1346   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1347   foreach_combined_interface_counter_name
1348 #undef _
1349     im->sw_if_counter_lock[0] = 0;
1350
1351   im->device_class_by_name = hash_create_string ( /* size */ 0,
1352                                                  sizeof (uword));
1353   {
1354     vnet_device_class_t *c;
1355
1356     c = vnm->device_class_registrations;
1357
1358     while (c)
1359       {
1360         c->index = vec_len (im->device_classes);
1361         hash_set_mem (im->device_class_by_name, c->name, c->index);
1362         vec_add1 (im->device_classes, c[0]);
1363         c = c->next_class_registration;
1364       }
1365   }
1366
1367   im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
1368                                                        sizeof (uword));
1369
1370   im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
1371                                                     sizeof (uword));
1372   {
1373     vnet_hw_interface_class_t *c;
1374
1375     c = vnm->hw_interface_class_registrations;
1376
1377     while (c)
1378       {
1379         c->index = vec_len (im->hw_interface_classes);
1380         hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);
1381
1382         if (NULL == c->build_rewrite)
1383           c->build_rewrite = default_build_rewrite;
1384         if (NULL == c->update_adjacency)
1385           c->update_adjacency = default_update_adjacency;
1386
1387         vec_add1 (im->hw_interface_classes, c[0]);
1388         c = c->next_class_registration;
1389       }
1390   }
1391
1392   if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
1393     return error;
1394
1395   vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));
1396
1397 #if VLIB_BUFFER_TRACE_TRAJECTORY > 0
1398   if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
1399     return error;
1400 #endif
1401
1402   return 0;
1403 }
1404
1405 VLIB_INIT_FUNCTION (vnet_interface_init);
1406
1407 /* Kludge to renumber interface names [only!] */
1408 int
1409 vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1410 {
1411   int rv;
1412   vnet_main_t *vnm = vnet_get_main ();
1413   vnet_interface_main_t *im = &vnm->interface_main;
1414   vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1415
1416   vnet_device_class_t *dev_class = vnet_get_device_class
1417     (vnm, hi->dev_class_index);
1418
1419   if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1420     return VNET_API_ERROR_UNIMPLEMENTED;
1421
1422   rv = dev_class->name_renumber (hi, new_show_dev_instance);
1423
1424   if (rv)
1425     return rv;
1426
1427   hash_unset_mem (im->hw_interface_by_name, hi->name);
1428   vec_free (hi->name);
1429   /* Use the mapping we set up to call it Ishmael */
1430   hi->name = format (0, "%U", dev_class->format_device_name,
1431                      hi->dev_instance);
1432
1433   hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1434   return rv;
1435 }
1436
1437 clib_error_t *
1438 vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1439 {
1440   vnet_interface_main_t *im = &vnm->interface_main;
1441   vlib_main_t *vm = vnm->vlib_main;
1442   vnet_hw_interface_t *hw;
1443   u8 *old_name;
1444   clib_error_t *error = 0;
1445
1446   hw = vnet_get_hw_interface (vnm, hw_if_index);
1447   if (!hw)
1448     {
1449       return clib_error_return (0,
1450                                 "unable to find hw interface for index %u",
1451                                 hw_if_index);
1452     }
1453
1454   old_name = hw->name;
1455
1456   /* set new hw->name */
1457   hw->name = format (0, "%s", new_name);
1458
1459   /* remove the old name to hw_if_index mapping and install the new one */
1460   hash_unset_mem (im->hw_interface_by_name, old_name);
1461   hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1462
1463   /* rename tx/output nodes */
1464   vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1465   vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1466
1467   /* free the old name vector */
1468   vec_free (old_name);
1469
1470   return error;
1471 }
1472
1473 static clib_error_t *
1474 vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1475                                              u32 hw_if_index,
1476                                              u8 * mac_address)
1477 {
1478   clib_error_t *error = 0;
1479   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1480
1481   if (hi->hw_address)
1482     {
1483       vnet_device_class_t *dev_class =
1484         vnet_get_device_class (vnm, hi->dev_class_index);
1485       if (dev_class->mac_addr_change_function)
1486         {
1487           error =
1488             dev_class->mac_addr_change_function (hi, (char *) mac_address);
1489         }
1490       if (!error)
1491         {
1492           vnet_hw_interface_class_t *hw_class;
1493
1494           hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1495
1496           if (NULL != hw_class->mac_addr_change_function)
1497             hw_class->mac_addr_change_function (hi, (char *) mac_address);
1498         }
1499       else
1500         {
1501           error =
1502             clib_error_return (0,
1503                                "MAC Address Change is not supported on this interface");
1504         }
1505     }
1506   else
1507     {
1508       error =
1509         clib_error_return (0,
1510                            "mac address change is not supported for interface index %u",
1511                            hw_if_index);
1512     }
1513   return error;
1514 }
1515
1516 clib_error_t *
1517 vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1518                                       u8 * mac_address)
1519 {
1520   return vnet_hw_interface_change_mac_address_helper
1521     (vnm, hw_if_index, mac_address);
1522 }
1523
1524 /* update the unnumbered state of an interface*/
1525 void
1526 vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1527                                      u32 ip_sw_if_index, u8 enable)
1528 {
1529   vnet_main_t *vnm = vnet_get_main ();
1530   vnet_sw_interface_t *si;
1531   u32 was_unnum;
1532
1533   si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1534   was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1535
1536   if (enable)
1537     {
1538       si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1539       si->unnumbered_sw_if_index = ip_sw_if_index;
1540
1541       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1542         [unnumbered_sw_if_index] =
1543         ip4_main.
1544         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1545       ip6_main.
1546         lookup_main.if_address_pool_index_by_sw_if_index
1547         [unnumbered_sw_if_index] =
1548         ip6_main.
1549         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1550     }
1551   else
1552     {
1553       si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1554       si->unnumbered_sw_if_index = (u32) ~ 0;
1555
1556       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1557         [unnumbered_sw_if_index] = ~0;
1558       ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1559         [unnumbered_sw_if_index] = ~0;
1560     }
1561
1562   if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1563     {
1564       ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1565       ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1566     }
1567 }
1568
1569 vnet_l3_packet_type_t
1570 vnet_link_to_l3_proto (vnet_link_t link)
1571 {
1572   switch (link)
1573     {
1574     case VNET_LINK_IP4:
1575       return (VNET_L3_PACKET_TYPE_IP4);
1576     case VNET_LINK_IP6:
1577       return (VNET_L3_PACKET_TYPE_IP6);
1578     case VNET_LINK_MPLS:
1579       return (VNET_L3_PACKET_TYPE_MPLS);
1580     case VNET_LINK_ARP:
1581       return (VNET_L3_PACKET_TYPE_ARP);
1582     case VNET_LINK_ETHERNET:
1583     case VNET_LINK_NSH:
1584       ASSERT (0);
1585       break;
1586     }
1587   ASSERT (0);
1588   return (0);
1589 }
1590
1591 vnet_mtu_t
1592 vnet_link_to_mtu (vnet_link_t link)
1593 {
1594   switch (link)
1595     {
1596     case VNET_LINK_IP4:
1597       return (VNET_MTU_IP4);
1598     case VNET_LINK_IP6:
1599       return (VNET_MTU_IP6);
1600     case VNET_LINK_MPLS:
1601       return (VNET_MTU_MPLS);
1602     default:
1603       return (VNET_MTU_L3);
1604     }
1605 }
1606
1607 u8 *
1608 default_build_rewrite (vnet_main_t * vnm,
1609                        u32 sw_if_index,
1610                        vnet_link_t link_type, const void *dst_address)
1611 {
1612   return (NULL);
1613 }
1614
1615 void
1616 default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1617 {
1618   ip_adjacency_t *adj;
1619
1620   adj = adj_get (ai);
1621
1622   switch (adj->lookup_next_index)
1623     {
1624     case IP_LOOKUP_NEXT_GLEAN:
1625       adj_glean_update_rewrite (ai);
1626       break;
1627     case IP_LOOKUP_NEXT_ARP:
1628     case IP_LOOKUP_NEXT_BCAST:
1629       /*
1630        * default rewirte in neighbour adj
1631        */
1632       adj_nbr_update_rewrite
1633         (ai,
1634          ADJ_NBR_REWRITE_FLAG_COMPLETE,
1635          vnet_build_rewrite_for_sw_interface (vnm,
1636                                               sw_if_index,
1637                                               adj_get_link_type (ai), NULL));
1638       break;
1639     case IP_LOOKUP_NEXT_MCAST:
1640       /*
1641        * mcast traffic also uses default rewrite string with no mcast
1642        * switch time updates.
1643        */
1644       adj_mcast_update_rewrite
1645         (ai,
1646          vnet_build_rewrite_for_sw_interface (vnm,
1647                                               sw_if_index,
1648                                               adj_get_link_type (ai),
1649                                               NULL), 0);
1650       break;
1651     case IP_LOOKUP_NEXT_DROP:
1652     case IP_LOOKUP_NEXT_PUNT:
1653     case IP_LOOKUP_NEXT_LOCAL:
1654     case IP_LOOKUP_NEXT_REWRITE:
1655     case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1656     case IP_LOOKUP_NEXT_MIDCHAIN:
1657     case IP_LOOKUP_NEXT_ICMP_ERROR:
1658     case IP_LOOKUP_N_NEXT:
1659       ASSERT (0);
1660       break;
1661     }
1662 }
1663
/* Global switch for detailed interface statistics: 1 = on, 0 = off. */
int collect_detailed_interface_stats_flag = 0;

/* Store the requested on/off state in the global switch. */
static inline void
collect_detailed_interface_stats_flag_store (int is_on)
{
  collect_detailed_interface_stats_flag = is_on;
}

/* Turn detailed interface statistics on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_store (1);
}

/* Turn detailed interface statistics off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_store (0);
}
1677
1678 static clib_error_t *
1679 collect_detailed_interface_stats_cli (vlib_main_t * vm,
1680                                       unformat_input_t * input,
1681                                       vlib_cli_command_t * cmd)
1682 {
1683   unformat_input_t _line_input, *line_input = &_line_input;
1684   clib_error_t *error = NULL;
1685
1686   /* Get a line of input. */
1687   if (!unformat_user (input, unformat_line_input, line_input))
1688     return clib_error_return (0, "expected enable | disable");
1689
1690   while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1691     {
1692       if (unformat (line_input, "enable") || unformat (line_input, "on"))
1693         collect_detailed_interface_stats_flag_set ();
1694       else if (unformat (line_input, "disable")
1695                || unformat (line_input, "off"))
1696         collect_detailed_interface_stats_flag_clear ();
1697       else
1698         {
1699           error = clib_error_return (0, "unknown input `%U'",
1700                                      format_unformat_error, line_input);
1701           goto done;
1702         }
1703     }
1704
1705 done:
1706   unformat_free (line_input);
1707   return error;
1708 }
1709
1710 /* *INDENT-OFF* */
1711 VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
1712   .path = "interface collect detailed-stats",
1713   .short_help = "interface collect detailed-stats <enable|disable>",
1714   .function = collect_detailed_interface_stats_cli,
1715 };
1716 /* *INDENT-ON* */
1717
1718 /*
1719  * fd.io coding-style-patch-verification: ON
1720  *
1721  * Local Variables:
1722  * eval: (c-set-style "gnu")
1723  * End:
1724  */