5ee3a74fe0bd9ddabd512a454ec408dd1ffef745
[vpp.git] / src / vnet / interface.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.c: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #include <vnet/vnet.h>
41 #include <vnet/plugin/plugin.h>
42 #include <vnet/fib/ip6_fib.h>
43 #include <vnet/adj/adj.h>
44 #include <vnet/adj/adj_mcast.h>
45 #include <vnet/l2/l2_input.h>
46
/*
 * Internal modifiers passed to the hw/sw set-flags helpers in this file.
 * They are bit flags and may be OR-ed together.
 */
typedef enum vnet_interface_helper_flags_t_
{
  /* The interface is being created: the helpers run the add/del
     callbacks and do not take the "already in desired state" shortcut. */
  VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE = (1 << 0),
  /* Passed by the public set-flags entry points; the sw helper clears it
     when the supporting device class does not redistribute. */
  VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE = (1 << 1),
} vnet_interface_helper_flags_t;
52
/*
 * Forward declarations: the (un)serialize routines below call these
 * helpers before their definitions appear.
 */

/* Apply link-up/duplex flags to a hardware interface. */
static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
                                                         u32 hw_if_index,
                                                         vnet_hw_interface_flags_t
                                                         flags,
                                                         vnet_interface_helper_flags_t
                                                         helper_flags);

/* Apply admin-up/punt flags to a software interface. */
static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
                                                         u32 sw_if_index,
                                                         vnet_sw_interface_flags_t
                                                         flags,
                                                         vnet_interface_helper_flags_t
                                                         helper_flags);

/* Change the hardware class of a hardware interface (defined outside
   the portion of the file that declares it here). */
static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
                                                         u32 hw_if_index,
                                                         u32 hw_class_index,
                                                         u32 redistribute);
71
/*
 * One (interface index, flags) record as exchanged by the interface
 * state serialize/unserialize routines.  The same record type is used
 * for both the software and the hardware interface vectors.
 */
typedef struct
{
  /* Either sw or hw interface index. */
  u32 sw_hw_if_index;

  /* Flags.  For hardware interfaces the serializer stores the hw flags
     translated to their sw equivalent. */
  u32 flags;
} vnet_sw_hw_interface_state_t;
80
81 static void
82 serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
83 {
84   vnet_sw_hw_interface_state_t *s =
85     va_arg (*va, vnet_sw_hw_interface_state_t *);
86   u32 n = va_arg (*va, u32);
87   u32 i;
88   for (i = 0; i < n; i++)
89     {
90       serialize_integer (m, s[i].sw_hw_if_index,
91                          sizeof (s[i].sw_hw_if_index));
92       serialize_integer (m, s[i].flags, sizeof (s[i].flags));
93     }
94 }
95
96 static void
97 unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
98                                             va_list * va)
99 {
100   vnet_sw_hw_interface_state_t *s =
101     va_arg (*va, vnet_sw_hw_interface_state_t *);
102   u32 n = va_arg (*va, u32);
103   u32 i;
104   for (i = 0; i < n; i++)
105     {
106       unserialize_integer (m, &s[i].sw_hw_if_index,
107                            sizeof (s[i].sw_hw_if_index));
108       unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
109     }
110 }
111
112 static vnet_sw_interface_flags_t
113 vnet_hw_interface_flags_to_sw (vnet_hw_interface_flags_t hwf)
114 {
115   vnet_sw_interface_flags_t swf = VNET_SW_INTERFACE_FLAG_NONE;
116
117   if (hwf & VNET_HW_INTERFACE_FLAG_LINK_UP)
118     swf |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
119
120   return (swf);
121 }
122
123 void
124 serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
125 {
126   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
127   vnet_sw_hw_interface_state_t *sts = 0, *st;
128   vnet_sw_interface_t *sif;
129   vnet_hw_interface_t *hif;
130   vnet_interface_main_t *im = &vnm->interface_main;
131
132   /* Serialize hardware interface classes since they may have changed.
133      Must do this before sending up/down flags. */
134   /* *INDENT-OFF* */
135   pool_foreach (hif, im->hw_interfaces, ({
136     vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
137     serialize_cstring (m, hw_class->name);
138   }));
139   /* *INDENT-ON* */
140
141   /* Send sw/hw interface state when non-zero. */
142   /* *INDENT-OFF* */
143   pool_foreach (sif, im->sw_interfaces, ({
144     if (sif->flags != 0)
145       {
146         vec_add2 (sts, st, 1);
147         st->sw_hw_if_index = sif->sw_if_index;
148         st->flags = sif->flags;
149       }
150   }));
151   /* *INDENT-ON* */
152
153   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
154
155   if (sts)
156     _vec_len (sts) = 0;
157
158   /* *INDENT-OFF* */
159   pool_foreach (hif, im->hw_interfaces, ({
160     if (hif->flags != 0)
161       {
162         vec_add2 (sts, st, 1);
163         st->sw_hw_if_index = hif->hw_if_index;
164         st->flags = vnet_hw_interface_flags_to_sw(hif->flags);
165       }
166   }));
167   /* *INDENT-ON* */
168
169   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
170
171   vec_free (sts);
172 }
173
174 static vnet_hw_interface_flags_t
175 vnet_sw_interface_flags_to_hw (vnet_sw_interface_flags_t swf)
176 {
177   vnet_hw_interface_flags_t hwf = VNET_HW_INTERFACE_FLAG_NONE;
178
179   if (swf & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
180     hwf |= VNET_HW_INTERFACE_FLAG_LINK_UP;
181
182   return (hwf);
183 }
184
185 void
186 unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
187 {
188   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
189   vnet_sw_hw_interface_state_t *sts = 0, *st;
190
191   /* First set interface hardware class. */
192   {
193     vnet_interface_main_t *im = &vnm->interface_main;
194     vnet_hw_interface_t *hif;
195     char *class_name;
196     uword *p;
197     clib_error_t *error;
198
199     /* *INDENT-OFF* */
200     pool_foreach (hif, im->hw_interfaces, ({
201       unserialize_cstring (m, &class_name);
202       p = hash_get_mem (im->hw_interface_class_by_name, class_name);
203       ASSERT (p != 0);
204       error = vnet_hw_interface_set_class_helper (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
205       if (error)
206         clib_error_report (error);
207       vec_free (class_name);
208     }));
209     /* *INDENT-ON* */
210   }
211
212   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
213   vec_foreach (st, sts)
214     vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
215                                         /* no distribute */ 0);
216   vec_free (sts);
217
218   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
219   vec_foreach (st, sts)
220   {
221     vnet_hw_interface_set_flags_helper
222       (vnm, st->sw_hw_if_index, vnet_sw_interface_flags_to_hw (st->flags),
223        /* no distribute */ 0);
224   }
225   vec_free (sts);
226 }
227
228 static clib_error_t *
229 call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
230                                       u32 flags,
231                                       _vnet_interface_function_list_elt_t **
232                                       elts)
233 {
234   _vnet_interface_function_list_elt_t *elt;
235   vnet_interface_function_priority_t prio;
236   clib_error_t *error = 0;
237
238   for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
239        prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
240     {
241       elt = elts[prio];
242
243       while (elt)
244         {
245           error = elt->fp (vnm, if_index, flags);
246           if (error)
247             return error;
248           elt = elt->next_interface_function;
249         }
250     }
251   return error;
252 }
253
254 static clib_error_t *
255 call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
256                                      u32 is_create)
257 {
258   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
259   vnet_hw_interface_class_t *hw_class =
260     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
261   vnet_device_class_t *dev_class =
262     vnet_get_device_class (vnm, hi->dev_class_index);
263   clib_error_t *error = 0;
264
265   if (hw_class->interface_add_del_function
266       && (error =
267           hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
268     return error;
269
270   if (dev_class->interface_add_del_function
271       && (error =
272           dev_class->interface_add_del_function (vnm, hw_if_index,
273                                                  is_create)))
274     return error;
275
276   error = call_elf_section_interface_callbacks
277     (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
278
279   return error;
280 }
281
282 static clib_error_t *
283 call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
284                                      u32 is_create)
285 {
286   return call_elf_section_interface_callbacks
287     (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
288 }
289
290 static clib_error_t *
291 vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
292                                     vnet_hw_interface_flags_t flags,
293                                     vnet_interface_helper_flags_t
294                                     helper_flags)
295 {
296   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
297   vnet_hw_interface_class_t *hw_class =
298     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
299   u32 mask;
300   clib_error_t *error = 0;
301   u32 is_create =
302     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
303
304   mask =
305     (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK);
306   flags &= mask;
307
308   /* Call hardware interface add/del callbacks. */
309   if (is_create)
310     call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
311
312   /* Already in the desired state? */
313   if (!is_create && (hi->flags & mask) == flags)
314     goto done;
315
316   if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
317       (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
318     {
319       /* Do hardware class (e.g. ethernet). */
320       if (hw_class->link_up_down_function
321           && (error = hw_class->link_up_down_function (vnm, hw_if_index,
322                                                        flags)))
323         goto done;
324
325       error = call_elf_section_interface_callbacks
326         (vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
327
328       if (error)
329         goto done;
330     }
331
332   hi->flags &= ~mask;
333   hi->flags |= flags;
334
335 done:
336   return error;
337 }
338
339 static clib_error_t *
340 vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
341                                     vnet_sw_interface_flags_t flags,
342                                     vnet_interface_helper_flags_t
343                                     helper_flags)
344 {
345   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
346   u32 mask;
347   clib_error_t *error = 0;
348   u32 is_create =
349     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
350   u32 old_flags;
351
352   mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
353   flags &= mask;
354
355   if (is_create)
356     {
357       error =
358         call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
359       if (error)
360         goto done;
361
362       if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
363         {
364           /* Notify everyone when the interface is created as admin up */
365           error = call_elf_section_interface_callbacks (vnm, sw_if_index,
366                                                         flags,
367                                                         vnm->
368                                                         sw_interface_admin_up_down_functions);
369           if (error)
370             goto done;
371         }
372     }
373   else
374     {
375       vnet_sw_interface_t *si_sup = si;
376
377       /* Check that super interface is in correct state. */
378       if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
379         {
380           si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);
381
382           /* Check to see if we're bringing down the soft interface and if it's parent is up */
383           if ((flags != (si_sup->flags & mask)) &&
384               (!((flags == 0)
385                  && ((si_sup->flags & mask) ==
386                      VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
387             {
388               error = clib_error_return (0, "super-interface %U must be %U",
389                                          format_vnet_sw_interface_name, vnm,
390                                          si_sup,
391                                          format_vnet_sw_interface_flags,
392                                          flags);
393               goto done;
394             }
395         }
396
397       /* Already in the desired state? */
398       if ((si->flags & mask) == flags)
399         goto done;
400
401       /* Sub-interfaces of hardware interfaces that do no redistribute,
402          do not redistribute themselves. */
403       if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
404         {
405           vnet_hw_interface_t *hi =
406             vnet_get_hw_interface (vnm, si_sup->hw_if_index);
407           vnet_device_class_t *dev_class =
408             vnet_get_device_class (vnm, hi->dev_class_index);
409           if (!dev_class->redistribute)
410             helper_flags &=
411               ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
412         }
413
414       /* set the flags now before invoking the registered clients
415        * so that the state they query is consistent with the state here notified */
416       old_flags = si->flags;
417       si->flags &= ~mask;
418       si->flags |= flags;
419       if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
420         error = call_elf_section_interface_callbacks
421           (vnm, sw_if_index, flags,
422            vnm->sw_interface_admin_up_down_functions);
423
424       if (error)
425         {
426           /* restore flags on error */
427           si->flags = old_flags;
428           goto done;
429         }
430
431       if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
432         {
433           vnet_hw_interface_t *hi =
434             vnet_get_hw_interface (vnm, si->hw_if_index);
435           vnet_hw_interface_class_t *hw_class =
436             vnet_get_hw_interface_class (vnm, hi->hw_class_index);
437           vnet_device_class_t *dev_class =
438             vnet_get_device_class (vnm, hi->dev_class_index);
439
440           if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
441               (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
442             {
443               error = clib_error_return (0, "Interface in the error state");
444               goto done;
445             }
446
447           /* save the si admin up flag */
448           old_flags = si->flags;
449
450           /* update si admin up flag in advance if we are going admin down */
451           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
452             si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;
453
454           if (dev_class->admin_up_down_function
455               && (error = dev_class->admin_up_down_function (vnm,
456                                                              si->hw_if_index,
457                                                              flags)))
458             {
459               /* restore si admin up flag to it's original state on errors */
460               si->flags = old_flags;
461               goto done;
462             }
463
464           if (hw_class->admin_up_down_function
465               && (error = hw_class->admin_up_down_function (vnm,
466                                                             si->hw_if_index,
467                                                             flags)))
468             {
469               /* restore si admin up flag to it's original state on errors */
470               si->flags = old_flags;
471               goto done;
472             }
473
474           /* Admin down implies link down. */
475           if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
476               && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
477             vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
478                                                 hi->flags &
479                                                 ~VNET_HW_INTERFACE_FLAG_LINK_UP,
480                                                 helper_flags);
481         }
482     }
483
484   si->flags &= ~mask;
485   si->flags |= flags;
486
487 done:
488   return error;
489 }
490
491 clib_error_t *
492 vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index,
493                              vnet_hw_interface_flags_t flags)
494 {
495   return vnet_hw_interface_set_flags_helper
496     (vnm, hw_if_index, flags,
497      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
498 }
499
500 clib_error_t *
501 vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index,
502                              vnet_sw_interface_flags_t flags)
503 {
504   return vnet_sw_interface_set_flags_helper
505     (vnm, sw_if_index, flags,
506      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
507 }
508
509 void
510 vnet_sw_interface_admin_up (vnet_main_t * vnm, u32 sw_if_index)
511 {
512   u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
513
514   if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
515     {
516       flags |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
517       vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
518     }
519 }
520
521 void
522 vnet_sw_interface_admin_down (vnet_main_t * vnm, u32 sw_if_index)
523 {
524   u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
525
526   if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
527     {
528       flags &= ~(VNET_SW_INTERFACE_FLAG_ADMIN_UP);
529       vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
530     }
531 }
532
533 static u32
534 vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
535                                        vnet_sw_interface_t * template)
536 {
537   vnet_interface_main_t *im = &vnm->interface_main;
538   vnet_sw_interface_t *sw;
539   u32 sw_if_index;
540
541   pool_get (im->sw_interfaces, sw);
542   sw_if_index = sw - im->sw_interfaces;
543
544   sw[0] = template[0];
545
546   sw->flags = 0;
547   sw->sw_if_index = sw_if_index;
548   if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
549     sw->sup_sw_if_index = sw->sw_if_index;
550
551   /* Allocate counters for this interface. */
552   {
553     u32 i;
554
555     vnet_interface_counter_lock (im);
556
557     for (i = 0; i < vec_len (im->sw_if_counters); i++)
558       {
559         vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
560         vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
561       }
562
563     for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
564       {
565         vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
566                                         sw_if_index);
567         vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
568                                     sw_if_index);
569       }
570
571     vnet_interface_counter_unlock (im);
572   }
573
574   return sw_if_index;
575 }
576
577 clib_error_t *
578 vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
579                           u32 * sw_if_index)
580 {
581   clib_error_t *error;
582   vnet_hw_interface_t *hi;
583   vnet_device_class_t *dev_class;
584
585   if (template->sub.eth.flags.two_tags == 1
586       && template->sub.eth.flags.exact_match == 1
587       && (template->sub.eth.flags.inner_vlan_id_any == 1
588           || template->sub.eth.flags.outer_vlan_id_any == 1))
589     {
590       error = clib_error_return (0,
591                                  "inner-dot1q any exact-match is unsupported");
592       return error;
593     }
594
595   hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
596   dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
597
598   if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
599       dev_class->subif_add_del_function)
600     {
601       error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
602                                                  (struct vnet_sw_interface_t
603                                                   *) template, 1);
604       if (error)
605         return error;
606     }
607
608   *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
609   error = vnet_sw_interface_set_flags_helper
610     (vnm, *sw_if_index, template->flags,
611      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
612
613   if (error)
614     {
615       /* undo the work done by vnet_create_sw_interface_no_callbacks() */
616       vnet_interface_main_t *im = &vnm->interface_main;
617       vnet_sw_interface_t *sw =
618         pool_elt_at_index (im->sw_interfaces, *sw_if_index);
619       pool_put (im->sw_interfaces, sw);
620     }
621
622   return error;
623 }
624
625 void
626 vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
627 {
628   vnet_interface_main_t *im = &vnm->interface_main;
629   vnet_sw_interface_t *sw =
630     pool_elt_at_index (im->sw_interfaces, sw_if_index);
631
632   /* Check if the interface has config and is removed from L2 BD or XConnect */
633   vlib_main_t *vm = vlib_get_main ();
634   l2_input_config_t *config;
635   if (sw_if_index < vec_len (l2input_main.configs))
636     {
637       config = vec_elt_at_index (l2input_main.configs, sw_if_index);
638       if (config->xconnect)
639         set_int_l2_mode (vm, vnm, MODE_L3, config->output_sw_if_index, 0,
640                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
641       if (config->xconnect || config->bridge)
642         set_int_l2_mode (vm, vnm, MODE_L3, sw_if_index, 0,
643                          L2_BD_PORT_TYPE_NORMAL, 0, 0);
644     }
645   vnet_clear_sw_interface_tag (vnm, sw_if_index);
646
647   /* Bring down interface in case it is up. */
648   if (sw->flags != 0)
649     vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
650
651   call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
652
653   pool_put (im->sw_interfaces, sw);
654 }
655
656 static clib_error_t *
657 call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
658 {
659   return call_elf_section_interface_callbacks
660     (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
661 }
662
663 void
664 vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
665 {
666   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
667
668   if (si->mtu[VNET_MTU_L3] != mtu)
669     {
670       si->mtu[VNET_MTU_L3] = mtu;
671       call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
672     }
673 }
674
675 void
676 vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
677                                     u32 mtu[])
678 {
679   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
680   bool changed = false;
681   int i;
682
683   for (i = 0; i < VNET_N_MTU; i++)
684     {
685       if (si->mtu[i] != mtu[i])
686         {
687           si->mtu[i] = mtu[i];
688           changed = true;
689         }
690     }
691   /* Notify interested parties */
692   if (changed)
693     call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
694 }
695
696 void
697 vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
698                                          u32 sw_if_index, u8 enable)
699 {
700   vnet_sw_interface_t *si;
701
702   si = vnet_get_sw_interface (vnm, sw_if_index);
703
704   if (enable)
705     si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
706   else
707     si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
708
709   ip4_directed_broadcast (sw_if_index, enable);
710 }
711
712 /*
713  * Reflect a change in hardware MTU on protocol MTUs
714  */
715 static walk_rc_t
716 sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
717 {
718   u32 *link_mtu = ctx;
719   vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
720   return WALK_CONTINUE;
721 }
722
723 void
724 vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
725 {
726   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
727
728   if (hi->max_packet_bytes != mtu)
729     {
730       hi->max_packet_bytes = mtu;
731       ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
732       vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
733                                  &mtu);
734     }
735 }
736
737 static void
738 setup_tx_node (vlib_main_t * vm,
739                u32 node_index, vnet_device_class_t * dev_class)
740 {
741   vlib_node_t *n = vlib_get_node (vm, node_index);
742
743   n->function = dev_class->tx_function;
744   n->format_trace = dev_class->format_tx_trace;
745
746   vlib_register_errors (vm, node_index,
747                         dev_class->tx_function_n_errors,
748                         dev_class->tx_function_error_strings);
749 }
750
751 static void
752 setup_output_node (vlib_main_t * vm,
753                    u32 node_index, vnet_hw_interface_class_t * hw_class)
754 {
755   vlib_node_t *n = vlib_get_node (vm, node_index);
756   n->format_buffer = hw_class->format_header;
757   n->unformat_buffer = hw_class->unformat_header;
758 }
759
760 /* Register an interface instance. */
761 u32
762 vnet_register_interface (vnet_main_t * vnm,
763                          u32 dev_class_index,
764                          u32 dev_instance,
765                          u32 hw_class_index, u32 hw_instance)
766 {
767   vnet_interface_main_t *im = &vnm->interface_main;
768   vnet_hw_interface_t *hw;
769   vnet_device_class_t *dev_class =
770     vnet_get_device_class (vnm, dev_class_index);
771   vnet_hw_interface_class_t *hw_class =
772     vnet_get_hw_interface_class (vnm, hw_class_index);
773   vlib_main_t *vm = vnm->vlib_main;
774   vnet_feature_config_main_t *fcm;
775   vnet_config_main_t *cm;
776   u32 hw_index, i;
777   char *tx_node_name = NULL, *output_node_name = NULL;
778
779   pool_get (im->hw_interfaces, hw);
780   clib_memset (hw, 0, sizeof (*hw));
781   hw->trace_classify_table_index = ~0;
782
783   hw_index = hw - im->hw_interfaces;
784   hw->hw_if_index = hw_index;
785   hw->default_rx_mode = VNET_HW_INTERFACE_RX_MODE_POLLING;
786
787   if (dev_class->format_device_name)
788     hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
789   else if (hw_class->format_interface_name)
790     hw->name = format (0, "%U", hw_class->format_interface_name,
791                        dev_instance);
792   else
793     hw->name = format (0, "%s%x", hw_class->name, dev_instance);
794
795   if (!im->hw_interface_by_name)
796     im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
797                                                 sizeof (hw->name[0]),
798                                                 sizeof (uword));
799
800   hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);
801
802   /* Make hardware interface point to software interface. */
803   {
804     vnet_sw_interface_t sw = {
805       .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
806       .flood_class = VNET_FLOOD_CLASS_NORMAL,
807       .hw_if_index = hw_index
808     };
809     hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
810   }
811
812   hw->dev_class_index = dev_class_index;
813   hw->dev_instance = dev_instance;
814   hw->hw_class_index = hw_class_index;
815   hw->hw_instance = hw_instance;
816
817   hw->max_rate_bits_per_sec = 0;
818   hw->min_packet_bytes = 0;
819   vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);
820
821   if (dev_class->tx_function == 0)
822     goto no_output_nodes;       /* No output/tx nodes to create */
823
824   tx_node_name = (char *) format (0, "%v-tx", hw->name);
825   output_node_name = (char *) format (0, "%v-output", hw->name);
826
827   /* If we have previously deleted interface nodes, re-use them. */
828   if (vec_len (im->deleted_hw_interface_nodes) > 0)
829     {
830       vnet_hw_interface_nodes_t *hn;
831       vlib_node_t *node;
832       vlib_node_runtime_t *nrt;
833
834       hn = vec_end (im->deleted_hw_interface_nodes) - 1;
835
836       hw->tx_node_index = hn->tx_node_index;
837       hw->output_node_index = hn->output_node_index;
838
839       vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
840       vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);
841
842       /* *INDENT-OFF* */
843       foreach_vlib_main ({
844         vnet_interface_output_runtime_t *rt;
845
846         rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
847         ASSERT (rt->is_deleted == 1);
848         rt->is_deleted = 0;
849         rt->hw_if_index = hw_index;
850         rt->sw_if_index = hw->sw_if_index;
851         rt->dev_instance = hw->dev_instance;
852
853         rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
854         rt->hw_if_index = hw_index;
855         rt->sw_if_index = hw->sw_if_index;
856         rt->dev_instance = hw->dev_instance;
857       });
858       /* *INDENT-ON* */
859
860       /* The new class may differ from the old one.
861        * Functions have to be updated. */
862       node = vlib_get_node (vm, hw->output_node_index);
863       node->function = vnet_interface_output_node;
864       node->format_trace = format_vnet_interface_output_trace;
865       /* *INDENT-OFF* */
866       foreach_vlib_main ({
867         nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
868         nrt->function = node->function;
869       });
870       /* *INDENT-ON* */
871
872       node = vlib_get_node (vm, hw->tx_node_index);
873       node->function = dev_class->tx_function;
874       node->format_trace = dev_class->format_tx_trace;
875       /* *INDENT-OFF* */
876       foreach_vlib_main ({
877         nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
878         nrt->function = node->function;
879       });
880       /* *INDENT-ON* */
881
882       _vec_len (im->deleted_hw_interface_nodes) -= 1;
883     }
884   else
885     {
886       vlib_node_registration_t r;
887       vnet_interface_output_runtime_t rt = {
888         .hw_if_index = hw_index,
889         .sw_if_index = hw->sw_if_index,
890         .dev_instance = hw->dev_instance,
891         .is_deleted = 0,
892       };
893
894       clib_memset (&r, 0, sizeof (r));
895       r.type = VLIB_NODE_TYPE_INTERNAL;
896       r.runtime_data = &rt;
897       r.runtime_data_bytes = sizeof (rt);
898       r.scalar_size = 0;
899       r.vector_size = sizeof (u32);
900
901       r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
902       r.name = tx_node_name;
903       r.function = dev_class->tx_function;
904
905       hw->tx_node_index = vlib_register_node (vm, &r);
906
907       vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
908                                           "error-drop",
909                                           VNET_INTERFACE_TX_NEXT_DROP);
910
911       r.flags = 0;
912       r.name = output_node_name;
913       r.function = vnet_interface_output_node;
914       r.format_trace = format_vnet_interface_output_trace;
915
916       {
917         static char *e[] = {
918           "interface is down",
919           "interface is deleted",
920           "no buffers to segment GSO",
921         };
922
923         r.n_errors = ARRAY_LEN (e);
924         r.error_strings = e;
925       }
926       hw->output_node_index = vlib_register_node (vm, &r);
927
928       vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
929                                           "error-drop",
930                                           VNET_INTERFACE_OUTPUT_NEXT_DROP);
931       vlib_node_add_next_with_slot (vm, hw->output_node_index,
932                                     hw->tx_node_index,
933                                     VNET_INTERFACE_OUTPUT_NEXT_TX);
934
935       /* add interface to the list of "output-interface" feature arc start nodes
936          and clone nexts from 1st interface if it exists */
937       fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
938       cm = &fcm->config_main;
939       i = vec_len (cm->start_node_indices);
940       vec_validate (cm->start_node_indices, i);
941       cm->start_node_indices[i] = hw->output_node_index;
942       if (hw_index)
943         {
944           /* copy nexts from 1st interface */
945           vnet_hw_interface_t *first_hw;
946           vlib_node_t *first_node;
947
948           first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
949           first_node = vlib_get_node (vm, first_hw->output_node_index);
950
951           /* 1st 2 nexts are already added above */
952           for (i = 2; i < vec_len (first_node->next_nodes); i++)
953             vlib_node_add_next_with_slot (vm, hw->output_node_index,
954                                           first_node->next_nodes[i], i);
955         }
956     }
957
958   setup_output_node (vm, hw->output_node_index, hw_class);
959   setup_tx_node (vm, hw->tx_node_index, dev_class);
960
961 no_output_nodes:
962   /* Call all up/down callbacks with zero flags when interface is created. */
963   vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
964                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
965   vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
966                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
967   vec_free (tx_node_name);
968   vec_free (output_node_name);
969
970   return hw_index;
971 }
972
973 void
974 vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
975 {
976   vnet_interface_main_t *im = &vnm->interface_main;
977   vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
978   vlib_main_t *vm = vnm->vlib_main;
979   vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
980                                                           hw->dev_class_index);
981   /* If it is up, mark it down. */
982   if (hw->flags != 0)
983     vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);
984
985   /* Call delete callbacks. */
986   call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);
987
988   /* Delete any sub-interfaces. */
989   {
990     u32 id, sw_if_index;
991     /* *INDENT-OFF* */
992     hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
993     ({
994       vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
995       u64 sup_and_sub_key =
996         ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
997       hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
998       vnet_delete_sw_interface (vnm, sw_if_index);
999     }));
1000     hash_free (hw->sub_interface_sw_if_index_by_id);
1001     /* *INDENT-ON* */
1002   }
1003
1004   /* Delete software interface corresponding to hardware interface. */
1005   vnet_delete_sw_interface (vnm, hw->sw_if_index);
1006
1007   if (dev_class->tx_function)
1008     {
1009       /* Put output/tx nodes into recycle pool */
1010       vnet_hw_interface_nodes_t *dn;
1011
1012       /* *INDENT-OFF* */
1013       foreach_vlib_main
1014         ({
1015           vnet_interface_output_runtime_t *rt =
1016             vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
1017
1018           /* Mark node runtime as deleted so output node (if called)
1019            * will drop packets. */
1020           rt->is_deleted = 1;
1021         });
1022       /* *INDENT-ON* */
1023
1024       vlib_node_rename (vm, hw->output_node_index,
1025                         "interface-%d-output-deleted", hw_if_index);
1026       vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
1027                         hw_if_index);
1028       vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
1029       dn->tx_node_index = hw->tx_node_index;
1030       dn->output_node_index = hw->output_node_index;
1031     }
1032
1033   hash_unset_mem (im->hw_interface_by_name, hw->name);
1034   vec_free (hw->name);
1035   vec_free (hw->hw_address);
1036   vec_free (hw->input_node_thread_index_by_queue);
1037   vec_free (hw->dq_runtime_index_by_queue);
1038
1039   pool_put (im->hw_interfaces, hw);
1040 }
1041
1042 void
1043 vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1044                            u32 hw_if_index,
1045                            vnet_hw_sw_interface_walk_t fn, void *ctx)
1046 {
1047   vnet_hw_interface_t *hi;
1048   u32 id, sw_if_index;
1049
1050   hi = vnet_get_hw_interface (vnm, hw_if_index);
1051   /* the super first, then the sub interfaces */
1052   if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1053     return;
1054
1055   /* *INDENT-OFF* */
1056   hash_foreach (id, sw_if_index,
1057                 hi->sub_interface_sw_if_index_by_id,
1058   ({
1059     if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1060       break;
1061   }));
1062   /* *INDENT-ON* */
1063 }
1064
1065 void
1066 vnet_hw_interface_walk (vnet_main_t * vnm,
1067                         vnet_hw_interface_walk_t fn, void *ctx)
1068 {
1069   vnet_interface_main_t *im;
1070   vnet_hw_interface_t *hi;
1071
1072   im = &vnm->interface_main;
1073
1074   /* *INDENT-OFF* */
1075   pool_foreach (hi, im->hw_interfaces,
1076   ({
1077     if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1078       break;
1079   }));
1080   /* *INDENT-ON* */
1081 }
1082
1083 void
1084 vnet_sw_interface_walk (vnet_main_t * vnm,
1085                         vnet_sw_interface_walk_t fn, void *ctx)
1086 {
1087   vnet_interface_main_t *im;
1088   vnet_sw_interface_t *si;
1089
1090   im = &vnm->interface_main;
1091
1092   /* *INDENT-OFF* */
1093   pool_foreach (si, im->sw_interfaces,
1094   {
1095     if (WALK_STOP == fn (vnm, si, ctx))
1096       break;
1097   });
1098   /* *INDENT-ON* */
1099 }
1100
1101 void
1102 vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1103                                   u32 hw_class_index, u32 hw_instance)
1104 {
1105   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1106   vnet_hw_interface_class_t *hc =
1107     vnet_get_hw_interface_class (vnm, hw_class_index);
1108
1109   hi->hw_class_index = hw_class_index;
1110   hi->hw_instance = hw_instance;
1111   setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1112 }
1113
1114 static clib_error_t *
1115 vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1116                                     u32 hw_class_index, u32 redistribute)
1117 {
1118   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1119   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1120   vnet_hw_interface_class_t *old_class =
1121     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1122   vnet_hw_interface_class_t *new_class =
1123     vnet_get_hw_interface_class (vnm, hw_class_index);
1124   vnet_device_class_t *dev_class =
1125     vnet_get_device_class (vnm, hi->dev_class_index);
1126   clib_error_t *error = 0;
1127
1128   /* New class equals old class?  Nothing to do. */
1129   if (hi->hw_class_index == hw_class_index)
1130     return 0;
1131
1132   /* No need (and incorrect since admin up flag may be set) to do error checking when
1133      receiving unserialize message. */
1134   if (redistribute)
1135     {
1136       if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1137         return clib_error_return (0,
1138                                   "%v must be admin down to change class from %s to %s",
1139                                   hi->name, old_class->name, new_class->name);
1140
1141       /* Make sure interface supports given class. */
1142       if ((new_class->is_valid_class_for_interface
1143            && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1144                                                         hw_class_index))
1145           || (dev_class->is_valid_class_for_interface
1146               && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1147                                                            hw_class_index)))
1148         return clib_error_return (0,
1149                                   "%v class cannot be changed from %s to %s",
1150                                   hi->name, old_class->name, new_class->name);
1151
1152     }
1153
1154   if (old_class->hw_class_change)
1155     old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1156                                 new_class->index);
1157
1158   vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1159                                     /* instance */ ~0);
1160
1161   if (new_class->hw_class_change)
1162     new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1163                                 new_class->index);
1164
1165   if (dev_class->hw_class_change)
1166     dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1167
1168   return error;
1169 }
1170
1171 clib_error_t *
1172 vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1173                              u32 hw_class_index)
1174 {
1175   return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1176                                              /* redistribute */ 1);
1177 }
1178
1179 static int
1180 vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1181                                               u32 hw_if_index,
1182                                               u32 node_index,
1183                                               u32 redistribute)
1184 {
1185   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1186   vnet_device_class_t *dev_class = vnet_get_device_class
1187     (vnm, hi->dev_class_index);
1188
1189   if (dev_class->rx_redirect_to_node)
1190     {
1191       dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1192       return 0;
1193     }
1194
1195   return VNET_API_ERROR_UNIMPLEMENTED;
1196 }
1197
1198 int
1199 vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1200                                        u32 node_index)
1201 {
1202   return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1203                                                        node_index,
1204                                                        1 /* redistribute */ );
1205 }
1206
1207 word
1208 vnet_sw_interface_compare (vnet_main_t * vnm,
1209                            uword sw_if_index0, uword sw_if_index1)
1210 {
1211   vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1212   vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1213   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1214   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1215
1216   if (h0 != h1)
1217     return vec_cmp (h0->name, h1->name);
1218   return (word) h0->hw_instance - (word) h1->hw_instance;
1219 }
1220
1221 word
1222 vnet_hw_interface_compare (vnet_main_t * vnm,
1223                            uword hw_if_index0, uword hw_if_index1)
1224 {
1225   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1226   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1227
1228   if (h0 != h1)
1229     return vec_cmp (h0->name, h1->name);
1230   return (word) h0->hw_instance - (word) h1->hw_instance;
1231 }
1232
1233 int
1234 vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1235 {
1236   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1237   if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1238       (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1239     return 1;
1240
1241   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1242   vnet_hw_interface_class_t *hc =
1243     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1244
1245   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1246 }
1247
1248 int
1249 vnet_sw_interface_is_nbma (vnet_main_t * vnm, u32 sw_if_index)
1250 {
1251   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1252   vnet_hw_interface_class_t *hc =
1253     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1254
1255   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_NBMA);
1256 }
1257
1258 clib_error_t *
1259 vnet_interface_init (vlib_main_t * vm)
1260 {
1261   vnet_main_t *vnm = vnet_get_main ();
1262   vnet_interface_main_t *im = &vnm->interface_main;
1263   vlib_buffer_t *b = 0;
1264   vnet_buffer_opaque_t *o = 0;
1265   clib_error_t *error;
1266
1267   /*
1268    * Keep people from shooting themselves in the foot.
1269    */
1270   if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
1271     {
1272 #define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
1273       clib_warning                                                      \
1274         ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
1275          #a, sizeof(o->a), sizeof (o->unused));
1276       foreach_buffer_opaque_union_subtype;
1277 #undef _
1278
1279       return clib_error_return
1280         (0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
1281          sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
1282     }
1283
1284   clib_spinlock_init (&im->sw_if_counter_lock);
1285   clib_spinlock_lock (&im->sw_if_counter_lock); /* should be no need */
1286
1287   vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
1288 #define _(E,n,p)                                                        \
1289   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;             \
1290   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1291   foreach_simple_interface_counter_name
1292 #undef _
1293     vec_validate (im->combined_sw_if_counters,
1294                   VNET_N_COMBINED_INTERFACE_COUNTER - 1);
1295 #define _(E,n,p)                                                        \
1296   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;    \
1297   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1298   foreach_combined_interface_counter_name
1299 #undef _
1300     clib_spinlock_unlock (&im->sw_if_counter_lock);
1301
1302   im->device_class_by_name = hash_create_string ( /* size */ 0,
1303                                                  sizeof (uword));
1304   {
1305     vnet_device_class_t *c;
1306
1307     c = vnm->device_class_registrations;
1308
1309     while (c)
1310       {
1311         c->index = vec_len (im->device_classes);
1312         hash_set_mem (im->device_class_by_name, c->name, c->index);
1313
1314         if (c->tx_fn_registrations)
1315           {
1316             vlib_node_fn_registration_t *fnr = c->tx_fn_registrations;
1317             int priority = -1;
1318
1319             /* to avoid confusion, please remove ".tx_function" statement
1320                from VNET_DEVICE_CLASS() if using function candidates */
1321             ASSERT (c->tx_function == 0);
1322
1323             while (fnr)
1324               {
1325                 if (fnr->priority > priority)
1326                   {
1327                     priority = fnr->priority;
1328                     c->tx_function = fnr->function;
1329                   }
1330                 fnr = fnr->next_registration;
1331               }
1332           }
1333
1334         vec_add1 (im->device_classes, c[0]);
1335         c = c->next_class_registration;
1336       }
1337   }
1338
1339   im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
1340                                                        sizeof (uword));
1341
1342   im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
1343                                                     sizeof (uword));
1344   {
1345     vnet_hw_interface_class_t *c;
1346
1347     c = vnm->hw_interface_class_registrations;
1348
1349     while (c)
1350       {
1351         c->index = vec_len (im->hw_interface_classes);
1352         hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);
1353
1354         if (NULL == c->build_rewrite)
1355           c->build_rewrite = default_build_rewrite;
1356         if (NULL == c->update_adjacency)
1357           c->update_adjacency = default_update_adjacency;
1358
1359         vec_add1 (im->hw_interface_classes, c[0]);
1360         c = c->next_class_registration;
1361       }
1362   }
1363
1364   /* init per-thread data */
1365   vec_validate_aligned (im->per_thread_data, vlib_num_workers (),
1366                         CLIB_CACHE_LINE_BYTES);
1367
1368   if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
1369     return error;
1370
1371   vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));
1372
1373 #if VLIB_BUFFER_TRACE_TRAJECTORY > 0
1374   if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
1375     return error;
1376 #endif
1377
1378   return 0;
1379 }
1380
1381 VLIB_INIT_FUNCTION (vnet_interface_init);
1382
1383 /* Kludge to renumber interface names [only!] */
1384 int
1385 vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1386 {
1387   int rv;
1388   vnet_main_t *vnm = vnet_get_main ();
1389   vnet_interface_main_t *im = &vnm->interface_main;
1390   vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1391
1392   vnet_device_class_t *dev_class = vnet_get_device_class
1393     (vnm, hi->dev_class_index);
1394
1395   if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1396     return VNET_API_ERROR_UNIMPLEMENTED;
1397
1398   rv = dev_class->name_renumber (hi, new_show_dev_instance);
1399
1400   if (rv)
1401     return rv;
1402
1403   hash_unset_mem (im->hw_interface_by_name, hi->name);
1404   vec_free (hi->name);
1405   /* Use the mapping we set up to call it Ishmael */
1406   hi->name = format (0, "%U", dev_class->format_device_name,
1407                      hi->dev_instance);
1408
1409   hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1410   return rv;
1411 }
1412
1413 clib_error_t *
1414 vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1415 {
1416   vnet_interface_main_t *im = &vnm->interface_main;
1417   vlib_main_t *vm = vnm->vlib_main;
1418   vnet_hw_interface_t *hw;
1419   u8 *old_name;
1420   clib_error_t *error = 0;
1421
1422   hw = vnet_get_hw_interface (vnm, hw_if_index);
1423   if (!hw)
1424     {
1425       return clib_error_return (0,
1426                                 "unable to find hw interface for index %u",
1427                                 hw_if_index);
1428     }
1429
1430   old_name = hw->name;
1431
1432   /* set new hw->name */
1433   hw->name = format (0, "%s", new_name);
1434
1435   /* remove the old name to hw_if_index mapping and install the new one */
1436   hash_unset_mem (im->hw_interface_by_name, old_name);
1437   hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1438
1439   /* rename tx/output nodes */
1440   vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1441   vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1442
1443   /* free the old name vector */
1444   vec_free (old_name);
1445
1446   return error;
1447 }
1448
1449 clib_error_t *
1450 vnet_hw_interface_add_del_mac_address (vnet_main_t * vnm,
1451                                        u32 hw_if_index,
1452                                        const u8 * mac_address, u8 is_add)
1453 {
1454   clib_error_t *error = 0;
1455   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1456
1457   vnet_device_class_t *dev_class =
1458     vnet_get_device_class (vnm, hi->dev_class_index);
1459
1460   if (!hi->hw_address)
1461     {
1462       error =
1463         clib_error_return
1464         (0, "Secondary MAC Addresses not supported for interface index %u",
1465          hw_if_index);
1466       goto done;
1467     }
1468
1469   if (dev_class->mac_addr_add_del_function)
1470     error = dev_class->mac_addr_add_del_function (hi, mac_address, is_add);
1471
1472   if (!error)
1473     {
1474       vnet_hw_interface_class_t *hw_class;
1475
1476       hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1477
1478       if (NULL != hw_class->mac_addr_add_del_function)
1479         error = hw_class->mac_addr_add_del_function (hi, mac_address, is_add);
1480     }
1481
1482   /* If no errors, add to the list of secondary MACs on the ethernet intf */
1483   if (!error)
1484     ethernet_interface_add_del_address (&ethernet_main, hw_if_index,
1485                                         mac_address, is_add);
1486
1487 done:
1488   return error;
1489 }
1490
1491 static clib_error_t *
1492 vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1493                                              u32 hw_if_index,
1494                                              const u8 * mac_address)
1495 {
1496   clib_error_t *error = 0;
1497   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1498
1499   if (hi->hw_address)
1500     {
1501       u8 *old_address = vec_dup (hi->hw_address);
1502       vnet_device_class_t *dev_class =
1503         vnet_get_device_class (vnm, hi->dev_class_index);
1504       if (dev_class->mac_addr_change_function)
1505         {
1506           error =
1507             dev_class->mac_addr_change_function (hi, old_address,
1508                                                  mac_address);
1509         }
1510       if (!error)
1511         {
1512           vnet_hw_interface_class_t *hw_class;
1513
1514           hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1515
1516           if (NULL != hw_class->mac_addr_change_function)
1517             hw_class->mac_addr_change_function (hi, old_address, mac_address);
1518         }
1519       else
1520         {
1521           error =
1522             clib_error_return (0,
1523                                "MAC Address Change is not supported on this interface");
1524         }
1525       vec_free (old_address);
1526     }
1527   else
1528     {
1529       error =
1530         clib_error_return (0,
1531                            "mac address change is not supported for interface index %u",
1532                            hw_if_index);
1533     }
1534   return error;
1535 }
1536
1537 clib_error_t *
1538 vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1539                                       const u8 * mac_address)
1540 {
1541   return vnet_hw_interface_change_mac_address_helper
1542     (vnm, hw_if_index, mac_address);
1543 }
1544
1545 /* update the unnumbered state of an interface*/
1546 void
1547 vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1548                                      u32 ip_sw_if_index, u8 enable)
1549 {
1550   vnet_main_t *vnm = vnet_get_main ();
1551   vnet_sw_interface_t *si;
1552   u32 was_unnum;
1553
1554   si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1555   was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1556
1557   if (enable)
1558     {
1559       si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1560       si->unnumbered_sw_if_index = ip_sw_if_index;
1561
1562       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1563         [unnumbered_sw_if_index] =
1564         ip4_main.
1565         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1566       ip6_main.
1567         lookup_main.if_address_pool_index_by_sw_if_index
1568         [unnumbered_sw_if_index] =
1569         ip6_main.
1570         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1571     }
1572   else
1573     {
1574       si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1575       si->unnumbered_sw_if_index = (u32) ~ 0;
1576
1577       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1578         [unnumbered_sw_if_index] = ~0;
1579       ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1580         [unnumbered_sw_if_index] = ~0;
1581     }
1582
1583   if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1584     {
1585       ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1586       ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1587     }
1588 }
1589
1590 vnet_l3_packet_type_t
1591 vnet_link_to_l3_proto (vnet_link_t link)
1592 {
1593   switch (link)
1594     {
1595     case VNET_LINK_IP4:
1596       return (VNET_L3_PACKET_TYPE_IP4);
1597     case VNET_LINK_IP6:
1598       return (VNET_L3_PACKET_TYPE_IP6);
1599     case VNET_LINK_MPLS:
1600       return (VNET_L3_PACKET_TYPE_MPLS);
1601     case VNET_LINK_ARP:
1602       return (VNET_L3_PACKET_TYPE_ARP);
1603     case VNET_LINK_ETHERNET:
1604     case VNET_LINK_NSH:
1605       ASSERT (0);
1606       break;
1607     }
1608   ASSERT (0);
1609   return (0);
1610 }
1611
1612 vnet_mtu_t
1613 vnet_link_to_mtu (vnet_link_t link)
1614 {
1615   switch (link)
1616     {
1617     case VNET_LINK_IP4:
1618       return (VNET_MTU_IP4);
1619     case VNET_LINK_IP6:
1620       return (VNET_MTU_IP6);
1621     case VNET_LINK_MPLS:
1622       return (VNET_MTU_MPLS);
1623     default:
1624       return (VNET_MTU_L3);
1625     }
1626 }
1627
1628 u8 *
1629 default_build_rewrite (vnet_main_t * vnm,
1630                        u32 sw_if_index,
1631                        vnet_link_t link_type, const void *dst_address)
1632 {
1633   return (NULL);
1634 }
1635
1636 void
1637 default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1638 {
1639   ip_adjacency_t *adj;
1640
1641   adj = adj_get (ai);
1642
1643   switch (adj->lookup_next_index)
1644     {
1645     case IP_LOOKUP_NEXT_GLEAN:
1646       adj_glean_update_rewrite (ai);
1647       break;
1648     case IP_LOOKUP_NEXT_ARP:
1649     case IP_LOOKUP_NEXT_BCAST:
1650       /*
1651        * default rewrite in neighbour adj
1652        */
1653       adj_nbr_update_rewrite
1654         (ai,
1655          ADJ_NBR_REWRITE_FLAG_COMPLETE,
1656          vnet_build_rewrite_for_sw_interface (vnm,
1657                                               sw_if_index,
1658                                               adj_get_link_type (ai), NULL));
1659       break;
1660     case IP_LOOKUP_NEXT_MCAST:
1661       /*
1662        * mcast traffic also uses default rewrite string with no mcast
1663        * switch time updates.
1664        */
1665       adj_mcast_update_rewrite
1666         (ai,
1667          vnet_build_rewrite_for_sw_interface (vnm,
1668                                               sw_if_index,
1669                                               adj_get_link_type (ai),
1670                                               NULL), 0);
1671       break;
1672     case IP_LOOKUP_NEXT_DROP:
1673     case IP_LOOKUP_NEXT_PUNT:
1674     case IP_LOOKUP_NEXT_LOCAL:
1675     case IP_LOOKUP_NEXT_REWRITE:
1676     case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1677     case IP_LOOKUP_NEXT_MIDCHAIN:
1678     case IP_LOOKUP_NEXT_ICMP_ERROR:
1679     case IP_LOOKUP_N_NEXT:
1680       ASSERT (0);
1681       break;
1682     }
1683 }
1684
/* Global switch for detailed interface statistics: 1 = on, 0 = off. */
int collect_detailed_interface_stats_flag = 0;

/* Store the requested state in the global switch. */
static void
collect_detailed_interface_stats_flag_update (int enabled)
{
  collect_detailed_interface_stats_flag = enabled;
}

/* Turn detailed interface statistics on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_update (1);
}

/* Turn detailed interface statistics off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_update (0);
}
1698
1699 static clib_error_t *
1700 collect_detailed_interface_stats_cli (vlib_main_t * vm,
1701                                       unformat_input_t * input,
1702                                       vlib_cli_command_t * cmd)
1703 {
1704   unformat_input_t _line_input, *line_input = &_line_input;
1705   clib_error_t *error = NULL;
1706
1707   /* Get a line of input. */
1708   if (!unformat_user (input, unformat_line_input, line_input))
1709     return clib_error_return (0, "expected enable | disable");
1710
1711   while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1712     {
1713       if (unformat (line_input, "enable") || unformat (line_input, "on"))
1714         collect_detailed_interface_stats_flag_set ();
1715       else if (unformat (line_input, "disable")
1716                || unformat (line_input, "off"))
1717         collect_detailed_interface_stats_flag_clear ();
1718       else
1719         {
1720           error = clib_error_return (0, "unknown input `%U'",
1721                                      format_unformat_error, line_input);
1722           goto done;
1723         }
1724     }
1725
1726 done:
1727   unformat_free (line_input);
1728   return error;
1729 }
1730
1731 /* *INDENT-OFF* */
1732 VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
1733   .path = "interface collect detailed-stats",
1734   .short_help = "interface collect detailed-stats <enable|disable>",
1735   .function = collect_detailed_interface_stats_cli,
1736 };
1737 /* *INDENT-ON* */
1738
1739 /*
1740  * fd.io coding-style-patch-verification: ON
1741  *
1742  * Local Variables:
1743  * eval: (c-set-style "gnu")
1744  * End:
1745  */