interface: add multiarch support for per-interface tx node
[vpp.git] / src / vnet / interface.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * interface.c: VNET interfaces/sub-interfaces
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39
40 #include <vnet/vnet.h>
41 #include <vnet/plugin/plugin.h>
42 #include <vnet/adj/adj.h>
43 #include <vnet/adj/adj_mcast.h>
44 #include <vnet/ip/ip.h>
45
/* Bit flags that steer the sw/hw "set flags" helper routines below. */
typedef enum vnet_interface_helper_flags_t_
{
  /* The interface is being created: add/del callbacks are invoked. */
  VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE = 0x1,
  /* Passed by the public set_flags entry points. */
  VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE = 0x2,
} vnet_interface_helper_flags_t;
51
52 static clib_error_t *vnet_hw_interface_set_flags_helper (vnet_main_t * vnm,
53                                                          u32 hw_if_index,
54                                                          vnet_hw_interface_flags_t
55                                                          flags,
56                                                          vnet_interface_helper_flags_t
57                                                          helper_flags);
58
59 static clib_error_t *vnet_sw_interface_set_flags_helper (vnet_main_t * vnm,
60                                                          u32 sw_if_index,
61                                                          vnet_sw_interface_flags_t
62                                                          flags,
63                                                          vnet_interface_helper_flags_t
64                                                          helper_flags);
65
66 static clib_error_t *vnet_hw_interface_set_class_helper (vnet_main_t * vnm,
67                                                          u32 hw_if_index,
68                                                          u32 hw_class_index,
69                                                          u32 redistribute);
70
/*
 * One (interface index, flags) record as written to and read from the
 * serialized interface state.  The same record type is used for both the
 * software-interface pass and the hardware-interface pass.
 */
typedef struct
{
  /* Either sw or hw interface index, depending on which pass produced it. */
  u32 sw_hw_if_index;

  /* Interface flags (hardware flags are converted to sw flags first). */
  u32 flags;
} vnet_sw_hw_interface_state_t;
79
80 static void
81 serialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m, va_list * va)
82 {
83   vnet_sw_hw_interface_state_t *s =
84     va_arg (*va, vnet_sw_hw_interface_state_t *);
85   u32 n = va_arg (*va, u32);
86   u32 i;
87   for (i = 0; i < n; i++)
88     {
89       serialize_integer (m, s[i].sw_hw_if_index,
90                          sizeof (s[i].sw_hw_if_index));
91       serialize_integer (m, s[i].flags, sizeof (s[i].flags));
92     }
93 }
94
95 static void
96 unserialize_vec_vnet_sw_hw_interface_state (serialize_main_t * m,
97                                             va_list * va)
98 {
99   vnet_sw_hw_interface_state_t *s =
100     va_arg (*va, vnet_sw_hw_interface_state_t *);
101   u32 n = va_arg (*va, u32);
102   u32 i;
103   for (i = 0; i < n; i++)
104     {
105       unserialize_integer (m, &s[i].sw_hw_if_index,
106                            sizeof (s[i].sw_hw_if_index));
107       unserialize_integer (m, &s[i].flags, sizeof (s[i].flags));
108     }
109 }
110
111 static vnet_sw_interface_flags_t
112 vnet_hw_interface_flags_to_sw (vnet_hw_interface_flags_t hwf)
113 {
114   vnet_sw_interface_flags_t swf = VNET_SW_INTERFACE_FLAG_NONE;
115
116   if (hwf & VNET_HW_INTERFACE_FLAG_LINK_UP)
117     swf |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
118
119   return (swf);
120 }
121
122 void
123 serialize_vnet_interface_state (serialize_main_t * m, va_list * va)
124 {
125   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
126   vnet_sw_hw_interface_state_t *sts = 0, *st;
127   vnet_sw_interface_t *sif;
128   vnet_hw_interface_t *hif;
129   vnet_interface_main_t *im = &vnm->interface_main;
130
131   /* Serialize hardware interface classes since they may have changed.
132      Must do this before sending up/down flags. */
133   /* *INDENT-OFF* */
134   pool_foreach (hif, im->hw_interfaces, ({
135     vnet_hw_interface_class_t * hw_class = vnet_get_hw_interface_class (vnm, hif->hw_class_index);
136     serialize_cstring (m, hw_class->name);
137   }));
138   /* *INDENT-ON* */
139
140   /* Send sw/hw interface state when non-zero. */
141   /* *INDENT-OFF* */
142   pool_foreach (sif, im->sw_interfaces, ({
143     if (sif->flags != 0)
144       {
145         vec_add2 (sts, st, 1);
146         st->sw_hw_if_index = sif->sw_if_index;
147         st->flags = sif->flags;
148       }
149   }));
150   /* *INDENT-ON* */
151
152   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
153
154   if (sts)
155     _vec_len (sts) = 0;
156
157   /* *INDENT-OFF* */
158   pool_foreach (hif, im->hw_interfaces, ({
159     if (hif->flags != 0)
160       {
161         vec_add2 (sts, st, 1);
162         st->sw_hw_if_index = hif->hw_if_index;
163         st->flags = vnet_hw_interface_flags_to_sw(hif->flags);
164       }
165   }));
166   /* *INDENT-ON* */
167
168   vec_serialize (m, sts, serialize_vec_vnet_sw_hw_interface_state);
169
170   vec_free (sts);
171 }
172
173 static vnet_hw_interface_flags_t
174 vnet_sw_interface_flags_to_hw (vnet_sw_interface_flags_t swf)
175 {
176   vnet_hw_interface_flags_t hwf = VNET_HW_INTERFACE_FLAG_NONE;
177
178   if (swf & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
179     hwf |= VNET_HW_INTERFACE_FLAG_LINK_UP;
180
181   return (hwf);
182 }
183
184 void
185 unserialize_vnet_interface_state (serialize_main_t * m, va_list * va)
186 {
187   vnet_main_t *vnm = va_arg (*va, vnet_main_t *);
188   vnet_sw_hw_interface_state_t *sts = 0, *st;
189
190   /* First set interface hardware class. */
191   {
192     vnet_interface_main_t *im = &vnm->interface_main;
193     vnet_hw_interface_t *hif;
194     char *class_name;
195     uword *p;
196     clib_error_t *error;
197
198     /* *INDENT-OFF* */
199     pool_foreach (hif, im->hw_interfaces, ({
200       unserialize_cstring (m, &class_name);
201       p = hash_get_mem (im->hw_interface_class_by_name, class_name);
202       if (p)
203         {
204           error = vnet_hw_interface_set_class_helper
205             (vnm, hif->hw_if_index, p[0], /* redistribute */ 0);
206         }
207       else
208         error = clib_error_return (0, "hw class %s AWOL?", class_name);
209
210       if (error)
211         clib_error_report (error);
212       vec_free (class_name);
213     }));
214     /* *INDENT-ON* */
215   }
216
217   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
218   vec_foreach (st, sts)
219     vnet_sw_interface_set_flags_helper (vnm, st->sw_hw_if_index, st->flags,
220                                         /* no distribute */ 0);
221   vec_free (sts);
222
223   vec_unserialize (m, &sts, unserialize_vec_vnet_sw_hw_interface_state);
224   vec_foreach (st, sts)
225   {
226     vnet_hw_interface_set_flags_helper
227       (vnm, st->sw_hw_if_index, vnet_sw_interface_flags_to_hw (st->flags),
228        /* no distribute */ 0);
229   }
230   vec_free (sts);
231 }
232
233 static clib_error_t *
234 call_elf_section_interface_callbacks (vnet_main_t * vnm, u32 if_index,
235                                       u32 flags,
236                                       _vnet_interface_function_list_elt_t **
237                                       elts)
238 {
239   _vnet_interface_function_list_elt_t *elt;
240   vnet_interface_function_priority_t prio;
241   clib_error_t *error = 0;
242
243   for (prio = VNET_ITF_FUNC_PRIORITY_LOW;
244        prio <= VNET_ITF_FUNC_PRIORITY_HIGH; prio++)
245     {
246       elt = elts[prio];
247
248       while (elt)
249         {
250           error = elt->fp (vnm, if_index, flags);
251           if (error)
252             return error;
253           elt = elt->next_interface_function;
254         }
255     }
256   return error;
257 }
258
259 static clib_error_t *
260 call_hw_interface_add_del_callbacks (vnet_main_t * vnm, u32 hw_if_index,
261                                      u32 is_create)
262 {
263   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
264   vnet_hw_interface_class_t *hw_class =
265     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
266   vnet_device_class_t *dev_class =
267     vnet_get_device_class (vnm, hi->dev_class_index);
268   clib_error_t *error = 0;
269
270   if (hw_class->interface_add_del_function
271       && (error =
272           hw_class->interface_add_del_function (vnm, hw_if_index, is_create)))
273     return error;
274
275   if (dev_class->interface_add_del_function
276       && (error =
277           dev_class->interface_add_del_function (vnm, hw_if_index,
278                                                  is_create)))
279     return error;
280
281   error = call_elf_section_interface_callbacks
282     (vnm, hw_if_index, is_create, vnm->hw_interface_add_del_functions);
283
284   return error;
285 }
286
287 static clib_error_t *
288 call_sw_interface_add_del_callbacks (vnet_main_t * vnm, u32 sw_if_index,
289                                      u32 is_create)
290 {
291   return call_elf_section_interface_callbacks
292     (vnm, sw_if_index, is_create, vnm->sw_interface_add_del_functions);
293 }
294
295 static clib_error_t *
296 vnet_hw_interface_set_flags_helper (vnet_main_t * vnm, u32 hw_if_index,
297                                     vnet_hw_interface_flags_t flags,
298                                     vnet_interface_helper_flags_t
299                                     helper_flags)
300 {
301   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
302   vnet_hw_interface_class_t *hw_class =
303     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
304   u32 mask;
305   clib_error_t *error = 0;
306   u32 is_create =
307     (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
308
309   mask =
310     (VNET_HW_INTERFACE_FLAG_LINK_UP | VNET_HW_INTERFACE_FLAG_DUPLEX_MASK);
311   flags &= mask;
312
313   /* Call hardware interface add/del callbacks. */
314   if (is_create)
315     call_hw_interface_add_del_callbacks (vnm, hw_if_index, is_create);
316
317   /* Already in the desired state? */
318   if (!is_create && (hi->flags & mask) == flags)
319     goto done;
320
321   if ((hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP) !=
322       (flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
323     {
324       /* Do hardware class (e.g. ethernet). */
325       if (hw_class->link_up_down_function
326           && (error = hw_class->link_up_down_function (vnm, hw_if_index,
327                                                        flags)))
328         goto done;
329
330       error = call_elf_section_interface_callbacks
331         (vnm, hw_if_index, flags, vnm->hw_interface_link_up_down_functions);
332
333       if (error)
334         goto done;
335     }
336
337   hi->flags &= ~mask;
338   hi->flags |= flags;
339
340 done:
341   return error;
342 }
343
/*
 * Apply admin-up/punt FLAGS to a software interface.
 *
 * Only VNET_SW_INTERFACE_FLAG_ADMIN_UP and VNET_SW_INTERFACE_FLAG_PUNT are
 * considered; other bits in FLAGS are masked off.
 *
 * Creation path (HELPER_IS_CREATE set): runs the sw add/del callbacks and,
 * if the interface is created admin-up, the admin up/down callbacks, then
 * stores the flags.
 *
 * Update path: validates a sub-interface against its super-interface,
 * returns early if nothing changes, stores the new flags, runs the admin
 * up/down callbacks and, for hardware-type interfaces, the device class
 * and hardware class admin up/down functions.  Going admin-down on a
 * hardware interface whose link is up also clears the link-up flag.
 *
 * Returns 0 on success or the first error encountered.
 */
static clib_error_t *
vnet_sw_interface_set_flags_helper (vnet_main_t * vnm, u32 sw_if_index,
                                    vnet_sw_interface_flags_t flags,
                                    vnet_interface_helper_flags_t
                                    helper_flags)
{
  vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
  u32 mask;
  clib_error_t *error = 0;
  u32 is_create =
    (helper_flags & VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE) != 0;
  u32 old_flags;

  /* Restrict the request to the bits this routine manages. */
  mask = VNET_SW_INTERFACE_FLAG_ADMIN_UP | VNET_SW_INTERFACE_FLAG_PUNT;
  flags &= mask;

  if (is_create)
    {
      error =
        call_sw_interface_add_del_callbacks (vnm, sw_if_index, is_create);
      if (error)
        goto done;

      if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
        {
          /* Notify everyone when the interface is created as admin up */
          error = call_elf_section_interface_callbacks (vnm, sw_if_index,
                                                        flags,
                                                        vnm->
                                                        sw_interface_admin_up_down_functions);
          if (error)
            goto done;
        }
    }
  else
    {
      /* For a non-sub interface the "super" interface is the interface
         itself. */
      vnet_sw_interface_t *si_sup = si;

      /* Check that super interface is in correct state. */
      if (si->type == VNET_SW_INTERFACE_TYPE_SUB)
        {
          si_sup = vnet_get_sw_interface (vnm, si->sup_sw_if_index);

          /* The request is accepted when it matches the parent's masked
             flags, or when it clears all flags while the parent's masked
             flags are exactly admin-up (i.e. bringing the sub-interface
             down while its parent is up).  Anything else is an error. */
          if ((flags != (si_sup->flags & mask)) &&
              (!((flags == 0)
                 && ((si_sup->flags & mask) ==
                     VNET_SW_INTERFACE_FLAG_ADMIN_UP))))
            {
              error = clib_error_return (0, "super-interface %U must be %U",
                                         format_vnet_sw_interface_name, vnm,
                                         si_sup,
                                         format_vnet_sw_interface_flags,
                                         flags);
              goto done;
            }
        }

      /* Already in the desired state? */
      if ((si->flags & mask) == flags)
        goto done;

      /* Sub-interfaces of hardware interfaces that do not redistribute,
         do not redistribute themselves. */
      if (si_sup->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
        {
          vnet_hw_interface_t *hi =
            vnet_get_hw_interface (vnm, si_sup->hw_if_index);
          vnet_device_class_t *dev_class =
            vnet_get_device_class (vnm, hi->dev_class_index);
          if (!dev_class->redistribute)
            helper_flags &=
              ~VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE;
        }

      /* set the flags now before invoking the registered clients
       * so that the state they query is consistent with the state here notified */
      old_flags = si->flags;
      si->flags &= ~mask;
      si->flags |= flags;
      /* Callbacks run only if admin-up is set before or after the change. */
      if ((flags | old_flags) & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
        error = call_elf_section_interface_callbacks
          (vnm, sw_if_index, flags,
           vnm->sw_interface_admin_up_down_functions);

      if (error)
        {
          /* restore flags on error */
          si->flags = old_flags;
          goto done;
        }

      if (si->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
        {
          vnet_hw_interface_t *hi =
            vnet_get_hw_interface (vnm, si->hw_if_index);
          vnet_hw_interface_class_t *hw_class =
            vnet_get_hw_interface_class (vnm, hi->hw_class_index);
          vnet_device_class_t *dev_class =
            vnet_get_device_class (vnm, hi->dev_class_index);

          /* NOTE(review): si->flags already carries the new flags at this
             point and they are not rolled back on this error path --
             confirm this is intended. */
          if ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) &&
              (si->flags & VNET_SW_INTERFACE_FLAG_ERROR))
            {
              error = clib_error_return (0, "Interface in the error state");
              goto done;
            }

          /* save the si admin up flag */
          /* NOTE(review): this snapshot is taken after the new flags were
             stored above, so the "restore" statements below put back the
             already-updated value rather than the flags the interface had
             on entry -- confirm this is intended. */
          old_flags = si->flags;

          /* update si admin up flag in advance if we are going admin down */
          if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
            si->flags &= ~VNET_SW_INTERFACE_FLAG_ADMIN_UP;

          /* Device class first... */
          if (dev_class->admin_up_down_function
              && (error = dev_class->admin_up_down_function (vnm,
                                                             si->hw_if_index,
                                                             flags)))
            {
              /* restore si admin up flag to its original state on errors */
              si->flags = old_flags;
              goto done;
            }

          /* ...then the hardware class. */
          if (hw_class->admin_up_down_function
              && (error = hw_class->admin_up_down_function (vnm,
                                                            si->hw_if_index,
                                                            flags)))
            {
              /* restore si admin up flag to its original state on errors */
              si->flags = old_flags;
              goto done;
            }

          /* Admin down implies link down.  The result of the hardware
             helper is not checked. */
          if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
              && (hi->flags & VNET_HW_INTERFACE_FLAG_LINK_UP))
            vnet_hw_interface_set_flags_helper (vnm, si->hw_if_index,
                                                hi->flags &
                                                ~VNET_HW_INTERFACE_FLAG_LINK_UP,
                                                helper_flags);
        }
    }

  /* Store the final state; on the creation path this is the only place
     the flags are written. */
  si->flags &= ~mask;
  si->flags |= flags;

done:
  return error;
}
495
496 clib_error_t *
497 vnet_hw_interface_set_flags (vnet_main_t * vnm, u32 hw_if_index,
498                              vnet_hw_interface_flags_t flags)
499 {
500   return vnet_hw_interface_set_flags_helper
501     (vnm, hw_if_index, flags,
502      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
503 }
504
505 clib_error_t *
506 vnet_sw_interface_set_flags (vnet_main_t * vnm, u32 sw_if_index,
507                              vnet_sw_interface_flags_t flags)
508 {
509   return vnet_sw_interface_set_flags_helper
510     (vnm, sw_if_index, flags,
511      VNET_INTERFACE_SET_FLAGS_HELPER_WANT_REDISTRIBUTE);
512 }
513
514 void
515 vnet_sw_interface_admin_up (vnet_main_t * vnm, u32 sw_if_index)
516 {
517   u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
518
519   if (!(flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
520     {
521       flags |= VNET_SW_INTERFACE_FLAG_ADMIN_UP;
522       vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
523     }
524 }
525
526 void
527 vnet_sw_interface_admin_down (vnet_main_t * vnm, u32 sw_if_index)
528 {
529   u32 flags = vnet_sw_interface_get_flags (vnm, sw_if_index);
530
531   if (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
532     {
533       flags &= ~(VNET_SW_INTERFACE_FLAG_ADMIN_UP);
534       vnet_sw_interface_set_flags (vnm, sw_if_index, flags);
535     }
536 }
537
538 static u32
539 vnet_create_sw_interface_no_callbacks (vnet_main_t * vnm,
540                                        vnet_sw_interface_t * template)
541 {
542   vnet_interface_main_t *im = &vnm->interface_main;
543   vnet_sw_interface_t *sw;
544   u32 sw_if_index;
545
546   pool_get (im->sw_interfaces, sw);
547   sw_if_index = sw - im->sw_interfaces;
548
549   sw[0] = template[0];
550
551   sw->flags = 0;
552   sw->sw_if_index = sw_if_index;
553   if (sw->type == VNET_SW_INTERFACE_TYPE_HARDWARE)
554     sw->sup_sw_if_index = sw->sw_if_index;
555
556   /* Allocate counters for this interface. */
557   {
558     u32 i;
559
560     vnet_interface_counter_lock (im);
561
562     for (i = 0; i < vec_len (im->sw_if_counters); i++)
563       {
564         vlib_validate_simple_counter (&im->sw_if_counters[i], sw_if_index);
565         vlib_zero_simple_counter (&im->sw_if_counters[i], sw_if_index);
566       }
567
568     for (i = 0; i < vec_len (im->combined_sw_if_counters); i++)
569       {
570         vlib_validate_combined_counter (&im->combined_sw_if_counters[i],
571                                         sw_if_index);
572         vlib_zero_combined_counter (&im->combined_sw_if_counters[i],
573                                     sw_if_index);
574       }
575
576     vnet_interface_counter_unlock (im);
577   }
578
579   return sw_if_index;
580 }
581
582 clib_error_t *
583 vnet_create_sw_interface (vnet_main_t * vnm, vnet_sw_interface_t * template,
584                           u32 * sw_if_index)
585 {
586   clib_error_t *error;
587   vnet_hw_interface_t *hi;
588   vnet_device_class_t *dev_class;
589
590   if (template->sub.eth.flags.two_tags == 1
591       && template->sub.eth.flags.exact_match == 1
592       && (template->sub.eth.flags.inner_vlan_id_any == 1
593           || template->sub.eth.flags.outer_vlan_id_any == 1))
594     {
595       error = clib_error_return (0,
596                                  "inner-dot1q any exact-match is unsupported");
597       return error;
598     }
599
600   hi = vnet_get_sup_hw_interface (vnm, template->sup_sw_if_index);
601   dev_class = vnet_get_device_class (vnm, hi->dev_class_index);
602
603   if (template->type == VNET_SW_INTERFACE_TYPE_SUB &&
604       dev_class->subif_add_del_function)
605     {
606       error = dev_class->subif_add_del_function (vnm, hi->hw_if_index,
607                                                  (struct vnet_sw_interface_t
608                                                   *) template, 1);
609       if (error)
610         return error;
611     }
612
613   *sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, template);
614   error = vnet_sw_interface_set_flags_helper
615     (vnm, *sw_if_index, template->flags,
616      VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
617
618   if (error)
619     {
620       /* undo the work done by vnet_create_sw_interface_no_callbacks() */
621       vnet_interface_main_t *im = &vnm->interface_main;
622       vnet_sw_interface_t *sw =
623         pool_elt_at_index (im->sw_interfaces, *sw_if_index);
624       pool_put (im->sw_interfaces, sw);
625     }
626
627   return error;
628 }
629
630 void
631 vnet_delete_sw_interface (vnet_main_t * vnm, u32 sw_if_index)
632 {
633   vnet_interface_main_t *im = &vnm->interface_main;
634   vnet_sw_interface_t *sw =
635     pool_elt_at_index (im->sw_interfaces, sw_if_index);
636
637   /* Check if the interface has config and is removed from L2 BD or XConnect */
638   vnet_clear_sw_interface_tag (vnm, sw_if_index);
639
640   /* Bring down interface in case it is up. */
641   if (sw->flags != 0)
642     vnet_sw_interface_set_flags (vnm, sw_if_index, /* flags */ 0);
643
644   call_sw_interface_add_del_callbacks (vnm, sw_if_index, /* is_create */ 0);
645
646   pool_put (im->sw_interfaces, sw);
647 }
648
649 static clib_error_t *
650 call_sw_interface_mtu_change_callbacks (vnet_main_t * vnm, u32 sw_if_index)
651 {
652   return call_elf_section_interface_callbacks
653     (vnm, sw_if_index, 0, vnm->sw_interface_mtu_change_functions);
654 }
655
656 void
657 vnet_sw_interface_set_mtu (vnet_main_t * vnm, u32 sw_if_index, u32 mtu)
658 {
659   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
660
661   if (si->mtu[VNET_MTU_L3] != mtu)
662     {
663       si->mtu[VNET_MTU_L3] = mtu;
664       call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
665     }
666 }
667
668 void
669 vnet_sw_interface_set_protocol_mtu (vnet_main_t * vnm, u32 sw_if_index,
670                                     u32 mtu[])
671 {
672   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
673   bool changed = false;
674   int i;
675
676   for (i = 0; i < VNET_N_MTU; i++)
677     {
678       if (si->mtu[i] != mtu[i])
679         {
680           si->mtu[i] = mtu[i];
681           changed = true;
682         }
683     }
684   /* Notify interested parties */
685   if (changed)
686     call_sw_interface_mtu_change_callbacks (vnm, sw_if_index);
687 }
688
689 void
690 vnet_sw_interface_ip_directed_broadcast (vnet_main_t * vnm,
691                                          u32 sw_if_index, u8 enable)
692 {
693   vnet_sw_interface_t *si;
694
695   si = vnet_get_sw_interface (vnm, sw_if_index);
696
697   if (enable)
698     si->flags |= VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
699   else
700     si->flags &= ~VNET_SW_INTERFACE_FLAG_DIRECTED_BCAST;
701
702   ip4_directed_broadcast (sw_if_index, enable);
703 }
704
705 /*
706  * Reflect a change in hardware MTU on protocol MTUs
707  */
708 static walk_rc_t
709 sw_interface_walk_callback (vnet_main_t * vnm, u32 sw_if_index, void *ctx)
710 {
711   u32 *link_mtu = ctx;
712   vnet_sw_interface_set_mtu (vnm, sw_if_index, *link_mtu);
713   return WALK_CONTINUE;
714 }
715
716 void
717 vnet_hw_interface_set_mtu (vnet_main_t * vnm, u32 hw_if_index, u32 mtu)
718 {
719   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
720
721   if (hi->max_packet_bytes != mtu)
722     {
723       hi->max_packet_bytes = mtu;
724       ethernet_set_flags (vnm, hw_if_index, ETHERNET_INTERFACE_FLAG_MTU);
725       vnet_hw_interface_walk_sw (vnm, hw_if_index, sw_interface_walk_callback,
726                                  &mtu);
727     }
728 }
729
730 static void
731 setup_tx_node (vlib_main_t * vm,
732                u32 node_index, vnet_device_class_t * dev_class)
733 {
734   vlib_node_t *n = vlib_get_node (vm, node_index);
735
736   n->function = dev_class->tx_function;
737   n->format_trace = dev_class->format_tx_trace;
738
739   /// XXX: Update this to use counter structure
740   vlib_register_errors (vm, node_index,
741                         dev_class->tx_function_n_errors,
742                         dev_class->tx_function_error_strings, 0);
743 }
744
745 static void
746 setup_output_node (vlib_main_t * vm,
747                    u32 node_index, vnet_hw_interface_class_t * hw_class)
748 {
749   vlib_node_t *n = vlib_get_node (vm, node_index);
750   n->format_buffer = hw_class->format_header;
751   n->unformat_buffer = hw_class->unformat_header;
752 }
753
754 /* Register an interface instance. */
755 u32
756 vnet_register_interface (vnet_main_t * vnm,
757                          u32 dev_class_index,
758                          u32 dev_instance,
759                          u32 hw_class_index, u32 hw_instance)
760 {
761   vnet_interface_main_t *im = &vnm->interface_main;
762   vnet_hw_interface_t *hw;
763   vnet_device_class_t *dev_class =
764     vnet_get_device_class (vnm, dev_class_index);
765   vnet_hw_interface_class_t *hw_class =
766     vnet_get_hw_interface_class (vnm, hw_class_index);
767   vlib_main_t *vm = vnm->vlib_main;
768   vnet_feature_config_main_t *fcm;
769   vnet_config_main_t *cm;
770   u32 hw_index, i;
771   char *tx_node_name = NULL, *output_node_name = NULL;
772   vlib_node_function_t *output_node = vnet_interface_output_node_get ();
773
774   pool_get (im->hw_interfaces, hw);
775   clib_memset (hw, 0, sizeof (*hw));
776   hw->trace_classify_table_index = ~0;
777
778   hw_index = hw - im->hw_interfaces;
779   hw->hw_if_index = hw_index;
780   hw->default_rx_mode = VNET_HW_IF_RX_MODE_POLLING;
781
782   if (dev_class->format_device_name)
783     hw->name = format (0, "%U", dev_class->format_device_name, dev_instance);
784   else if (hw_class->format_interface_name)
785     hw->name = format (0, "%U", hw_class->format_interface_name,
786                        dev_instance);
787   else
788     hw->name = format (0, "%s%x", hw_class->name, dev_instance);
789
790   if (!im->hw_interface_by_name)
791     im->hw_interface_by_name = hash_create_vec ( /* size */ 0,
792                                                 sizeof (hw->name[0]),
793                                                 sizeof (uword));
794
795   hash_set_mem (im->hw_interface_by_name, hw->name, hw_index);
796
797   /* Make hardware interface point to software interface. */
798   {
799     vnet_sw_interface_t sw = {
800       .type = VNET_SW_INTERFACE_TYPE_HARDWARE,
801       .flood_class = VNET_FLOOD_CLASS_NORMAL,
802       .hw_if_index = hw_index
803     };
804     hw->sw_if_index = vnet_create_sw_interface_no_callbacks (vnm, &sw);
805   }
806
807   hw->dev_class_index = dev_class_index;
808   hw->dev_instance = dev_instance;
809   hw->hw_class_index = hw_class_index;
810   hw->hw_instance = hw_instance;
811
812   hw->max_rate_bits_per_sec = 0;
813   hw->min_packet_bytes = 0;
814   vnet_sw_interface_set_mtu (vnm, hw->sw_if_index, 0);
815
816   if (dev_class->tx_function == 0)
817     goto no_output_nodes;       /* No output/tx nodes to create */
818
819   tx_node_name = (char *) format (0, "%v-tx", hw->name);
820   output_node_name = (char *) format (0, "%v-output", hw->name);
821
822   /* If we have previously deleted interface nodes, re-use them. */
823   if (vec_len (im->deleted_hw_interface_nodes) > 0)
824     {
825       vnet_hw_interface_nodes_t *hn;
826       vlib_node_t *node;
827       vlib_node_runtime_t *nrt;
828
829       hn = vec_end (im->deleted_hw_interface_nodes) - 1;
830
831       hw->tx_node_index = hn->tx_node_index;
832       hw->output_node_index = hn->output_node_index;
833
834       vlib_node_rename (vm, hw->tx_node_index, "%v", tx_node_name);
835       vlib_node_rename (vm, hw->output_node_index, "%v", output_node_name);
836
837       /* *INDENT-OFF* */
838       foreach_vlib_main ({
839         vnet_interface_output_runtime_t *rt;
840
841         rt = vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
842         ASSERT (rt->is_deleted == 1);
843         rt->is_deleted = 0;
844         rt->hw_if_index = hw_index;
845         rt->sw_if_index = hw->sw_if_index;
846         rt->dev_instance = hw->dev_instance;
847
848         rt = vlib_node_get_runtime_data (this_vlib_main, hw->tx_node_index);
849         rt->hw_if_index = hw_index;
850         rt->sw_if_index = hw->sw_if_index;
851         rt->dev_instance = hw->dev_instance;
852       });
853       /* *INDENT-ON* */
854
855       /* The new class may differ from the old one.
856        * Functions have to be updated. */
857       node = vlib_get_node (vm, hw->output_node_index);
858       node->function = output_node;
859       node->format_trace = format_vnet_interface_output_trace;
860       /* *INDENT-OFF* */
861       foreach_vlib_main ({
862         nrt = vlib_node_get_runtime (this_vlib_main, hw->output_node_index);
863         nrt->function = node->function;
864         vlib_node_runtime_perf_counter (this_vlib_main, nrt, 0, 0, 0,
865                                         VLIB_NODE_RUNTIME_PERF_RESET);
866       });
867       /* *INDENT-ON* */
868
869       node = vlib_get_node (vm, hw->tx_node_index);
870       node->function = dev_class->tx_function;
871       node->format_trace = dev_class->format_tx_trace;
872       /* *INDENT-OFF* */
873       foreach_vlib_main ({
874         nrt = vlib_node_get_runtime (this_vlib_main, hw->tx_node_index);
875         nrt->function = node->function;
876         vlib_node_runtime_perf_counter (this_vlib_main, nrt, 0, 0, 0,
877                                         VLIB_NODE_RUNTIME_PERF_RESET);
878       });
879       /* *INDENT-ON* */
880
881       _vec_len (im->deleted_hw_interface_nodes) -= 1;
882     }
883   else
884     {
885       vlib_node_registration_t r;
886       vnet_interface_output_runtime_t rt = {
887         .hw_if_index = hw_index,
888         .sw_if_index = hw->sw_if_index,
889         .dev_instance = hw->dev_instance,
890         .is_deleted = 0,
891       };
892
893       clib_memset (&r, 0, sizeof (r));
894       r.type = VLIB_NODE_TYPE_INTERNAL;
895       r.runtime_data = &rt;
896       r.runtime_data_bytes = sizeof (rt);
897       r.scalar_size = 0;
898       r.vector_size = sizeof (u32);
899
900       r.flags = VLIB_NODE_FLAG_IS_OUTPUT;
901       r.name = tx_node_name;
902       r.function = dev_class->tx_function;
903
904       hw->tx_node_index = vlib_register_node (vm, &r);
905
906       vlib_node_add_named_next_with_slot (vm, hw->tx_node_index,
907                                           "error-drop",
908                                           VNET_INTERFACE_TX_NEXT_DROP);
909
910       r.flags = 0;
911       r.name = output_node_name;
912       r.function = output_node;
913       r.format_trace = format_vnet_interface_output_trace;
914
915       {
916         static char *e[] = {
917           "interface is down",
918           "interface is deleted",
919           "no buffers to segment GSO",
920         };
921
922         r.n_errors = ARRAY_LEN (e);
923         r.error_strings = e;
924       }
925       hw->output_node_index = vlib_register_node (vm, &r);
926
927       vlib_node_add_named_next_with_slot (vm, hw->output_node_index,
928                                           "error-drop",
929                                           VNET_INTERFACE_OUTPUT_NEXT_DROP);
930       vlib_node_add_next_with_slot (vm, hw->output_node_index,
931                                     hw->tx_node_index,
932                                     VNET_INTERFACE_OUTPUT_NEXT_TX);
933
934       /* add interface to the list of "output-interface" feature arc start nodes
935          and clone nexts from 1st interface if it exists */
936       fcm = vnet_feature_get_config_main (im->output_feature_arc_index);
937       cm = &fcm->config_main;
938       i = vec_len (cm->start_node_indices);
939       vec_validate (cm->start_node_indices, i);
940       cm->start_node_indices[i] = hw->output_node_index;
941       if (hw_index)
942         {
943           /* copy nexts from 1st interface */
944           vnet_hw_interface_t *first_hw;
945           vlib_node_t *first_node;
946
947           first_hw = vnet_get_hw_interface (vnm, /* hw_if_index */ 0);
948           first_node = vlib_get_node (vm, first_hw->output_node_index);
949
950           /* 1st 2 nexts are already added above */
951           for (i = 2; i < vec_len (first_node->next_nodes); i++)
952             vlib_node_add_next_with_slot (vm, hw->output_node_index,
953                                           first_node->next_nodes[i], i);
954         }
955     }
956
957   setup_output_node (vm, hw->output_node_index, hw_class);
958   setup_tx_node (vm, hw->tx_node_index, dev_class);
959
960 no_output_nodes:
961   /* Call all up/down callbacks with zero flags when interface is created. */
962   vnet_sw_interface_set_flags_helper (vnm, hw->sw_if_index, /* flags */ 0,
963                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
964   vnet_hw_interface_set_flags_helper (vnm, hw_index, /* flags */ 0,
965                                       VNET_INTERFACE_SET_FLAGS_HELPER_IS_CREATE);
966   vec_free (tx_node_name);
967   vec_free (output_node_name);
968
969   return hw_index;
970 }
971
972 void
973 vnet_delete_hw_interface (vnet_main_t * vnm, u32 hw_if_index)
974 {
975   vnet_interface_main_t *im = &vnm->interface_main;
976   vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
977   vlib_main_t *vm = vnm->vlib_main;
978   vnet_device_class_t *dev_class = vnet_get_device_class (vnm,
979                                                           hw->dev_class_index);
980   /* If it is up, mark it down. */
981   if (hw->flags != 0)
982     vnet_hw_interface_set_flags (vnm, hw_if_index, /* flags */ 0);
983
984   /* Call delete callbacks. */
985   call_hw_interface_add_del_callbacks (vnm, hw_if_index, /* is_create */ 0);
986
987   /* Delete any sub-interfaces. */
988   {
989     u32 id, sw_if_index;
990     /* *INDENT-OFF* */
991     hash_foreach (id, sw_if_index, hw->sub_interface_sw_if_index_by_id,
992     ({
993       vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
994       u64 sup_and_sub_key =
995         ((u64) (si->sup_sw_if_index) << 32) | (u64) si->sub.id;
996       hash_unset_mem_free (&im->sw_if_index_by_sup_and_sub, &sup_and_sub_key);
997       vnet_delete_sw_interface (vnm, sw_if_index);
998     }));
999     hash_free (hw->sub_interface_sw_if_index_by_id);
1000     /* *INDENT-ON* */
1001   }
1002
1003   /* Delete software interface corresponding to hardware interface. */
1004   vnet_delete_sw_interface (vnm, hw->sw_if_index);
1005
1006   if (dev_class->tx_function)
1007     {
1008       /* Put output/tx nodes into recycle pool */
1009       vnet_hw_interface_nodes_t *dn;
1010
1011       /* *INDENT-OFF* */
1012       foreach_vlib_main
1013         ({
1014           vnet_interface_output_runtime_t *rt =
1015             vlib_node_get_runtime_data (this_vlib_main, hw->output_node_index);
1016
1017           /* Mark node runtime as deleted so output node (if called)
1018            * will drop packets. */
1019           rt->is_deleted = 1;
1020         });
1021       /* *INDENT-ON* */
1022
1023       vlib_node_rename (vm, hw->output_node_index,
1024                         "interface-%d-output-deleted", hw_if_index);
1025       vlib_node_rename (vm, hw->tx_node_index, "interface-%d-tx-deleted",
1026                         hw_if_index);
1027       vec_add2 (im->deleted_hw_interface_nodes, dn, 1);
1028       dn->tx_node_index = hw->tx_node_index;
1029       dn->output_node_index = hw->output_node_index;
1030     }
1031
1032   hash_unset_mem (im->hw_interface_by_name, hw->name);
1033   vec_free (hw->name);
1034   vec_free (hw->hw_address);
1035   vec_free (hw->input_node_thread_index_by_queue);
1036   vec_free (hw->dq_runtime_index_by_queue);
1037
1038   pool_put (im->hw_interfaces, hw);
1039 }
1040
1041 void
1042 vnet_hw_interface_walk_sw (vnet_main_t * vnm,
1043                            u32 hw_if_index,
1044                            vnet_hw_sw_interface_walk_t fn, void *ctx)
1045 {
1046   vnet_hw_interface_t *hi;
1047   u32 id, sw_if_index;
1048
1049   hi = vnet_get_hw_interface (vnm, hw_if_index);
1050   /* the super first, then the sub interfaces */
1051   if (WALK_STOP == fn (vnm, hi->sw_if_index, ctx))
1052     return;
1053
1054   /* *INDENT-OFF* */
1055   hash_foreach (id, sw_if_index,
1056                 hi->sub_interface_sw_if_index_by_id,
1057   ({
1058     if (WALK_STOP == fn (vnm, sw_if_index, ctx))
1059       break;
1060   }));
1061   /* *INDENT-ON* */
1062 }
1063
1064 void
1065 vnet_hw_interface_walk (vnet_main_t * vnm,
1066                         vnet_hw_interface_walk_t fn, void *ctx)
1067 {
1068   vnet_interface_main_t *im;
1069   vnet_hw_interface_t *hi;
1070
1071   im = &vnm->interface_main;
1072
1073   /* *INDENT-OFF* */
1074   pool_foreach (hi, im->hw_interfaces,
1075   ({
1076     if (WALK_STOP == fn(vnm, hi->hw_if_index, ctx))
1077       break;
1078   }));
1079   /* *INDENT-ON* */
1080 }
1081
1082 void
1083 vnet_sw_interface_walk (vnet_main_t * vnm,
1084                         vnet_sw_interface_walk_t fn, void *ctx)
1085 {
1086   vnet_interface_main_t *im;
1087   vnet_sw_interface_t *si;
1088
1089   im = &vnm->interface_main;
1090
1091   /* *INDENT-OFF* */
1092   pool_foreach (si, im->sw_interfaces,
1093   {
1094     if (WALK_STOP == fn (vnm, si, ctx))
1095       break;
1096   });
1097   /* *INDENT-ON* */
1098 }
1099
1100 void
1101 vnet_hw_interface_init_for_class (vnet_main_t * vnm, u32 hw_if_index,
1102                                   u32 hw_class_index, u32 hw_instance)
1103 {
1104   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1105   vnet_hw_interface_class_t *hc =
1106     vnet_get_hw_interface_class (vnm, hw_class_index);
1107
1108   hi->hw_class_index = hw_class_index;
1109   hi->hw_instance = hw_instance;
1110   setup_output_node (vnm->vlib_main, hi->output_node_index, hc);
1111 }
1112
1113 static clib_error_t *
1114 vnet_hw_interface_set_class_helper (vnet_main_t * vnm, u32 hw_if_index,
1115                                     u32 hw_class_index, u32 redistribute)
1116 {
1117   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1118   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, hi->sw_if_index);
1119   vnet_hw_interface_class_t *old_class =
1120     vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1121   vnet_hw_interface_class_t *new_class =
1122     vnet_get_hw_interface_class (vnm, hw_class_index);
1123   vnet_device_class_t *dev_class =
1124     vnet_get_device_class (vnm, hi->dev_class_index);
1125   clib_error_t *error = 0;
1126
1127   /* New class equals old class?  Nothing to do. */
1128   if (hi->hw_class_index == hw_class_index)
1129     return 0;
1130
1131   /* No need (and incorrect since admin up flag may be set) to do error checking when
1132      receiving unserialize message. */
1133   if (redistribute)
1134     {
1135       if (si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP)
1136         return clib_error_return (0,
1137                                   "%v must be admin down to change class from %s to %s",
1138                                   hi->name, old_class->name, new_class->name);
1139
1140       /* Make sure interface supports given class. */
1141       if ((new_class->is_valid_class_for_interface
1142            && !new_class->is_valid_class_for_interface (vnm, hw_if_index,
1143                                                         hw_class_index))
1144           || (dev_class->is_valid_class_for_interface
1145               && !dev_class->is_valid_class_for_interface (vnm, hw_if_index,
1146                                                            hw_class_index)))
1147         return clib_error_return (0,
1148                                   "%v class cannot be changed from %s to %s",
1149                                   hi->name, old_class->name, new_class->name);
1150
1151     }
1152
1153   if (old_class->hw_class_change)
1154     old_class->hw_class_change (vnm, hw_if_index, old_class->index,
1155                                 new_class->index);
1156
1157   vnet_hw_interface_init_for_class (vnm, hw_if_index, new_class->index,
1158                                     /* instance */ ~0);
1159
1160   if (new_class->hw_class_change)
1161     new_class->hw_class_change (vnm, hw_if_index, old_class->index,
1162                                 new_class->index);
1163
1164   if (dev_class->hw_class_change)
1165     dev_class->hw_class_change (vnm, hw_if_index, new_class->index);
1166
1167   return error;
1168 }
1169
1170 clib_error_t *
1171 vnet_hw_interface_set_class (vnet_main_t * vnm, u32 hw_if_index,
1172                              u32 hw_class_index)
1173 {
1174   return vnet_hw_interface_set_class_helper (vnm, hw_if_index, hw_class_index,
1175                                              /* redistribute */ 1);
1176 }
1177
1178 static int
1179 vnet_hw_interface_rx_redirect_to_node_helper (vnet_main_t * vnm,
1180                                               u32 hw_if_index,
1181                                               u32 node_index,
1182                                               u32 redistribute)
1183 {
1184   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1185   vnet_device_class_t *dev_class = vnet_get_device_class
1186     (vnm, hi->dev_class_index);
1187
1188   if (dev_class->rx_redirect_to_node)
1189     {
1190       dev_class->rx_redirect_to_node (vnm, hw_if_index, node_index);
1191       return 0;
1192     }
1193
1194   return VNET_API_ERROR_UNIMPLEMENTED;
1195 }
1196
1197 int
1198 vnet_hw_interface_rx_redirect_to_node (vnet_main_t * vnm, u32 hw_if_index,
1199                                        u32 node_index)
1200 {
1201   return vnet_hw_interface_rx_redirect_to_node_helper (vnm, hw_if_index,
1202                                                        node_index,
1203                                                        1 /* redistribute */ );
1204 }
1205
1206 word
1207 vnet_sw_interface_compare (vnet_main_t * vnm,
1208                            uword sw_if_index0, uword sw_if_index1)
1209 {
1210   vnet_sw_interface_t *sup0 = vnet_get_sup_sw_interface (vnm, sw_if_index0);
1211   vnet_sw_interface_t *sup1 = vnet_get_sup_sw_interface (vnm, sw_if_index1);
1212   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, sup0->hw_if_index);
1213   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, sup1->hw_if_index);
1214
1215   if (h0 != h1)
1216     return vec_cmp (h0->name, h1->name);
1217   return (word) h0->hw_instance - (word) h1->hw_instance;
1218 }
1219
1220 word
1221 vnet_hw_interface_compare (vnet_main_t * vnm,
1222                            uword hw_if_index0, uword hw_if_index1)
1223 {
1224   vnet_hw_interface_t *h0 = vnet_get_hw_interface (vnm, hw_if_index0);
1225   vnet_hw_interface_t *h1 = vnet_get_hw_interface (vnm, hw_if_index1);
1226
1227   if (h0 != h1)
1228     return vec_cmp (h0->name, h1->name);
1229   return (word) h0->hw_instance - (word) h1->hw_instance;
1230 }
1231
1232 int
1233 vnet_sw_interface_is_p2p (vnet_main_t * vnm, u32 sw_if_index)
1234 {
1235   vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index);
1236   if ((si->type == VNET_SW_INTERFACE_TYPE_P2P) ||
1237       (si->type == VNET_SW_INTERFACE_TYPE_PIPE))
1238     return 1;
1239
1240   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1241   vnet_hw_interface_class_t *hc =
1242     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1243
1244   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_P2P);
1245 }
1246
1247 int
1248 vnet_sw_interface_is_nbma (vnet_main_t * vnm, u32 sw_if_index)
1249 {
1250   vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, sw_if_index);
1251   vnet_hw_interface_class_t *hc =
1252     vnet_get_hw_interface_class (vnm, hw->hw_class_index);
1253
1254   return (hc->flags & VNET_HW_INTERFACE_CLASS_FLAG_NBMA);
1255 }
1256
1257 clib_error_t *
1258 vnet_interface_init (vlib_main_t * vm)
1259 {
1260   vnet_main_t *vnm = vnet_get_main ();
1261   vnet_interface_main_t *im = &vnm->interface_main;
1262   vlib_buffer_t *b = 0;
1263   vnet_buffer_opaque_t *o = 0;
1264   clib_error_t *error;
1265
1266   /*
1267    * Keep people from shooting themselves in the foot.
1268    */
1269   if (sizeof (b->opaque) != sizeof (vnet_buffer_opaque_t))
1270     {
1271 #define _(a) if (sizeof(o->a) > sizeof (o->unused))                     \
1272       clib_warning                                                      \
1273         ("FATAL: size of opaque union subtype %s is %d (max %d)",       \
1274          #a, sizeof(o->a), sizeof (o->unused));
1275       foreach_buffer_opaque_union_subtype;
1276 #undef _
1277
1278       return clib_error_return
1279         (0, "FATAL: size of vlib buffer opaque %d, size of vnet opaque %d",
1280          sizeof (b->opaque), sizeof (vnet_buffer_opaque_t));
1281     }
1282
1283   clib_spinlock_init (&im->sw_if_counter_lock);
1284   clib_spinlock_lock (&im->sw_if_counter_lock); /* should be no need */
1285
1286   vec_validate (im->sw_if_counters, VNET_N_SIMPLE_INTERFACE_COUNTER - 1);
1287 #define _(E,n,p)                                                        \
1288   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;             \
1289   im->sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1290   foreach_simple_interface_counter_name
1291 #undef _
1292     vec_validate (im->combined_sw_if_counters,
1293                   VNET_N_COMBINED_INTERFACE_COUNTER - 1);
1294 #define _(E,n,p)                                                        \
1295   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].name = #n;    \
1296   im->combined_sw_if_counters[VNET_INTERFACE_COUNTER_##E].stat_segment_name = "/" #p "/" #n;
1297   foreach_combined_interface_counter_name
1298 #undef _
1299     clib_spinlock_unlock (&im->sw_if_counter_lock);
1300
1301   im->device_class_by_name = hash_create_string ( /* size */ 0,
1302                                                  sizeof (uword));
1303   {
1304     vnet_device_class_t *c;
1305
1306     c = vnm->device_class_registrations;
1307
1308     while (c)
1309       {
1310         c->index = vec_len (im->device_classes);
1311         hash_set_mem (im->device_class_by_name, c->name, c->index);
1312
1313         if (c->tx_fn_registrations)
1314           {
1315             vlib_node_fn_registration_t *fnr = c->tx_fn_registrations;
1316             int priority = -1;
1317
1318             /* to avoid confusion, please remove ".tx_function" statement
1319                from VNET_DEVICE_CLASS() if using function candidates */
1320             ASSERT (c->tx_function == 0);
1321
1322             while (fnr)
1323               {
1324                 if (fnr->priority > priority)
1325                   {
1326                     priority = fnr->priority;
1327                     c->tx_function = fnr->function;
1328                   }
1329                 fnr = fnr->next_registration;
1330               }
1331           }
1332
1333         vec_add1 (im->device_classes, c[0]);
1334         c = c->next_class_registration;
1335       }
1336   }
1337
1338   im->hw_interface_class_by_name = hash_create_string ( /* size */ 0,
1339                                                        sizeof (uword));
1340
1341   im->sw_if_index_by_sup_and_sub = hash_create_mem (0, sizeof (u64),
1342                                                     sizeof (uword));
1343   {
1344     vnet_hw_interface_class_t *c;
1345
1346     c = vnm->hw_interface_class_registrations;
1347
1348     while (c)
1349       {
1350         c->index = vec_len (im->hw_interface_classes);
1351         hash_set_mem (im->hw_interface_class_by_name, c->name, c->index);
1352
1353         if (NULL == c->build_rewrite)
1354           c->build_rewrite = default_build_rewrite;
1355         if (NULL == c->update_adjacency)
1356           c->update_adjacency = default_update_adjacency;
1357
1358         vec_add1 (im->hw_interface_classes, c[0]);
1359         c = c->next_class_registration;
1360       }
1361   }
1362
1363   /* init per-thread data */
1364   vec_validate_aligned (im->per_thread_data, vlib_num_workers (),
1365                         CLIB_CACHE_LINE_BYTES);
1366
1367   if ((error = vlib_call_init_function (vm, vnet_interface_cli_init)))
1368     return error;
1369
1370   vnm->interface_tag_by_sw_if_index = hash_create (0, sizeof (uword));
1371
1372 #if VLIB_BUFFER_TRACE_TRAJECTORY > 0
1373   if ((error = vlib_call_init_function (vm, trajectory_trace_init)))
1374     return error;
1375 #endif
1376
1377   return 0;
1378 }
1379
1380 VLIB_INIT_FUNCTION (vnet_interface_init);
1381
1382 /* Kludge to renumber interface names [only!] */
1383 int
1384 vnet_interface_name_renumber (u32 sw_if_index, u32 new_show_dev_instance)
1385 {
1386   int rv;
1387   vnet_main_t *vnm = vnet_get_main ();
1388   vnet_interface_main_t *im = &vnm->interface_main;
1389   vnet_hw_interface_t *hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
1390
1391   vnet_device_class_t *dev_class = vnet_get_device_class
1392     (vnm, hi->dev_class_index);
1393
1394   if (dev_class->name_renumber == 0 || dev_class->format_device_name == 0)
1395     return VNET_API_ERROR_UNIMPLEMENTED;
1396
1397   rv = dev_class->name_renumber (hi, new_show_dev_instance);
1398
1399   if (rv)
1400     return rv;
1401
1402   hash_unset_mem (im->hw_interface_by_name, hi->name);
1403   vec_free (hi->name);
1404   /* Use the mapping we set up to call it Ishmael */
1405   hi->name = format (0, "%U", dev_class->format_device_name,
1406                      hi->dev_instance);
1407
1408   hash_set_mem (im->hw_interface_by_name, hi->name, hi->hw_if_index);
1409   return rv;
1410 }
1411
1412 clib_error_t *
1413 vnet_rename_interface (vnet_main_t * vnm, u32 hw_if_index, char *new_name)
1414 {
1415   vnet_interface_main_t *im = &vnm->interface_main;
1416   vlib_main_t *vm = vnm->vlib_main;
1417   vnet_hw_interface_t *hw;
1418   u8 *old_name;
1419   clib_error_t *error = 0;
1420
1421   hw = vnet_get_hw_interface (vnm, hw_if_index);
1422   if (!hw)
1423     {
1424       return clib_error_return (0,
1425                                 "unable to find hw interface for index %u",
1426                                 hw_if_index);
1427     }
1428
1429   old_name = hw->name;
1430
1431   /* set new hw->name */
1432   hw->name = format (0, "%s", new_name);
1433
1434   /* remove the old name to hw_if_index mapping and install the new one */
1435   hash_unset_mem (im->hw_interface_by_name, old_name);
1436   hash_set_mem (im->hw_interface_by_name, hw->name, hw_if_index);
1437
1438   /* rename tx/output nodes */
1439   vlib_node_rename (vm, hw->tx_node_index, "%v-tx", hw->name);
1440   vlib_node_rename (vm, hw->output_node_index, "%v-output", hw->name);
1441
1442   /* free the old name vector */
1443   vec_free (old_name);
1444
1445   return error;
1446 }
1447
1448 clib_error_t *
1449 vnet_hw_interface_add_del_mac_address (vnet_main_t * vnm,
1450                                        u32 hw_if_index,
1451                                        const u8 * mac_address, u8 is_add)
1452 {
1453   clib_error_t *error = 0;
1454   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1455
1456   vnet_device_class_t *dev_class =
1457     vnet_get_device_class (vnm, hi->dev_class_index);
1458
1459   if (!hi->hw_address)
1460     {
1461       error =
1462         clib_error_return
1463         (0, "Secondary MAC Addresses not supported for interface index %u",
1464          hw_if_index);
1465       goto done;
1466     }
1467
1468   if (dev_class->mac_addr_add_del_function)
1469     error = dev_class->mac_addr_add_del_function (hi, mac_address, is_add);
1470
1471   if (!error)
1472     {
1473       vnet_hw_interface_class_t *hw_class;
1474
1475       hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1476
1477       if (NULL != hw_class->mac_addr_add_del_function)
1478         error = hw_class->mac_addr_add_del_function (hi, mac_address, is_add);
1479     }
1480
1481   /* If no errors, add to the list of secondary MACs on the ethernet intf */
1482   if (!error)
1483     ethernet_interface_add_del_address (&ethernet_main, hw_if_index,
1484                                         mac_address, is_add);
1485
1486 done:
1487   return error;
1488 }
1489
1490 static clib_error_t *
1491 vnet_hw_interface_change_mac_address_helper (vnet_main_t * vnm,
1492                                              u32 hw_if_index,
1493                                              const u8 * mac_address)
1494 {
1495   clib_error_t *error = 0;
1496   vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
1497
1498   if (hi->hw_address)
1499     {
1500       u8 *old_address = vec_dup (hi->hw_address);
1501       vnet_device_class_t *dev_class =
1502         vnet_get_device_class (vnm, hi->dev_class_index);
1503       if (dev_class->mac_addr_change_function)
1504         {
1505           error =
1506             dev_class->mac_addr_change_function (hi, old_address,
1507                                                  mac_address);
1508         }
1509       if (!error)
1510         {
1511           vnet_hw_interface_class_t *hw_class;
1512
1513           hw_class = vnet_get_hw_interface_class (vnm, hi->hw_class_index);
1514
1515           if (NULL != hw_class->mac_addr_change_function)
1516             hw_class->mac_addr_change_function (hi, old_address, mac_address);
1517         }
1518       else
1519         {
1520           error =
1521             clib_error_return (0,
1522                                "MAC Address Change is not supported on this interface");
1523         }
1524       vec_free (old_address);
1525     }
1526   else
1527     {
1528       error =
1529         clib_error_return (0,
1530                            "mac address change is not supported for interface index %u",
1531                            hw_if_index);
1532     }
1533   return error;
1534 }
1535
1536 clib_error_t *
1537 vnet_hw_interface_change_mac_address (vnet_main_t * vnm, u32 hw_if_index,
1538                                       const u8 * mac_address)
1539 {
1540   return vnet_hw_interface_change_mac_address_helper
1541     (vnm, hw_if_index, mac_address);
1542 }
1543
1544 /* update the unnumbered state of an interface*/
1545 void
1546 vnet_sw_interface_update_unnumbered (u32 unnumbered_sw_if_index,
1547                                      u32 ip_sw_if_index, u8 enable)
1548 {
1549   vnet_main_t *vnm = vnet_get_main ();
1550   vnet_sw_interface_t *si;
1551   u32 was_unnum;
1552
1553   si = vnet_get_sw_interface (vnm, unnumbered_sw_if_index);
1554   was_unnum = (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1555
1556   if (enable)
1557     {
1558       si->flags |= VNET_SW_INTERFACE_FLAG_UNNUMBERED;
1559       si->unnumbered_sw_if_index = ip_sw_if_index;
1560
1561       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1562         [unnumbered_sw_if_index] =
1563         ip4_main.
1564         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1565       ip6_main.
1566         lookup_main.if_address_pool_index_by_sw_if_index
1567         [unnumbered_sw_if_index] =
1568         ip6_main.
1569         lookup_main.if_address_pool_index_by_sw_if_index[ip_sw_if_index];
1570     }
1571   else
1572     {
1573       si->flags &= ~(VNET_SW_INTERFACE_FLAG_UNNUMBERED);
1574       si->unnumbered_sw_if_index = (u32) ~ 0;
1575
1576       ip4_main.lookup_main.if_address_pool_index_by_sw_if_index
1577         [unnumbered_sw_if_index] = ~0;
1578       ip6_main.lookup_main.if_address_pool_index_by_sw_if_index
1579         [unnumbered_sw_if_index] = ~0;
1580     }
1581
1582   if (was_unnum != (si->flags & VNET_SW_INTERFACE_FLAG_UNNUMBERED))
1583     {
1584       ip4_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1585       ip6_sw_interface_enable_disable (unnumbered_sw_if_index, enable);
1586     }
1587 }
1588
1589 vnet_l3_packet_type_t
1590 vnet_link_to_l3_proto (vnet_link_t link)
1591 {
1592   switch (link)
1593     {
1594     case VNET_LINK_IP4:
1595       return (VNET_L3_PACKET_TYPE_IP4);
1596     case VNET_LINK_IP6:
1597       return (VNET_L3_PACKET_TYPE_IP6);
1598     case VNET_LINK_MPLS:
1599       return (VNET_L3_PACKET_TYPE_MPLS);
1600     case VNET_LINK_ARP:
1601       return (VNET_L3_PACKET_TYPE_ARP);
1602     case VNET_LINK_ETHERNET:
1603     case VNET_LINK_NSH:
1604       ASSERT (0);
1605       break;
1606     }
1607   ASSERT (0);
1608   return (0);
1609 }
1610
1611 vnet_mtu_t
1612 vnet_link_to_mtu (vnet_link_t link)
1613 {
1614   switch (link)
1615     {
1616     case VNET_LINK_IP4:
1617       return (VNET_MTU_IP4);
1618     case VNET_LINK_IP6:
1619       return (VNET_MTU_IP6);
1620     case VNET_LINK_MPLS:
1621       return (VNET_MTU_MPLS);
1622     default:
1623       return (VNET_MTU_L3);
1624     }
1625 }
1626
1627 u8 *
1628 default_build_rewrite (vnet_main_t * vnm,
1629                        u32 sw_if_index,
1630                        vnet_link_t link_type, const void *dst_address)
1631 {
1632   return (NULL);
1633 }
1634
1635 void
1636 default_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, u32 ai)
1637 {
1638   ip_adjacency_t *adj;
1639
1640   adj = adj_get (ai);
1641
1642   switch (adj->lookup_next_index)
1643     {
1644     case IP_LOOKUP_NEXT_GLEAN:
1645       adj_glean_update_rewrite (ai);
1646       break;
1647     case IP_LOOKUP_NEXT_ARP:
1648     case IP_LOOKUP_NEXT_BCAST:
1649       /*
1650        * default rewrite in neighbour adj
1651        */
1652       adj_nbr_update_rewrite
1653         (ai,
1654          ADJ_NBR_REWRITE_FLAG_COMPLETE,
1655          vnet_build_rewrite_for_sw_interface (vnm,
1656                                               sw_if_index,
1657                                               adj_get_link_type (ai), NULL));
1658       break;
1659     case IP_LOOKUP_NEXT_MCAST:
1660       /*
1661        * mcast traffic also uses default rewrite string with no mcast
1662        * switch time updates.
1663        */
1664       adj_mcast_update_rewrite
1665         (ai,
1666          vnet_build_rewrite_for_sw_interface (vnm,
1667                                               sw_if_index,
1668                                               adj_get_link_type (ai),
1669                                               NULL), 0);
1670       break;
1671     case IP_LOOKUP_NEXT_DROP:
1672     case IP_LOOKUP_NEXT_PUNT:
1673     case IP_LOOKUP_NEXT_LOCAL:
1674     case IP_LOOKUP_NEXT_REWRITE:
1675     case IP_LOOKUP_NEXT_MCAST_MIDCHAIN:
1676     case IP_LOOKUP_NEXT_MIDCHAIN:
1677     case IP_LOOKUP_NEXT_ICMP_ERROR:
1678     case IP_LOOKUP_N_NEXT:
1679       ASSERT (0);
1680       break;
1681     }
1682 }
1683
1684 clib_error_t *
1685 vnet_hw_interface_set_rss_queues (vnet_main_t * vnm,
1686                                   vnet_hw_interface_t * hi,
1687                                   clib_bitmap_t * bitmap)
1688 {
1689   clib_error_t *error = 0;
1690   vnet_device_class_t *dev_class =
1691     vnet_get_device_class (vnm, hi->dev_class_index);
1692
1693   if (dev_class->set_rss_queues_function)
1694     {
1695       if (clib_bitmap_count_set_bits (bitmap) == 0)
1696         {
1697           error = clib_error_return (0,
1698                                      "must assign at least one valid rss queue");
1699           goto done;
1700         }
1701
1702       error = dev_class->set_rss_queues_function (vnm, hi, bitmap);
1703     }
1704   else
1705     {
1706       error = clib_error_return (0,
1707                                  "setting rss queues is not supported on this interface");
1708     }
1709
1710   if (!error)
1711     {
1712       clib_bitmap_free (hi->rss_queues);
1713       hi->rss_queues = clib_bitmap_dup (bitmap);
1714     }
1715
1716 done:
1717   return error;
1718 }
1719
/* Non-zero while detailed interface statistics collection is enabled. */
int collect_detailed_interface_stats_flag = 0;

/* Single place where the flag is written. */
static void
collect_detailed_interface_stats_flag_store (int enabled)
{
  collect_detailed_interface_stats_flag = enabled;
}

/* Turn detailed interface statistics collection on. */
void
collect_detailed_interface_stats_flag_set (void)
{
  collect_detailed_interface_stats_flag_store (1);
}

/* Turn detailed interface statistics collection off. */
void
collect_detailed_interface_stats_flag_clear (void)
{
  collect_detailed_interface_stats_flag_store (0);
}
1733
1734 static clib_error_t *
1735 collect_detailed_interface_stats_cli (vlib_main_t * vm,
1736                                       unformat_input_t * input,
1737                                       vlib_cli_command_t * cmd)
1738 {
1739   unformat_input_t _line_input, *line_input = &_line_input;
1740   clib_error_t *error = NULL;
1741
1742   /* Get a line of input. */
1743   if (!unformat_user (input, unformat_line_input, line_input))
1744     return clib_error_return (0, "expected enable | disable");
1745
1746   while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1747     {
1748       if (unformat (line_input, "enable") || unformat (line_input, "on"))
1749         collect_detailed_interface_stats_flag_set ();
1750       else if (unformat (line_input, "disable")
1751                || unformat (line_input, "off"))
1752         collect_detailed_interface_stats_flag_clear ();
1753       else
1754         {
1755           error = clib_error_return (0, "unknown input `%U'",
1756                                      format_unformat_error, line_input);
1757           goto done;
1758         }
1759     }
1760
1761 done:
1762   unformat_free (line_input);
1763   return error;
1764 }
1765
/*
 * Registers the "interface collect detailed-stats" CLI command and binds
 * it to collect_detailed_interface_stats_cli.
 */
/* *INDENT-OFF* */
VLIB_CLI_COMMAND (collect_detailed_interface_stats_command, static) = {
  .path = "interface collect detailed-stats",
  .short_help = "interface collect detailed-stats <enable|disable>",
  .function = collect_detailed_interface_stats_cli,
};
/* *INDENT-ON* */
1773
1774 /*
1775  * fd.io coding-style-patch-verification: ON
1776  *
1777  * Local Variables:
1778  * eval: (c-set-style "gnu")
1779  * End:
1780  */