2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 * node.c: VLIB processing nodes
18 * Copyright (c) 2008 Eliot Dresselhaus
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
40 #include <vlib/vlib.h>
41 #include <vlib/threads.h>
43 /* Query node given name. */
/* Look up a node by its name.
 *
 * A key is produced with format (0, "%s", key), probed in the
 * nm->node_by_name hash, and the value found there is used as an index
 * into nm->nodes.  Yields 0 when the hash has no entry for the key.
 *
 * NOTE(review): the declarations of `key` and `p`, and whatever releases
 * the formatted key, are not visible in this excerpt -- confirm against
 * the complete file. */
45 vlib_get_node_by_name (vlib_main_t * vm, u8 * name)
47 vlib_node_main_t *nm = &vm->node_main;
50 key = format (0, "%s", key);
51 p = hash_get (nm->node_by_name, key);
54 return p ? vec_elt (nm->nodes, p[0]) : 0;
/* Refresh the event-log strings that are derived from a node's name.
 *
 * For the node at node_index, a "<name>-call: ..." format is stored in
 * the matching entry of vm->node_call_elog_event_types and a
 * "<name>-return: ..." format in vm->node_return_elog_event_types; the
 * name is then handed to elog_string ().  Each format call ends with
 * "%c" fed by a 0 argument, i.e. a zero byte is appended to the result
 * (the doubled %% is presumably emitted as a single literal percent).
 *
 * NOTE(review): the declaration of `t`, any release of the previous
 * t->format values, and the destination of the elog_string () result
 * are not visible in this excerpt. */
58 node_set_elog_name (vlib_main_t * vm, uword node_index)
60 vlib_node_t *n = vlib_get_node (vm, node_index);
/* Event type used when the node function is called. */
63 t = vec_elt_at_index (vm->node_call_elog_event_types, node_index);
65 t->format = (char *) format (0, "%v-call: %%d%c", n->name, 0);
/* Event type used when the node function returns. */
67 t = vec_elt_at_index (vm->node_return_elog_event_types, node_index);
69 t->format = (char *) format (0, "%v-return: %%d%c", n->name, 0);
72 elog_string (&vlib_global_main.elog_main, "%v%c", n->name, 0);
/* Rename the node at node_index using a printf-style format.
 *
 * The current name is removed from nm->node_by_name, n->name is replaced
 * by the vector produced by va_format (), the new name is inserted into
 * the hash mapped to n->index, and the elog strings are rebuilt from the
 * new name before the worker threads are asked to update.
 *
 * NOTE(review): the va_list setup/teardown and any release of the old
 * name vector are not visible in this excerpt. */
76 vlib_node_rename (vlib_main_t * vm, u32 node_index, char *fmt, ...)
79 vlib_node_main_t *nm = &vm->node_main;
80 vlib_node_t *n = vlib_get_node (vm, node_index);
/* The hash is keyed by name, so the old key must go before n->name
 * changes. */
83 hash_unset (nm->node_by_name, n->name);
85 n->name = va_format (0, fmt, &va);
87 hash_set (nm->node_by_name, n->name, n->index);
89 node_set_elog_name (vm, node_index);
91 /* Propagate the change to all worker threads */
92 vlib_worker_thread_node_runtime_update ();
/* Bring the runtime next-frame state of node `node_index` in line with
 * node->next_nodes, then wire up next slot `next_index`.
 *
 * n_insert is the difference between the node's current number of next
 * nodes and the count recorded in its runtime.  That many entries are
 * inserted into nm->next_frames immediately after the node's existing
 * range, and every next_frame_index stored elsewhere (other node
 * runtimes, pending frames, suspended process frames) that is at or past
 * the insertion point is shifted by n_insert.  Finally the next frame
 * for `next_index` is pointed at the next node's runtime_index and the
 * worker threads are asked to update.
 *
 * NOTE(review): the declarations of i, j and n_insert, and any guard
 * around the insertion, are not visible in this excerpt. */
96 vlib_node_runtime_update (vlib_main_t * vm, u32 node_index, u32 next_index)
98 vlib_node_main_t *nm = &vm->node_main;
99 vlib_node_runtime_t *r, *s;
100 vlib_node_t *node, *next_node;
101 vlib_next_frame_t *nf;
102 vlib_pending_frame_t *pf;
105 node = vec_elt (nm->nodes, node_index);
106 r = vlib_node_get_runtime (vm, node_index);
/* Next slots present on the node but not yet known to its runtime. */
108 n_insert = vec_len (node->next_nodes) - r->n_next_nodes;
/* Insertion point: one past this node's current next frames. */
111 i = r->next_frame_index + r->n_next_nodes;
112 vec_insert (nm->next_frames, n_insert, i);
114 /* Initialize newly inserted next frames. */
115 for (j = 0; j < n_insert; j++)
116 vlib_next_frame_init (nm->next_frames + i + j);
118 /* Relocate other next frames at higher indices. */
119 for (j = 0; j < vec_len (nm->nodes); j++)
121 s = vlib_node_get_runtime (vm, j);
122 if (j != node_index && s->next_frame_index >= i)
123 s->next_frame_index += n_insert;
126 /* Pending frames may need to be relocated also. */
127 vec_foreach (pf, nm->pending_frames)
129 if (pf->next_frame_index != VLIB_PENDING_FRAME_NO_NEXT_FRAME
130 && pf->next_frame_index >= i)
131 pf->next_frame_index += n_insert;
/* Same relocation for the frames held in nm->suspended_process_frames.
 * NOTE(review): this loop tests against ~0 while the loop above tests
 * against VLIB_PENDING_FRAME_NO_NEXT_FRAME -- presumably the same
 * sentinel; confirm. */
134 pool_foreach (pf, nm->suspended_process_frames) {
135 if (pf->next_frame_index != ~0 && pf->next_frame_index >= i)
136 pf->next_frame_index += n_insert;
/* The runtime now covers every next slot of the node. */
140 r->n_next_nodes = vec_len (node->next_nodes);
143 /* Set frame's node runtime index. */
144 next_node = vlib_get_node (vm, node->next_nodes[next_index]);
145 nf = nm->next_frames + r->next_frame_index + next_index;
146 nf->node_runtime_index = next_node->runtime_index;
148 vlib_worker_thread_node_runtime_update ();
/* Find the next slot of node `node_index` that leads to
 * `next_node_index`, using the node's next_slot_by_node hash.
 * Asserts that the node runtime has been started.
 *
 * NOTE(review): the declarations of `node` and `p` and both return
 * paths are not visible in this excerpt -- confirm what is returned
 * when the hash has no entry for next_node_index. */
152 vlib_node_get_next (vlib_main_t * vm, uword node_index, uword next_node_index)
154 vlib_node_main_t *nm = &vm->node_main;
158 node = vec_elt (nm->nodes, node_index);
160 /* Runtime has to be initialized. */
161 ASSERT (nm->flags & VLIB_NODE_MAIN_RUNTIME_STARTED);
163 if ((p = hash_get (node->next_slot_by_node, next_node_index)))
171 /* Add next node to given node in given slot. */
/* Asserted preconditions: the caller runs on thread index 0 and the node
 * runtime has been started.
 *
 * If the node already has a slot recorded for next_node_index, the
 * requested slot is asserted to equal it.  Otherwise, between the worker
 * thread barrier sync and release:
 *   - slot may be taken from vec_len (node->next_nodes) (NOTE(review):
 *     the condition guarding that assignment is not visible here);
 *   - next_nodes and n_vectors_by_next_node are grown to cover the slot;
 *   - a next node already stored in the slot is removed from
 *     next_slot_by_node and has node_index cleared in its
 *     prev_node_bitmap;
 *   - the new next is stored in the slot and in next_slot_by_node, and
 *     the runtime is updated for that slot;
 *   - the new next node's prev_node_bitmap is updated (presumably with
 *     node_index; the argument line is not visible);
 *   - the same next/slot is added, recursively, to every other node in
 *     node->sibling_bitmap, asserting each ends up with the same slot.
 *
 * NOTE(review): the first parameter line, the declarations of `p` and
 * old_next_index, and the return statements are not visible in this
 * excerpt. */
173 vlib_node_add_next_with_slot (vlib_main_t * vm,
175 uword next_node_index, uword slot)
177 vlib_node_main_t *nm = &vm->node_main;
178 vlib_node_t *node, *next, *old_next;
182 ASSERT (vlib_get_thread_index () == 0);
184 node = vec_elt (nm->nodes, node_index);
185 next = vec_elt (nm->nodes, next_node_index);
187 /* Runtime has to be initialized. */
188 ASSERT (nm->flags & VLIB_NODE_MAIN_RUNTIME_STARTED);
190 if ((p = hash_get (node->next_slot_by_node, next_node_index)))
192 /* Next already exists: slot must match. */
194 ASSERT (slot == p[0]);
198 vlib_worker_thread_barrier_sync (vm);
201 slot = vec_len (node->next_nodes);
203 vec_validate_init_empty (node->next_nodes, slot, ~0);
204 vec_validate (node->n_vectors_by_next_node, slot);
/* ~0 is the fill value used just above, so any other value means the
 * slot already held a next node that is now being replaced. */
206 if ((old_next_index = node->next_nodes[slot]) != ~0u)
208 hash_unset (node->next_slot_by_node, old_next_index);
209 old_next = vlib_get_node (vm, old_next_index);
210 old_next->prev_node_bitmap =
211 clib_bitmap_andnoti (old_next->prev_node_bitmap, node_index);
214 node->next_nodes[slot] = next_node_index;
215 hash_set (node->next_slot_by_node, next_node_index, slot);
217 vlib_node_runtime_update (vm, node_index, slot);
219 next->prev_node_bitmap = clib_bitmap_ori (next->prev_node_bitmap,
222 /* Siblings all get same node structure. */
224 uword sib_node_index, sib_slot;
225 vlib_node_t *sib_node;
227 clib_bitmap_foreach (sib_node_index, node->sibling_bitmap) {
228 sib_node = vec_elt (nm->nodes, sib_node_index);
229 if (sib_node != node)
231 sib_slot = vlib_node_add_next_with_slot (vm, sib_node_index, next_node_index, slot);
232 ASSERT (sib_slot == slot);
238 vlib_worker_thread_barrier_release (vm);
242 /* Add named next node to given node in given slot. */
/* The name is resolved with vlib_get_node_by_name (); the final visible
 * statement forwards the resolved index to
 * vlib_node_add_next_with_slot ().
 *
 * The statements in between store the name pointer itself (no copy) in
 * n->next_node_names[slot], with slot computed as the larger of the
 * lengths of next_node_names and next_nodes.  vlib_node_main_init ()
 * treats a ~0 result from this function as "unknown node".
 *
 * NOTE(review): the assignment of `nm` and the conditions and returns
 * around the RUNTIME_STARTED test and the name-parking statements are
 * not visible in this excerpt; presumably they form the path taken when
 * the name does not resolve -- confirm against the complete file. */
244 vlib_node_add_named_next_with_slot (vlib_main_t * vm,
245 uword node, char *name, uword slot)
247 vlib_node_main_t *nm;
248 vlib_node_t *n, *n_next;
251 n = vlib_get_node (vm, node);
253 n_next = vlib_get_node_by_name (vm, (u8 *) name);
256 if (nm->flags & VLIB_NODE_MAIN_RUNTIME_STARTED)
260 slot = clib_max (vec_len (n->next_node_names),
261 vec_len (n->next_nodes));
262 vec_validate (n->next_node_names, slot);
263 n->next_node_names[slot] = name;
267 return vlib_node_add_next_with_slot (vm, node, n_next->index, slot);
/* Create the two elog event-type entries for node `ni`.
 *
 * A zero-filled template `t` is stored at index ni of both
 * vm->node_call_elog_event_types and vm->node_return_elog_event_types
 * (vec_validate grows each vector to reach that index first);
 * node_set_elog_name () is then called for the node.
 *
 * NOTE(review): the declaration of `t` is not visible in this excerpt. */
271 node_elog_init (vlib_main_t * vm, uword ni)
275 clib_memset (&t, 0, sizeof (t));
277 /* 2 event types for this node: one when node function is called.
278 One when it returns. */
279 vec_validate (vm->node_call_elog_event_types, ni);
280 vm->node_call_elog_event_types[ni] = t;
282 vec_validate (vm->node_return_elog_event_types, ni);
283 vm->node_return_elog_event_types[ni] = t;
285 node_set_elog_name (vm, ni);
/* STACK_ALIGN has two alternative definitions: the memory page size or
 * the cache line size.
 * NOTE(review): the preprocessor conditional that selects between them
 * is not visible in this excerpt, and STACK_ALIGN is not referenced in
 * the visible part of this file. */
289 #define STACK_ALIGN (clib_mem_get_page_size())
291 #define STACK_ALIGN CLIB_CACHE_LINE_BYTES
/* Choose which registered function variant of a node to use.
 *
 * When nm->node_fn_default_march_variant is set (not ~0), the
 * registration list is scanned for an entry whose march_variant equals
 * that default.  A second scan walks the list, looks up each entry's
 * variant in nm->variants, and tracks the largest priority seen.
 *
 * NOTE(review): the loop headers, the assignments to `fn`, the
 * declaration and starting value of `priority`, and the return are not
 * visible in this excerpt.  Presumably the default variant's function is
 * returned when found, otherwise that of the highest-priority variant --
 * confirm against the complete file. */
294 vlib_node_function_t *
295 vlib_node_get_preferred_node_fn_variant (vlib_main_t *vm,
296 vlib_node_fn_registration_t *regs)
298 vlib_node_main_t *nm = &vm->node_main;
299 vlib_node_fn_registration_t *r;
300 vlib_node_fn_variant_t *v;
301 vlib_node_function_t *fn = 0;
/* ~0 means no default march variant has been chosen. */
304 if (nm->node_fn_default_march_variant != ~0)
309 if (r->march_variant == nm->node_fn_default_march_variant)
311 r = r->next_registration;
/* Priority-based selection over the registration list. */
318 v = vec_elt_at_index (nm->variants, r->march_variant);
319 if (v->priority > priority)
321 priority = v->priority;
324 r = r->next_registration;
/* Create a vlib_node_t and its runtime from registration `r`.
 *
 * Visible steps, in order:
 *  - when function variants are registered, r->function must be 0 and
 *    vlib_node_get_preferred_node_fn_variant () is called (the
 *    assignment of its result is not visible); a non-null r->function is
 *    then asserted;
 *  - the node is allocated, zeroed, given the next free index in
 *    nm->nodes and appended to that vector;
 *  - the name is stored as a vector, a duplicate name is reported with
 *    clib_error, and the name is added to nm->node_by_name;
 *  - error counters and elog event types are registered;
 *  - runtime data and next node names are copied from the registration
 *    and next_nodes / n_vectors_by_next_node are sized;
 *  - a process node gets a vlib_process_t with a mapped stack and is
 *    appended to nm->processes; the other visible branch appends a
 *    runtime to nm->nodes_by_type[n->type];
 *  - the runtime is filled in (function, flags, state, node index, next
 *    frames, error indices, runtime data).
 *
 * NOTE(review): many short lines (declarations, braces, else branches,
 * the field-copy macro uses, the return) are not visible in this
 * excerpt; the summary above covers only what is shown. */
332 register_node (vlib_main_t * vm, vlib_node_registration_t * r)
334 vlib_node_main_t *nm = &vm->node_main;
340 /* Default (0) type should match INTERNAL. */
341 vlib_node_t zero = { 0 };
342 ASSERT (VLIB_NODE_TYPE_INTERNAL == zero.type);
345 if (r->node_fn_registrations)
347 /* to avoid confusion, please remove ".function " statement from
348 CLIB_NODE_REGISTRATION() if using function candidates */
349 ASSERT (r->function == 0);
352 vlib_node_get_preferred_node_fn_variant (vm, r->node_fn_registrations);
355 ASSERT (r->function != 0);
357 n = clib_mem_alloc_no_fail (sizeof (n[0]));
358 clib_memset (n, 0, sizeof (n[0]));
/* The node's index is its position in nm->nodes. */
359 n->index = vec_len (nm->nodes);
360 n->node_fn_registrations = r->node_fn_registrations;
361 n->protocol_hint = r->protocol_hint;
363 vec_add1 (nm->nodes, n);
365 /* Name is always a vector so it can be formatted with %v. */
/* A registration name that is already a heap object is duplicated as a
 * vector; the other visible assignment formats it from a C string. */
366 if (clib_mem_is_heap_object (vec_header (r->name, 0)))
367 n->name = vec_dup ((u8 *) r->name);
369 n->name = format (0, "%s", r->name);
371 if (!nm->node_by_name)
372 nm->node_by_name = hash_create_vec ( /* size */ 32,
373 sizeof (n->name[0]), sizeof (uword));
375 /* Node names must be unique. */
377 /* vlib_get_node_by_name() expects NULL-terminated strings */
378 u8 *name = format (0, "%v%c", n->name, 0);
379 vlib_node_t *o = vlib_get_node_by_name (vm, name);
382 clib_error ("more than one node named `%v'", n->name);
385 hash_set (nm->node_by_name, n->name, n->index);
387 r->index = n->index; /* save index in registration */
388 n->function = r->function;
390 /* Node index of next sibling will be filled in by vlib_node_main_init. */
391 n->sibling_of = r->sibling_of;
392 if (r->sibling_of && r->n_next_nodes > 0)
393 clib_error ("sibling node should not have any next nodes `%v'", n->name);
395 if (r->type == VLIB_NODE_TYPE_INTERNAL)
396 ASSERT (r->vector_size > 0);
/* Shorthand that copies one field from the registration to the node. */
398 #define _(f) n->f = r->f
410 /* Register error counters. */
411 vlib_register_errors (vm, n->index, r->n_errors, r->error_strings,
413 node_elog_init (vm, n->index);
415 _(runtime_data_bytes);
416 if (r->runtime_data_bytes > 0)
418 vec_resize (n->runtime_data, r->runtime_data_bytes);
420 clib_memcpy (n->runtime_data, r->runtime_data, r->runtime_data_bytes);
/* Next nodes are kept by name here; vlib_node_main_init () resolves
 * the names into indices. */
423 vec_resize (n->next_node_names, r->n_next_nodes);
424 for (i = 0; i < r->n_next_nodes; i++)
425 n->next_node_names[i] = r->next_nodes[i];
/* Every next slot starts out as ~0.
 * NOTE(review): with r->n_next_nodes == 0 the index argument below is
 * 0 - 1; confirm vec_validate handles that wrapped value as intended. */
427 vec_validate_init_empty (n->next_nodes, r->n_next_nodes - 1, ~0);
428 vec_validate (n->n_vectors_by_next_node, r->n_next_nodes - 1);
430 n->owner_node_index = n->owner_next_index = ~0;
432 /* Initialize node runtime. */
434 vlib_node_runtime_t *rt;
437 if (n->type == VLIB_NODE_TYPE_PROCESS)
440 uword log2_n_stack_bytes;
/* The stack is never smaller than VLIB_PROCESS_LOG2_STACK_SIZE nor
 * smaller than one page (both are log2 values). */
442 log2_n_stack_bytes = clib_max (r->process_log2_n_stack_bytes,
443 VLIB_PROCESS_LOG2_STACK_SIZE);
444 log2_n_stack_bytes = clib_max (log2_n_stack_bytes,
445 clib_mem_get_log2_page_size ());
447 p = clib_mem_alloc_aligned (sizeof (p[0]), CLIB_CACHE_LINE_BYTES);
448 clib_memset (p, 0, sizeof (p[0]));
449 p->log2_n_stack_bytes = log2_n_stack_bytes;
451 p->stack = clib_mem_vm_map_stack (1ULL << log2_n_stack_bytes,
452 CLIB_MEM_PAGE_SZ_DEFAULT,
454 format_vlib_node_name, vm,
/* NOTE(review): the panic message below uses %d while its argument is
 * an unsigned long long expression -- confirm the format routine
 * accepts that width. */
457 if (p->stack == CLIB_MEM_VM_MAP_FAILED)
458 clib_panic ("failed to allocate process stack (%d bytes)",
459 1ULL << log2_n_stack_bytes);
461 /* Process node's runtime index is really index into process
463 n->runtime_index = vec_len (nm->processes);
465 vec_add1 (nm->processes, p);
467 /* Paint first stack word with magic number so we can at least
468 detect process stack overruns. */
469 p->stack[0] = VLIB_PROCESS_STACK_MAGIC;
471 /* Node runtime is stored inside of process. */
472 rt = &p->node_runtime;
/* Non-process path visible here: the runtime lives in the per-type
 * vector and the runtime index is its position in that vector. */
476 vec_add2_aligned (nm->nodes_by_type[n->type], rt, 1,
477 /* align */ CLIB_CACHE_LINE_BYTES);
478 if (n->type == VLIB_NODE_TYPE_INPUT)
479 clib_interrupt_resize (&nm->interrupts,
480 vec_len (nm->nodes_by_type[n->type]));
481 n->runtime_index = rt - nm->nodes_by_type[n->type];
484 if (n->type == VLIB_NODE_TYPE_INPUT)
485 nm->input_node_counts_by_state[n->state] += 1;
487 rt->function = n->function;
488 rt->flags = n->flags;
489 rt->state = n->state;
490 rt->node_index = n->index;
/* Reserve this node's next frames at the end of nm->next_frames. */
492 rt->n_next_nodes = r->n_next_nodes;
493 rt->next_frame_index = vec_len (nm->next_frames);
495 vec_resize (nm->next_frames, rt->n_next_nodes);
496 for (i = 0; i < rt->n_next_nodes; i++)
497 vlib_next_frame_init (nm->next_frames + rt->next_frame_index + i);
/* Error i of this node maps to n->error_heap_index + i. */
499 vec_resize (rt->errors, r->n_errors);
500 for (i = 0; i < vec_len (rt->errors); i++)
501 rt->errors[i] = n->error_heap_index + i;
503 STATIC_ASSERT_SIZEOF (vlib_node_runtime_t, 128);
504 ASSERT (vec_len (n->runtime_data) <= VLIB_NODE_RUNTIME_DATA_SIZE);
/* Runtime data is copied into the runtime and the node's own copy is
 * freed afterwards. */
506 if (vec_len (n->runtime_data) > 0)
507 clib_memcpy (rt->runtime_data, n->runtime_data,
508 vec_len (n->runtime_data));
510 clib_memset (rt->runtime_data, 0, VLIB_NODE_RUNTIME_DATA_SIZE);
512 vec_free (n->runtime_data);
517 /* Register new packet processing node. */
/* Forwards the registration to register_node ().
 * NOTE(review): the return type and any return statement are not
 * visible in this excerpt. */
519 vlib_register_node (vlib_main_t * vm, vlib_node_registration_t * r)
521 register_node (vm, r);
/* Node function that discards every buffer handed to it.
 *
 * Adds frame->n_vectors to counter index 0 of this node (presumably the
 * "blackholed packets" error string registered for the null node),
 * frees the buffers referenced by the frame's vector arguments, and then
 * frees the frame itself.
 *
 * NOTE(review): the return type and return value are not visible in
 * this excerpt. */
526 null_node_fn (vlib_main_t * vm,
527 vlib_node_runtime_t * node, vlib_frame_t * frame)
529 u16 n_vectors = frame->n_vectors;
531 vlib_node_increment_counter (vm, node->node_index, 0, n_vectors);
532 vlib_buffer_free (vm, vlib_frame_vector_args (frame), n_vectors);
533 vlib_frame_free (vm, node, frame);
/* Build nm->variants and the suffix lookup hash for function variants.
 *
 * The default march variant is reset to ~0 and nm->variants is asserted
 * to be empty.  The first entry added has desc and suffix "default" and
 * index CLIB_MARCH_VARIANT_TYPE.  The macro lines that follow add one
 * entry per variant expanded by foreach_march_variant, with index
 * CLIB_MARCH_VARIANT_TYPE_<s> and priority clib_cpu_march_priority_<s> ().
 * Each entry's index is then asserted to equal its position in the
 * vector and its suffix is mapped to that index in
 * nm->node_fn_march_variant_by_suffix.
 *
 * NOTE(review): the macro header, the remaining per-variant field
 * assignments, the declaration of `prio`, and what happens when a
 * variant's priority exceeds `prio` are not visible in this excerpt. */
539 vlib_register_all_node_march_variants (vlib_main_t *vm)
541 vlib_node_main_t *nm = &vm->node_main;
542 vlib_node_fn_variant_t *v;
545 nm->node_fn_default_march_variant = ~0;
546 ASSERT (nm->variants == 0);
547 vec_add2 (nm->variants, v, 1);
548 v->desc = v->suffix = "default";
549 v->index = CLIB_MARCH_VARIANT_TYPE;
552 vec_add2 (nm->variants, v, 1); \
554 v->index = CLIB_MARCH_VARIANT_TYPE_##s; \
555 v->priority = clib_cpu_march_priority_##s (); \
558 foreach_march_variant;
/* Hash keyed by suffix string, holding u32 values. */
561 nm->node_fn_march_variant_by_suffix = hash_create_string (0, sizeof (u32));
563 vec_foreach (v, nm->variants)
565 ASSERT (v->index == v - nm->variants);
566 hash_set (nm->node_fn_march_variant_by_suffix, v->suffix, v->index);
567 if (v->priority > prio)
/* Register the built-in null node, then the nodes on the global
 * registration list.
 *
 * The null node is described by a static registration using
 * null_node_fn, a vector size of sizeof (u32) and the single error
 * string "blackholed packets"; it is registered before anything else.
 * Registration then starts from vgm->node_registrations and follows
 * next_registration.
 *
 * NOTE(review): the remaining fields of the null node registration and
 * the loop header are not visible in this excerpt. */
573 vlib_register_all_static_nodes (vlib_main_t * vm)
575 vlib_global_main_t *vgm = vlib_get_global_main ();
576 vlib_node_registration_t *r;
578 static char *null_node_error_strings[] = {
579 "blackholed packets",
582 static vlib_node_registration_t null_node_reg = {
583 .function = null_node_fn,
584 .vector_size = sizeof (u32),
587 .error_strings = null_node_error_strings,
590 /* make sure that node index 0 is not used by
592 register_node (vm, &null_node_reg);
594 r = vgm->node_registrations;
597 register_node (vm, r);
598 r = r->next_registration;
// Collect, per thread, a copy of that thread's vector of node pointers.
//
// *stat_vmsp and *node_dupsp are read on entry and written back on exit.
// When stat_vms is empty it is filled with the vlib_main_t of every
// thread (vlib_get_main_by_index for each of vlib_get_n_threads).  At
// most max_threads of them are processed.  For each one,
// vlib_node_sync_stats is called on its nodes, node_dups[j] is sized to
// vec_len (nm->nodes), and the nm->nodes pointers are copied into it --
// the pointers are copied, not the node structures they refer to.
//
// NOTE(review): the conditions involving include_stats and barrier_sync,
// and the declarations of i, j, n and nodes, are not visible in this
// excerpt.  Presumably stats are synced only when include_stats is set
// and the barrier is taken only when barrier_sync is set -- confirm.
603 vlib_node_get_nodes (vlib_main_t * vm, u32 max_threads, int include_stats,
604 int barrier_sync, vlib_node_t **** node_dupsp,
605 vlib_main_t *** stat_vmsp)
607 vlib_node_main_t *nm = &vm->node_main;
609 vlib_node_t ***node_dups = *node_dupsp;
611 vlib_main_t **stat_vms = *stat_vmsp;
612 vlib_main_t *stat_vm;
614 u32 threads_to_serialize;
// Build the list of per-thread mains only when it is still empty.
616 if (vec_len (stat_vms) == 0)
618 for (i = 0; i < vlib_get_n_threads (); i++)
620 stat_vm = vlib_get_main_by_index (i);
622 vec_add1 (stat_vms, stat_vm);
626 threads_to_serialize = clib_min (max_threads, vec_len (stat_vms));
628 vec_validate (node_dups, threads_to_serialize - 1);
631 * Barrier sync across stats scraping.
632 * Otherwise, the counts will be grossly inaccurate.
635 vlib_worker_thread_barrier_sync (vm);
637 for (j = 0; j < threads_to_serialize; j++)
639 stat_vm = stat_vms[j];
640 nm = &stat_vm->node_main;
644 for (i = 0; i < vec_len (nm->nodes); i++)
647 vlib_node_sync_stats (stat_vm, n);
// Reuse the vector already stored in node_dups[j], growing it as needed.
651 nodes = node_dups[j];
652 vec_validate (nodes, vec_len (nm->nodes) - 1);
653 clib_memcpy (nodes, nm->nodes, vec_len (nm->nodes) * sizeof (nodes[0]));
654 node_dups[j] = nodes;
658 vlib_worker_thread_barrier_release (vm);
660 *node_dupsp = node_dups;
661 *stat_vmsp = stat_vms;
// Finish node graph setup once all nodes are registered.
//
// Visible steps, in order:
//  - nm->frame_sizes is created and VLIB_NODE_MAIN_RUNTIME_STARTED is set
//    in nm->flags;
//  - for each node naming a sibling_of, the sibling is looked up by name
//    (an error is created when it is missing) and sibling bitmaps are
//    cross-linked between the node, the sibling, and the sibling's
//    existing siblings;
//  - each node's next_node_names are resolved through
//    vlib_node_add_named_next_with_slot, a ~0 result producing an
//    "unknown node" error, after which the name vector is freed;
//  - prev_node_bitmap of every valid next node gets the index of the
//    node that points to it;
//  - for internal nodes with next nodes, each next frame's runtime index
//    is asserted and VLIB_FRAME_NO_FREE_AFTER_DISPATCH is propagated
//    from next nodes flagged FRAME_NO_FREE_AFTER_DISPATCH.
//
// NOTE(review): the return type, the error exits, several declarations
// and the conditions that skip nodes are not visible in this excerpt;
// presumably `error` is what gets returned -- confirm.
665 vlib_node_main_init (vlib_main_t * vm)
667 vlib_node_main_t *nm = &vm->node_main;
668 clib_error_t *error = 0;
672 nm->frame_sizes = vec_new (vlib_frame_size_t, 1);
673 #ifdef VLIB_SUPPORTS_ARBITRARY_SCALAR_SIZES
674 nm->frame_size_hash = hash_create (0, sizeof (uword));
676 nm->flags |= VLIB_NODE_MAIN_RUNTIME_STARTED;
678 /* Generate sibling relationships */
680 vlib_node_t *n, *sib;
683 for (ni = 0; ni < vec_len (nm->nodes); ni++)
685 n = vec_elt (nm->nodes, ni);
690 sib = vlib_get_node_by_name (vm, (u8 *) n->sibling_of);
693 error = clib_error_create ("sibling `%s' not found for node `%v'",
694 n->sibling_of, n->name);
699 clib_bitmap_foreach (si, sib->sibling_bitmap) {
700 vlib_node_t * m = vec_elt (nm->nodes, si);
702 /* Connect all of sibling's siblings to us. */
703 m->sibling_bitmap = clib_bitmap_ori (m->sibling_bitmap, n->index);
705 /* Connect us to all of sibling's siblings. */
706 n->sibling_bitmap = clib_bitmap_ori (n->sibling_bitmap, si);
710 /* Connect sibling to us. */
711 sib->sibling_bitmap = clib_bitmap_ori (sib->sibling_bitmap, n->index);
713 /* Connect us to sibling. */
714 n->sibling_bitmap = clib_bitmap_ori (n->sibling_bitmap, sib->index);
718 /* Resolve next names into next indices. */
719 for (ni = 0; ni < vec_len (nm->nodes); ni++)
723 n = vec_elt (nm->nodes, ni);
725 for (i = 0; i < vec_len (n->next_node_names); i++)
727 char *a = n->next_node_names[i];
/* The position of the name in next_node_names is used as the slot. */
732 if (~0 == vlib_node_add_named_next_with_slot (vm, n->index, a, i))
734 error = clib_error_create
735 ("node `%v' refers to unknown node `%s'", n->name, a);
740 vec_free (n->next_node_names);
743 /* Set previous node pointers. */
744 for (ni = 0; ni < vec_len (nm->nodes); ni++)
749 n = vec_elt (nm->nodes, ni);
751 for (i = 0; i < vec_len (n->next_nodes); i++)
/* Next entries that are not a valid node index are tested for here. */
753 if (n->next_nodes[i] >= vec_len (nm->nodes))
756 n_next = vec_elt (nm->nodes, n->next_nodes[i]);
757 n_next->prev_node_bitmap =
758 clib_bitmap_ori (n_next->prev_node_bitmap, n->index);
763 vlib_next_frame_t *nf;
764 vlib_node_runtime_t *r;
768 vec_foreach (r, nm->nodes_by_type[VLIB_NODE_TYPE_INTERNAL])
770 if (r->n_next_nodes == 0)
773 n = vlib_get_node (vm, r->node_index);
774 nf = vec_elt_at_index (nm->next_frames, r->next_frame_index);
776 for (i = 0; i < vec_len (n->next_nodes); i++)
778 next = vlib_get_node (vm, n->next_nodes[i]);
780 /* Validate node runtime indices are correctly initialized. */
781 ASSERT (nf[i].node_runtime_index == next->runtime_index);
784 if (next->flags & VLIB_NODE_FLAG_FRAME_NO_FREE_AFTER_DISPATCH)
785 nf[i].flags |= VLIB_FRAME_NO_FREE_AFTER_DISPATCH;
/* Create, register and start a process node at run time.
 *
 * A zeroed registration is filled with a formatted copy of `name`, the
 * requested log2 stack size and type VLIB_NODE_TYPE_PROCESS.  The node
 * is registered between worker barrier sync and release, with a worker
 * node runtime update issued before the release.  The process is then
 * started using the new node's runtime_index.
 *
 * NOTE(review): the assignment of `f` into the registration, the
 * declaration of `n`, and the return are not visible in this excerpt. */
795 vlib_process_create (vlib_main_t * vm, char *name,
796 vlib_node_function_t * f, u32 log2_n_stack_bytes)
798 vlib_node_registration_t r;
801 memset (&r, 0, sizeof (r));
/* NOTE(review): the format string has a single %s, so the trailing 0
 * argument looks unused; other calls in this file pair a trailing 0
 * with "%c" -- confirm which was intended. */
803 r.name = (char *) format (0, "%s", name, 0);
805 r.process_log2_n_stack_bytes = log2_n_stack_bytes;
806 r.type = VLIB_NODE_TYPE_PROCESS;
808 vlib_worker_thread_barrier_sync (vm);
810 vlib_register_node (vm, &r);
813 vlib_worker_thread_node_runtime_update ();
814 vlib_worker_thread_barrier_release (vm);
/* register_node () saved the new node's index in r.index. */
816 n = vlib_get_node (vm, r.index);
817 vlib_start_process (vm, n->runtime_index);
/* Switch node `node_index` to the function registered for
 * `march_variant`.
 *
 * The node's function registrations are walked; for the entry whose
 * march_variant equals the index of the requested variant (looked up in
 * vm->node_main.variants), n->function is replaced and the function
 * pointer in the node runtime of every thread is updated as well.
 *
 * NOTE(review): the return type, the value returned when the node has
 * no function registrations or no entry matches, the loop header, and
 * the assignment of `nrt` are not visible in this excerpt. */
823 vlib_node_set_march_variant (vlib_main_t *vm, u32 node_index,
824 clib_march_variant_type_t march_variant)
826 vlib_node_fn_registration_t *fnr;
827 vlib_node_fn_variant_t *v;
828 vlib_node_t *n = vlib_get_node (vm, node_index);
830 if (n->node_fn_registrations == 0)
833 fnr = n->node_fn_registrations;
834 v = vec_elt_at_index (vm->node_main.variants, march_variant);
838 if (fnr->march_variant == v->index)
840 n->function = fnr->function;
/* Each thread has its own runtime for the node, so each is updated. */
842 for (int i = 0; i < vlib_get_n_threads (); i++)
844 vlib_node_runtime_t *nrt;
846 vlib_node_get_runtime (vlib_get_main_by_index (i), n->index);
847 nrt->function = fnr->function;
851 fnr = fnr->next_registration;
856 * fd.io coding-style-patch-verification: ON
859 * eval: (c-set-style "gnu")