2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vlib/vlib.h>
17 #include <vnet/l2/feat_bitmap.h>
18 #include <vnet/l2/l2_rw.h>
22 * @brief Layer 2 Rewrite.
24 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
25 * the provisioned mask and value, modifies the packet header.
/* Single definition of the module-wide Layer 2 rewrite state; it is compiled
 * only when CLIB_MARCH_VARIANT is not defined. */
29 #ifndef CLIB_MARCH_VARIANT
30 l2_rw_main_t l2_rw_main;
31 #endif /* CLIB_MARCH_VARIANT */
/* NOTE(review): presumably members of l2_rw_trace_t (the struct header is not
 * visible in this view); format_l2_rw_trace reads fields with these names. */
/* Classify table index; format_l2_rw_trace prints a field of this name as "table". */
36 u32 classify_table_index;
/* Rewrite entry index; format_l2_rw_trace prints a field of this name as "entry". */
37 u32 rewrite_entry_index;
/*
 * Format callback for one rewrite entry.
 *
 * Takes an l2_rw_entry_t pointer from the argument list and appends to s the
 * entry's mask and value as hex bytes, followed by its hit counter and its
 * skip length.
 *
 * NOTE(review): several lines of this function (return type, braces, the
 * argument consumed by the leading %d, the final return) are not visible in
 * this view -- confirm against the complete file before editing.
 */
41 format_l2_rw_entry (u8 * s, va_list * args)
43 l2_rw_entry_t *e = va_arg (*args, l2_rw_entry_t *);
44 l2_rw_main_t *rw = &l2_rw_main;
/* Mask and value are each dumped over rewrite_n_vectors * sizeof (u32x4) bytes. */
45 s = format (s, "%d - mask:%U value:%U\n",
47 format_hex_bytes, e->mask,
48 e->rewrite_n_vectors * sizeof (u32x4), format_hex_bytes,
49 e->value, e->rewrite_n_vectors * sizeof (u32x4));
/* skip_bytes is skip_n_vectors converted from u32x4 units to bytes.
 * NOTE(review): that product involves sizeof and is printed with %d --
 * confirm the argument width matches what format () expects for %d. */
51 format (s, " hits:%d skip_bytes:%d", e->hit_count,
52 e->skip_n_vectors * sizeof (u32x4));
/*
 * Format callback for a per-interface rewrite configuration.
 *
 * Takes an l2_rw_config_t pointer from the argument list and returns s with
 * the configuration's table_index and miss_index appended.
 */
57 format_l2_rw_config (u8 * s, va_list * args)
59 l2_rw_config_t *c = va_arg (*args, l2_rw_config_t *);
60 return format (s, "table-index:%d miss-index:%d",
61 c->table_index, c->miss_index);
64 /* Packet trace format function: prints the sw_if_index, classify table index and rewrite entry index stored in an l2_rw_trace_t. */
66 format_l2_rw_trace (u8 * s, va_list * args)
/* The vm and node arguments are pulled from the va_list but marked unused. */
68 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
69 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
/* Third argument is the trace record itself. */
70 l2_rw_trace_t *t = va_arg (*args, l2_rw_trace_t *);
71 return format (s, "l2-rw: sw_if_index %d, table %d, entry %d",
72 t->sw_if_index, t->classify_table_index,
73 t->rewrite_entry_index);
/*
 * Return a pointer to the rewrite configuration slot of sw_if_index.
 *
 * When the interface's bit is not set in rw->configs_bitmap, vec_validate is
 * called on rw->configs for that index, table_index and miss_index of the
 * slot are both set to ~0, and clib_bitmap_set is invoked for the bit.
 *
 * NOTE(review): braces and one line just before the clib_bitmap_set call are
 * not visible in this view, so the exact extent of the first-use branch and
 * whether the clib_bitmap_set result is stored cannot be confirmed from here.
 */
76 always_inline l2_rw_config_t *
77 l2_rw_get_config (u32 sw_if_index)
79 l2_rw_main_t *rw = &l2_rw_main;
/* First-use path is hinted as unlikely. */
80 if (PREDICT_FALSE (!clib_bitmap_get (rw->configs_bitmap, sw_if_index)))
82 vec_validate (rw->configs, sw_if_index);
/* ~0 is the "unset" value tested elsewhere in this file for both indices. */
83 rw->configs[sw_if_index].table_index = ~0;
84 rw->configs[sw_if_index].miss_index = ~0;
86 clib_bitmap_set (rw->configs_bitmap, sw_if_index, 1);
88 return &rw->configs[sw_if_index];
/*
 * Apply rewrite entry rwe to the header bytes at h.
 *
 * Every rewritten chunk is computed as (data & ~mask) | value. Two code paths
 * are visible: one working on u32x4 chunks when U32X4_ALIGNED (h) holds, and
 * one working on u64 words. In both, the starting position is offset by
 * rwe->skip_n_vectors (times two for the u64 path, i.e. two u64 words per
 * u32x4) and the number of chunks is selected by a switch on
 * rwe->rewrite_n_vectors.
 *
 * NOTE(review): the case labels, the `else`, and the assignment targets of the
 * u64 expressions are not visible in this view. The indices run from highest
 * to lowest, which presumably relies on case fall-through -- confirm.
 */
91 static_always_inline void
92 l2_rw_rewrite (l2_rw_entry_t * rwe, u8 * h)
94 if (U32X4_ALIGNED (h))
/* Vector path: d points skip_n_vectors u32x4 chunks past h. */
96 u32x4 *d = ((u32x4 *) h) + rwe->skip_n_vectors;
97 switch (rwe->rewrite_n_vectors)
100 d[4] = (d[4] & ~rwe->mask[4]) | rwe->value[4];
103 d[3] = (d[3] & ~rwe->mask[3]) | rwe->value[3];
106 d[2] = (d[2] & ~rwe->mask[2]) | rwe->value[2];
109 d[1] = (d[1] & ~rwe->mask[1]) | rwe->value[1];
112 d[0] = (d[0] & ~rwe->mask[0]) | rwe->value[0];
/* Scalar path: same operation on u64 words; mask and value are reinterpreted
 * as u64 arrays, so vector k corresponds to words 2k and 2k+1. */
120 u64 *d = ((u64 *) h) + rwe->skip_n_vectors * 2;
121 switch (rwe->rewrite_n_vectors)
125 (d[8] & ~(((u64 *) rwe->mask)[8])) | (((u64 *) rwe->value)[8]);
127 (d[9] & ~(((u64 *) rwe->mask)[9])) | (((u64 *) rwe->value)[9]);
131 (d[6] & ~(((u64 *) rwe->mask)[6])) | (((u64 *) rwe->value)[6]);
133 (d[7] & ~(((u64 *) rwe->mask)[7])) | (((u64 *) rwe->value)[7]);
137 (d[4] & ~(((u64 *) rwe->mask)[4])) | (((u64 *) rwe->value)[4]);
139 (d[5] & ~(((u64 *) rwe->mask)[5])) | (((u64 *) rwe->value)[5]);
143 (d[2] & ~(((u64 *) rwe->mask)[2])) | (((u64 *) rwe->value)[2]);
145 (d[3] & ~(((u64 *) rwe->mask)[3])) | (((u64 *) rwe->value)[3]);
149 (d[0] & ~(((u64 *) rwe->mask)[0])) | (((u64 *) rwe->value)[0]);
151 (d[1] & ~(((u64 *) rwe->mask)[1])) | (((u64 *) rwe->value)[1]);
/*
 * Node function of l2_rw_node.
 *
 * For every buffer of the incoming frame:
 *  - fetch the rewrite configuration of the buffer's RX sw_if_index;
 *  - hash the current header against the configured classify table and look
 *    up an entry, following next_table_index while no entry is found and the
 *    chain is not terminated by ~0;
 *  - take the rewrite entry index from the matching entry's opaque_index, or
 *    from the configuration's miss_index when nothing matched;
 *  - apply the rewrite unless that index is ~0;
 *  - record a trace when the buffer is traced;
 *  - obtain the next index from vnet_l2_feature_next and enqueue.
 *
 * Buffers are handled two at a time while at least six remain in the frame
 * (the extra four are only read for prefetching), then one at a time.
 * Returns frame->n_vectors.
 *
 * NOTE(review): many short lines (braces, some declarations, the from /
 * to_next bookkeeping, trailing call arguments) are not visible in this view.
 * NOTE(review): config->table_index is passed to pool_elt_at_index without a
 * visible check against ~0, although l2_rw_get_config initialises it to ~0
 * for an interface seen for the first time -- confirm that a table is always
 * configured before this node runs on an interface.
 */
159 VLIB_NODE_FN (l2_rw_node) (vlib_main_t * vm,
160 vlib_node_runtime_t * node, vlib_frame_t * frame)
162 l2_rw_main_t *rw = &l2_rw_main;
163 u32 n_left_from, *from, *to_next, next_index;
164 vnet_classify_main_t *vcm = &vnet_classify_main;
/* One timestamp per frame, handed to every classify lookup below. */
165 f64 now = vlib_time_now (vlib_get_main ());
167 from = vlib_frame_vector_args (frame);
168 n_left_from = frame->n_vectors; /* number of packets to process */
169 next_index = node->cached_next_index;
171 while (n_left_from > 0)
175 /* get space to enqueue frame to graph node "next_index" */
176 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
/* Dual loop: two buffers per iteration; needs six because from[2]..from[5]
 * are dereferenced for prefetching. */
178 while (n_left_from >= 6 && n_left_to_next >= 2)
180 u32 bi0, next0, sw_if_index0, rwe_index0;
181 u32 bi1, next1, sw_if_index1, rwe_index1;
182 vlib_buffer_t *b0, *b1;
183 ethernet_header_t *h0, *h1;
184 l2_rw_config_t *config0, *config1;
186 vnet_classify_table_t *t0, *t1;
187 vnet_classify_entry_t *e0, *e1;
188 l2_rw_entry_t *rwe0, *rwe1;
/* Prefetch headers of the buffers two iterations ahead and data of the
 * buffers one iteration ahead. */
191 vlib_buffer_t *p2, *p3, *p4, *p5;
192 p2 = vlib_get_buffer (vm, from[2]);
193 p3 = vlib_get_buffer (vm, from[3]);
194 p4 = vlib_get_buffer (vm, from[4]);
195 p5 = vlib_get_buffer (vm, from[5]);
197 vlib_prefetch_buffer_header (p4, LOAD);
198 vlib_prefetch_buffer_header (p5, LOAD);
199 vlib_prefetch_buffer_data (p2, LOAD);
200 vlib_prefetch_buffer_data (p3, LOAD);
212 b0 = vlib_get_buffer (vm, bi0);
213 b1 = vlib_get_buffer (vm, bi1);
/* The current data pointer of each buffer is treated as an Ethernet header. */
214 h0 = vlib_buffer_get_current (b0);
215 h1 = vlib_buffer_get_current (b1);
217 sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX];
218 sw_if_index1 = vnet_buffer (b1)->sw_if_index[VLIB_RX];
219 config0 = l2_rw_get_config (sw_if_index0); /* TODO: check sw_if_index0 value */
220 config1 = l2_rw_get_config (sw_if_index1); /* TODO: check sw_if_index1 value */
221 t0 = pool_elt_at_index (vcm->tables, config0->table_index);
222 t1 = pool_elt_at_index (vcm->tables, config1->table_index);
224 hash0 = vnet_classify_hash_packet (t0, (u8 *) h0);
225 hash1 = vnet_classify_hash_packet (t1, (u8 *) h1);
226 e0 = vnet_classify_find_entry (t0, (u8 *) h0, hash0, now);
227 e1 = vnet_classify_find_entry (t1, (u8 *) h1, hash1, now);
/* No match: walk the chain of tables until an entry is found or the chain
 * ends (next_table_index == ~0). */
229 while (!e0 && (t0->next_table_index != ~0))
231 t0 = pool_elt_at_index (vcm->tables, t0->next_table_index);
232 hash0 = vnet_classify_hash_packet (t0, (u8 *) h0);
233 e0 = vnet_classify_find_entry (t0, (u8 *) h0, hash0, now);
236 while (!e1 && (t1->next_table_index != ~0))
238 t1 = pool_elt_at_index (vcm->tables, t1->next_table_index);
239 hash1 = vnet_classify_hash_packet (t1, (u8 *) h1);
240 e1 = vnet_classify_find_entry (t1, (u8 *) h1, hash1, now);
/* A matching entry supplies the rewrite index through opaque_index;
 * otherwise the per-interface miss_index is used. */
243 rwe_index0 = e0 ? e0->opaque_index : config0->miss_index;
244 rwe_index1 = e1 ? e1->opaque_index : config1->miss_index;
/* ~0 means "no rewrite": the packet is left untouched. */
246 if (rwe_index0 != ~0)
248 rwe0 = pool_elt_at_index (rw->entries, rwe_index0);
249 l2_rw_rewrite (rwe0, (u8 *) h0);
251 if (rwe_index1 != ~0)
253 rwe1 = pool_elt_at_index (rw->entries, rwe_index1);
254 l2_rw_rewrite (rwe1, (u8 *) h1);
/* The trace records the interface's configured table index (not the table
 * reached through the chain) and the rewrite entry index that was chosen. */
257 if (PREDICT_FALSE ((b0->flags & VLIB_BUFFER_IS_TRACED)))
259 l2_rw_trace_t *t = vlib_add_trace (vm, node, b0, sizeof (*t));
260 t->sw_if_index = sw_if_index0;
261 t->classify_table_index = config0->table_index;
262 t->rewrite_entry_index = rwe_index0;
265 if (PREDICT_FALSE ((b1->flags & VLIB_BUFFER_IS_TRACED)))
267 l2_rw_trace_t *t = vlib_add_trace (vm, node, b1, sizeof (*t));
268 t->sw_if_index = sw_if_index1;
269 t->classify_table_index = config1->table_index;
270 t->rewrite_entry_index = rwe_index1;
273 /* Update feature bitmap and get next feature index */
274 next0 = vnet_l2_feature_next (b0, rw->feat_next_node_index,
276 next1 = vnet_l2_feature_next (b1, rw->feat_next_node_index,
279 vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
280 to_next, n_left_to_next,
281 bi0, bi1, next0, next1);
/* Single loop: same steps as above for one buffer at a time. */
284 while (n_left_from > 0 && n_left_to_next > 0)
286 u32 bi0, next0, sw_if_index0, rwe_index0;
288 ethernet_header_t *h0;
289 l2_rw_config_t *config0;
291 vnet_classify_table_t *t0;
292 vnet_classify_entry_t *e0;
302 b0 = vlib_get_buffer (vm, bi0);
303 h0 = vlib_buffer_get_current (b0);
305 sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX];
306 config0 = l2_rw_get_config (sw_if_index0); /* TODO: check sw_if_index0 value */
307 t0 = pool_elt_at_index (vcm->tables, config0->table_index);
309 hash0 = vnet_classify_hash_packet (t0, (u8 *) h0);
310 e0 = vnet_classify_find_entry (t0, (u8 *) h0, hash0, now);
312 while (!e0 && (t0->next_table_index != ~0))
314 t0 = pool_elt_at_index (vcm->tables, t0->next_table_index);
315 hash0 = vnet_classify_hash_packet (t0, (u8 *) h0);
316 e0 = vnet_classify_find_entry (t0, (u8 *) h0, hash0, now);
319 rwe_index0 = e0 ? e0->opaque_index : config0->miss_index;
321 if (rwe_index0 != ~0)
323 rwe0 = pool_elt_at_index (rw->entries, rwe_index0);
324 l2_rw_rewrite (rwe0, (u8 *) h0);
327 if (PREDICT_FALSE ((b0->flags & VLIB_BUFFER_IS_TRACED)))
329 l2_rw_trace_t *t = vlib_add_trace (vm, node, b0, sizeof (*t));
330 t->sw_if_index = sw_if_index0;
331 t->classify_table_index = config0->table_index;
332 t->rewrite_entry_index = rwe_index0;
335 /* Update feature bitmap and get next feature index */
336 next0 = vnet_l2_feature_next (b0, rw->feat_next_node_index,
339 vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
340 to_next, n_left_to_next,
343 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
346 return frame->n_vectors;
349 #ifndef CLIB_MARCH_VARIANT
/*
 * Create, update or delete a rewrite entry in rw->entries.
 *
 * index   in/out entry index; an existing entry is fetched with
 *         pool_elt_at_index after a pool_is_free_index check, a new entry is
 *         taken with pool_get and its index is written back through *index
 * mask    bytes selecting which packet bits are replaced (len bytes)
 * value   replacement bytes (len bytes)
 * len     number of bytes in mask and value
 * skip    byte offset into the header at which the rewrite starts
 * is_del  delete request (pool_put is the only visible release call)
 *
 * The byte offset is split into whole u32x4 vectors (skip_n_vectors) and a
 * remainder; rewrite_n_vectors is the number of u32x4 vectors needed to cover
 * remainder + len bytes. mask and value are zero-filled, the caller's bytes
 * are copied in at the remainder offset, and value is pre-masked so the data
 * path can OR it in directly.
 *
 * NOTE(review): the conditions selecting the lookup / allocate / delete paths
 * and all return statements are not visible in this view.
 * NOTE(review): with skip and len both u32, len == 0 and a zero remainder make
 * (skip + len - 1) wrap around -- confirm callers never pass len == 0.
 * NOTE(review): no release of e->mask / e->value is visible next to pool_put
 * -- confirm the vectors are not leaked or reused stale on delete.
 */
351 l2_rw_mod_entry (u32 * index,
352 u8 * mask, u8 * value, u32 len, u32 skip, u8 is_del)
354 l2_rw_main_t *rw = &l2_rw_main;
355 l2_rw_entry_t *e = 0;
358 if (pool_is_free_index (rw->entries, *index))
362 e = pool_elt_at_index (rw->entries, *index);
366 pool_get (rw->entries, e);
367 *index = e - rw->entries;
375 pool_put (rw->entries, e);
/* Whole vectors to skip, then keep only the sub-vector remainder in skip. */
379 e->skip_n_vectors = skip / sizeof (u32x4);
380 skip -= e->skip_n_vectors * sizeof (u32x4);
/* Round (remainder + len) bytes up to a whole number of u32x4 vectors. */
381 e->rewrite_n_vectors = (skip + len - 1) / sizeof (u32x4) + 1;
382 vec_alloc_aligned (e->mask, e->rewrite_n_vectors, sizeof (u32x4));
383 clib_memset (e->mask, 0, e->rewrite_n_vectors * sizeof (u32x4));
384 vec_alloc_aligned (e->value, e->rewrite_n_vectors, sizeof (u32x4));
385 clib_memset (e->value, 0, e->rewrite_n_vectors * sizeof (u32x4));
/* Place the caller's bytes at the remainder offset inside the zeroed vectors. */
387 clib_memcpy (((u8 *) e->value) + skip, value, len);
388 clib_memcpy (((u8 *) e->mask) + skip, mask, len);
/* Clear value bits outside the mask so l2_rw_rewrite's OR cannot touch them. */
391 for (i = 0; i < e->rewrite_n_vectors; i++)
393 e->value[i] &= e->mask[i];
398 #endif /* CLIB_MARCH_VARIANT */
/*
 * CLI handler for "l2 rewrite entry".
 *
 * Accepts, in any order: "index <n>", "mask <hex>", "value <hex>",
 * "skip <n>" and "del". The mask and value hex strings must have the same
 * length; the request is then forwarded to l2_rw_mod_entry with
 * vec_len (mask) as the byte length.
 *
 * Returns a clib error for an unspecified mask or value, for mismatching
 * lengths, or when l2_rw_mod_entry reports failure.
 *
 * NOTE(review): local declarations, the branch bodies of the parse loop, the
 * condition guarding "Unspecified mask or value" and the final return are not
 * visible in this view. No release of the mask / value vectors is visible
 * either -- confirm they are freed.
 */
400 static clib_error_t *
401 l2_rw_entry_cli_fn (vlib_main_t * vm,
402 unformat_input_t * input, vlib_cli_command_t * cmd)
410 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
412 if (unformat (input, "index %d", &index))
414 else if (unformat (input, "mask %U", unformat_hex_string, &mask))
416 else if (unformat (input, "value %U", unformat_hex_string, &value))
418 else if (unformat (input, "skip %d", &skip))
420 else if (unformat (input, "del"))
427 return clib_error_return (0, "Unspecified mask or value");
/* mask and value are applied byte-for-byte, so their lengths must agree. */
429 if (vec_len (mask) != vec_len (value))
430 return clib_error_return (0, "Mask and value lengths must be identical");
434 l2_rw_mod_entry (&index, mask, value, vec_len (mask), skip, del)))
435 return clib_error_return (0, "Could not add entry");
441 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
442 * the provisioned mask and value, modifies the packet header.
445 * @todo This is incomplete. This needs a detailed description and a
/* Registers the "l2 rewrite entry" CLI command, handled by l2_rw_entry_cli_fn. */
449 VLIB_CLI_COMMAND (l2_rw_entry_cli, static) = {
450 .path = "l2 rewrite entry",
/* Usage string (presumably the value of a field whose designator line is not
 * visible in this view). */
452 "l2 rewrite entry [index <index>] [mask <hex-mask>] [value <hex-value>] [skip <n_bytes>] [del]",
453 .function = l2_rw_entry_cli_fn,
457 #ifndef CLIB_MARCH_VARIANT
/*
 * Attach a classify table and a miss entry to an interface, or detach them.
 *
 * sw_if_index  interface to configure
 * table_index  classify table index; ~0 disables the rewrite feature on the
 *              interface and clears its bit in rw->configs_bitmap
 * miss_index   rewrite entry index stored as the configuration's miss_index
 *
 * NOTE(review): the return type and return statement are not visible in this
 * view; the CLI caller treats a non-zero result as an error.
 */
459 l2_rw_interface_set_table (u32 sw_if_index, u32 table_index, u32 miss_index)
/* Fetches the configuration slot through l2_rw_get_config. */
461 l2_rw_config_t *c = l2_rw_get_config (sw_if_index);
462 l2_rw_main_t *rw = &l2_rw_main;
464 c->table_index = table_index;
465 c->miss_index = miss_index;
/* L2INPUT_FEAT_RW is switched on only when a table is supplied. */
466 u32 feature_bitmap = (table_index == ~0) ? 0 : L2INPUT_FEAT_RW;
468 l2input_intf_bitmap_enable (sw_if_index, L2INPUT_FEAT_RW, feature_bitmap);
/* Without a table the interface is dropped from the set of configured ones. */
470 if (c->table_index == ~0)
471 clib_bitmap_set (rw->configs_bitmap, sw_if_index, 0);
475 #endif /* CLIB_MARCH_VARIANT */
/*
 * CLI handler for "set interface l2 rewrite".
 *
 * Parses an interface first, then any of "table <n>" and "miss-index <n>",
 * and forwards the result to l2_rw_interface_set_table. table_index keeps its
 * initial value ~0 when no table is given.
 *
 * Returns a clib error when no interface was parsed or when
 * l2_rw_interface_set_table returns non-zero.
 *
 * NOTE(review): the declaration of miss_index, the parse-loop branch bodies
 * and the final lines of the function are not visible in this view.
 */
477 static clib_error_t *
478 l2_rw_interface_cli_fn (vlib_main_t * vm,
479 unformat_input_t * input, vlib_cli_command_t * cmd)
481 vnet_main_t *vnm = vnet_get_main ();
482 u32 table_index = ~0;
483 u32 sw_if_index = ~0;
/* The interface is expected as the first token, without a keyword. */
486 if (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
488 unformat (input, "%U", unformat_vnet_sw_interface, vnm, &sw_if_index);
491 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
493 if (unformat (input, "table %d", &table_index))
495 else if (unformat (input, "miss-index %d", &miss_index))
/* NOTE(review): the message below contains no conversion specifier, yet
 * format_unformat_error and input are passed as extra arguments; it also
 * mentions an 'iface' keyword that the parser above does not use -- confirm
 * the intended wording and arguments. */
501 if (sw_if_index == ~0)
502 return clib_error_return (0,
503 "You must specify an interface 'iface <interface>'",
504 format_unformat_error, input);
507 l2_rw_interface_set_table (sw_if_index, table_index, miss_index)))
508 return clib_error_return (0, "l2_rw_interface_set_table returned %d",
515 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
516 * the provisioned mask and value, modifies the packet header.
519 * @todo This is incomplete. This needs a detailed description and a
/* Registers the "set interface l2 rewrite" CLI command, handled by
 * l2_rw_interface_cli_fn. */
523 VLIB_CLI_COMMAND (l2_rw_interface_cli, static) = {
524 .path = "set interface l2 rewrite",
/* Usage string (presumably the value of a field whose designator line is not
 * visible in this view). */
526 "set interface l2 rewrite <interface> [table <table index>] [miss-index <entry-index>]",
527 .function = l2_rw_interface_cli_fn,
/*
 * CLI handler for "show l2 rewrite interfaces".
 *
 * Prints a notice when no bit is set in rw->configs_bitmap; the visible loop
 * prints, for each set bit, the sw_if_index followed by the configuration
 * formatted by format_l2_rw_config.
 *
 * NOTE(review): the declaration of i, the closing of the foreach body and the
 * return statement are not visible in this view.
 */
531 static clib_error_t *
532 l2_rw_show_interfaces_cli_fn (vlib_main_t * vm,
533 unformat_input_t * input,
534 vlib_cli_command_t * cmd)
536 l2_rw_main_t *rw = &l2_rw_main;
537 if (clib_bitmap_count_set_bits (rw->configs_bitmap) == 0)
538 vlib_cli_output (vm, "No interface is currently using l2 rewrite\n");
/* Set bits of configs_bitmap index directly into rw->configs. */
542 clib_bitmap_foreach(i, rw->configs_bitmap, {
543 vlib_cli_output (vm, "sw_if_index:%d %U\n", i, format_l2_rw_config, &rw->configs[i]);
550 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
551 * the provisioned mask and value, modifies the packet header.
554 * @todo This is incomplete. This needs a detailed description and a
/* Registers the "show l2 rewrite interfaces" CLI command, handled by
 * l2_rw_show_interfaces_cli_fn. */
558 VLIB_CLI_COMMAND (l2_rw_show_interfaces_cli, static) = {
559 .path = "show l2 rewrite interfaces",
/* Usage string (presumably the value of a field whose designator line is not
 * visible in this view). */
561 "show l2 rewrite interfaces",
562 .function = l2_rw_show_interfaces_cli_fn,
/*
 * CLI handler for "show l2 rewrite entries".
 *
 * Prints "No entries" when the rw->entries pool is empty; the visible loop
 * prints each pool element through format_l2_rw_entry.
 *
 * NOTE(review): the declaration of e, the closing of the foreach body and the
 * return statement are not visible in this view.
 */
566 static clib_error_t *
567 l2_rw_show_entries_cli_fn (vlib_main_t * vm,
568 unformat_input_t * input, vlib_cli_command_t * cmd)
570 l2_rw_main_t *rw = &l2_rw_main;
572 if (pool_elts (rw->entries) == 0)
573 vlib_cli_output (vm, "No entries\n");
576 pool_foreach(e, rw->entries, {
577 vlib_cli_output (vm, "%U\n", format_l2_rw_entry, e);
584 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
585 * the provisioned mask and value, modifies the packet header.
588 * @todo This is incomplete. This needs a detailed description and a
/* Registers the "show l2 rewrite entries" CLI command, handled by
 * l2_rw_show_entries_cli_fn. */
592 VLIB_CLI_COMMAND (l2_rw_show_entries_cli, static) = {
593 .path = "show l2 rewrite entries",
/* Usage string (presumably the value of a field whose designator line is not
 * visible in this view). */
595 "show l2 rewrite entries",
596 .function = l2_rw_show_entries_cli_fn,
/*
 * Enable or disable the L2INPUT_FEAT_RW feature on a bridge domain.
 *
 * bridge_domain  bridge domain passed to l2input_set_bridge_features
 * disable        non-zero clears the feature bit, zero sets it
 *
 * NOTE(review): the return type and return statement are not visible in this
 * view; the CLI caller treats a non-zero result as failure.
 */
601 l2_rw_enable_disable (u32 bridge_domain, u8 disable)
603 u32 mask = L2INPUT_FEAT_RW;
/* mask selects the bit to change; the third argument is its new value. */
604 l2input_set_bridge_features (bridge_domain, mask, disable ? 0 : mask);
/*
 * CLI handler for "set bridge-domain rewrite".
 *
 * Requires a numeric bridge domain as the first token and accepts an optional
 * "disable" keyword, then calls l2_rw_enable_disable.
 *
 * Returns a clib error when the bridge domain is missing or when
 * l2_rw_enable_disable returns non-zero.
 *
 * NOTE(review): local declarations, the body of the "disable" branch and the
 * final return are not visible in this view.
 */
608 static clib_error_t *
609 l2_rw_set_cli_fn (vlib_main_t * vm,
610 unformat_input_t * input, vlib_cli_command_t * cmd)
/* Empty input and a non-numeric first token are rejected the same way. */
615 if (unformat_check_input (input) == UNFORMAT_END_OF_INPUT ||
616 !unformat (input, "%d", &bridge_domain))
618 return clib_error_return (0, "You must specify a bridge domain");
621 if (unformat_check_input (input) != UNFORMAT_END_OF_INPUT &&
622 unformat (input, "disable"))
627 if (l2_rw_enable_disable (bridge_domain, disable))
628 return clib_error_return (0, "Could not enable or disable rewrite");
634 * Layer 2-Rewrite node uses classify tables to match packets. Then, using
635 * the provisioned mask and value, modifies the packet header.
638 * @todo This is incomplete. This needs a detailed description and a
/* Registers the "set bridge-domain rewrite" CLI command, handled by
 * l2_rw_set_cli_fn. */
642 VLIB_CLI_COMMAND (l2_rw_set_cli, static) = {
643 .path = "set bridge-domain rewrite",
/* Usage string (presumably the value of a field whose designator line is not
 * visible in this view). */
645 "set bridge-domain rewrite <bridge-domain> [disable]",
646 .function = l2_rw_set_cli_fn,
/*
 * Module initialisation, registered through VLIB_INIT_FUNCTION.
 *
 * Calls clib_bitmap_alloc on rw->configs_bitmap and hands
 * rw->feat_next_node_index, together with the names returned by
 * l2input_get_feat_names (), to feat_bitmap_init_next_nodes. The node
 * function later passes rw->feat_next_node_index to vnet_l2_feature_next.
 *
 * NOTE(review): some arguments of feat_bitmap_init_next_nodes and the return
 * statement are not visible in this view.
 */
650 static clib_error_t *
651 l2_rw_init (vlib_main_t * vm)
653 l2_rw_main_t *rw = &l2_rw_main;
656 clib_bitmap_alloc (rw->configs_bitmap, 1);
657 feat_bitmap_init_next_nodes (vm,
660 l2input_get_feat_names (),
661 rw->feat_next_node_index);
665 VLIB_INIT_FUNCTION (l2_rw_init);
/* List of node errors as _(symbol, description) pairs; currently only
 * UNKNOWN. The list is expanded with different definitions of _ below. */
673 #define foreach_l2_rw_error \
674 _(UNKNOWN, "Unknown error")
/* Expansion producing the L2_RW_ERROR_<symbol> identifiers (the surrounding
 * declaration is not visible in this view). */
678 #define _(sym,str) L2_RW_ERROR_##sym,
/* Description strings, taken from the second element of each pair. */
684 static char *l2_rw_error_strings[] = {
685 #define _(sym,string) string,
/*
 * Graph node registration for l2_rw_node: an internal node whose frames carry
 * u32 elements, traced with format_l2_rw_trace, using the error strings from
 * l2_rw_error_strings and no runtime data. The only next node named here is
 * "error-drop" at L2_RW_NEXT_DROP.
 *
 * NOTE(review): at least one field line (e.g. the node name) is not visible
 * in this view.
 */
691 VLIB_REGISTER_NODE (l2_rw_node) = {
693 .vector_size = sizeof (u32),
694 .format_trace = format_l2_rw_trace,
695 .type = VLIB_NODE_TYPE_INTERNAL,
696 .n_errors = ARRAY_LEN(l2_rw_error_strings),
697 .error_strings = l2_rw_error_strings,
698 .runtime_data_bytes = 0,
699 .n_next_nodes = L2_RW_N_NEXT,
700 .next_nodes = { [L2_RW_NEXT_DROP] = "error-drop"},
705 * fd.io coding-style-patch-verification: ON
708 * eval: (c-set-style "gnu")