4 * Copyright (c) 2015 Cisco and/or its affiliates.
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
9 * http://www.apache.org/licenses/LICENSE-2.0
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
18 #include <vnet/fib/fib_table.h>
19 #include <vnet/fib/ip6_fib.h>
20 #include <vnet/adj/adj.h>
21 #include <vnet/map/map_dpo.h>
/*
 * crc_u32 (instruction-based variant): folds `data` into the running value
 * `value` with the `crc32l` instruction through inline asm.  `value` is a
 * read-write ("+r") operand.  The remainder of the asm statement and the
 * return are on lines not visible in this extract.
 */
27 crc_u32 (u32 data, u32 value)
29 __asm__ volatile ("crc32l %[data], %[value];":[value] "+r" (value):[data]
34 #include <vppinfra/xxhash.h>
/*
 * crc_u32 (portable variant): places `data` in the upper 32 bits and
 * `value` in the lower 32 bits of a u64, hashes that with clib_xxhash()
 * and returns the hash truncated to 32 bits.
 */
37 crc_u32 (u32 data, u32 value)
39 u64 tmp = ((u64) data << 32) | (u64) value;
40 return (u32) clib_xxhash (tmp);
46 * This code supports the following MAP modes:
48 * Algorithmic Shared IPv4 address (ea_bits_len > 0):
49 * ea_bits_len + ip4_prefix > 32
50 * psid_length > 0, ip6_prefix < 64, ip4_prefix <= 32
51 * Algorithmic Full IPv4 address (ea_bits_len > 0):
52 * ea_bits_len + ip4_prefix = 32
53 * psid_length = 0, ip6_prefix < 64, ip4_prefix <= 32
54 * Algorithmic IPv4 prefix (ea_bits_len > 0):
55 * ea_bits_len + ip4_prefix < 32
56 * psid_length = 0, ip6_prefix < 64, ip4_prefix <= 32
58 * Independent Shared IPv4 address (ea_bits_len = 0):
61 * Rule IPv6 address = 128, Rule PSID Set
62 * Independent Full IPv4 address (ea_bits_len = 0):
64 * psid_length = 0, ip6_prefix = 128
65 * Independent IPv4 prefix (ea_bits_len = 0):
67 * psid_length = 0, ip6_prefix = 128
72 * This code supports MAP-T:
74 * With DMR prefix length equal to 96.
/*
 * map_create_domain: allocate and initialise a MAP domain and install the
 * IPv4 and IPv6 FIB entries that steer traffic to it.
 *
 * ip4_prefix, ip6_prefix and ip6_src are copied into the new domain;
 * *map_domain_index receives the pool index of the new domain.  `flags`
 * selects translation handling when MAP_DOMAIN_TRANSLATION is set.
 *
 * NOTE(review): the prefix-length / ea_bits_len / psid_offset parameters
 * and the return statements are on lines not visible in this extract;
 * confirm their types and the error return values there.
 */
81 map_create_domain (ip4_address_t * ip4_prefix,
83 ip6_address_t * ip6_prefix,
85 ip6_address_t * ip6_src,
89 u8 psid_length, u32 * map_domain_index, u16 mtu, u8 flags)
91 u8 suffix_len, suffix_shift;
92 map_main_t *mm = &map_main;
93 dpo_id_t dpo_v4 = DPO_INVALID;
94 dpo_id_t dpo_v6 = DPO_INVALID;
97 /* Sanity check on the src prefix length */
98 if (flags & MAP_DOMAIN_TRANSLATION)
100 if (ip6_src_len != 96)
102 clib_warning ("MAP-T only supports ip6_src_len = 96 for now.");
108 if (ip6_src_len != 128)
111 ("MAP-E requires a BR address, not a prefix (ip6_src_len should "
117 /* How many, and which bits to grab from the IPv4 DA */
118 if (ip4_prefix_len + ea_bits_len < 32)
120 flags |= MAP_DOMAIN_PREFIX;
121 suffix_shift = 32 - ip4_prefix_len - ea_bits_len;
122 suffix_len = ea_bits_len;
127 suffix_len = 32 - ip4_prefix_len;
130 /* EA bits must be within the first 64 bits */
131 if (ea_bits_len > 0 && ((ip6_prefix_len + ea_bits_len) > 64 ||
132 ip6_prefix_len + suffix_len + psid_length > 64))
135 ("Embedded Address bits must be within the first 64 bits of "
140 /* Get domain index */
141 pool_get_aligned (mm->domains, d, CLIB_CACHE_LINE_BYTES);
142 memset (d, 0, sizeof (*d));
143 *map_domain_index = d - mm->domains;
145 /* Init domain struct */
146 d->ip4_prefix.as_u32 = ip4_prefix->as_u32;
147 d->ip4_prefix_len = ip4_prefix_len;
148 d->ip6_prefix = *ip6_prefix;
149 d->ip6_prefix_len = ip6_prefix_len;
150 d->ip6_src = *ip6_src;
151 d->ip6_src_len = ip6_src_len;
152 d->ea_bits_len = ea_bits_len;
153 d->psid_offset = psid_offset;
154 d->psid_length = psid_length;
157 d->suffix_shift = suffix_shift;
/*
 * Mask of the low suffix_len bits.  suffix_len can be 32 (when
 * ip4_prefix_len is 0), and shifting a 32-bit int by 32 is undefined, so
 * the shift is done in 64 bits and narrowed by the assignment.
 */
158 d->suffix_mask = ((u64) 1 << suffix_len) - 1;
/* NOTE(review): psid_length is not range-checked on the visible lines when
 * ea_bits_len is 0; confirm 16 - psid_length - psid_offset cannot go
 * negative. */
160 d->psid_shift = 16 - psid_length - psid_offset;
161 d->psid_mask = (1 << d->psid_length) - 1;
162 d->ea_shift = 64 - ip6_prefix_len - suffix_len - d->psid_length;
164 /* MAP data-plane object */
165 if (d->flags & MAP_DOMAIN_TRANSLATION)
166 map_t_dpo_create (DPO_PROTO_IP4, *map_domain_index, &dpo_v4);
168 map_dpo_create (DPO_PROTO_IP4, *map_domain_index, &dpo_v4);
170 /* Create ip4 route */
172 .fp_proto = FIB_PROTOCOL_IP4,
173 .fp_len = d->ip4_prefix_len,
175 .ip4 = d->ip4_prefix,
179 fib_table_entry_special_dpo_add (0, &pfx,
181 FIB_ENTRY_FLAG_EXCLUSIVE, &dpo_v4);
185 * construct a DPO to use the v6 domain
187 if (d->flags & MAP_DOMAIN_TRANSLATION)
188 map_t_dpo_create (DPO_PROTO_IP6, *map_domain_index, &dpo_v6);
190 map_dpo_create (DPO_PROTO_IP6, *map_domain_index, &dpo_v6);
193 * Multiple MAP domains may share same source IPv6 TEP. Which is just dandy.
194 * We are not tracking the sharing. So a v4 lookup to find the correct
195 * domain post decap/translate is always done
197 * Create ip6 route. This is a reference counted add. If the prefix
198 * already exists and is MAP sourced, it is now MAP source n+1 times
199 * and will need to be removed n+1 times.
201 fib_prefix_t pfx6 = {
202 .fp_proto = FIB_PROTOCOL_IP6,
203 .fp_len = d->ip6_src_len,
204 .fp_addr.ip6 = d->ip6_src,
207 fib_table_entry_special_dpo_add (0, &pfx6,
209 FIB_ENTRY_FLAG_EXCLUSIVE, &dpo_v6);
212 /* Validate packet/byte counters */
213 map_domain_counter_lock (mm);
/* Make sure every simple counter has a zeroed slot for the new index */
215 for (i = 0; i < vec_len (mm->simple_domain_counters); i++)
217 vlib_validate_simple_counter (&mm->simple_domain_counters[i],
219 vlib_zero_simple_counter (&mm->simple_domain_counters[i],
/* Same for every combined (packets + bytes) counter */
222 for (i = 0; i < vec_len (mm->domain_counters); i++)
224 vlib_validate_combined_counter (&mm->domain_counters[i],
226 vlib_zero_combined_counter (&mm->domain_counters[i], *map_domain_index);
228 map_domain_counter_unlock (mm);
/*
 * map_delete_domain: tear down the MAP domain at map_domain_index.
 * Warns when the index does not name an allocated pool element; otherwise
 * removes the FIB_SOURCE_MAP entries built from the domain's IPv4 prefix
 * and IPv6 source prefix length from FIB table 0, frees the rule table and
 * returns the domain to mm->domains.
 */
237 map_delete_domain (u32 map_domain_index)
239 map_main_t *mm = &map_main;
/* Reject indices that are not in use in the domain pool */
242 if (pool_is_free_index (mm->domains, map_domain_index))
244 clib_warning ("MAP domain delete: domain does not exist: %d",
249 d = pool_elt_at_index (mm->domains, map_domain_index);
/* IPv4 route that was added for the domain's IPv4 prefix */
252 .fp_proto = FIB_PROTOCOL_IP4,
253 .fp_len = d->ip4_prefix_len,
255 .ip4 = d->ip4_prefix,
259 fib_table_entry_special_remove (0, &pfx, FIB_SOURCE_MAP);
/* IPv6 route keyed by the domain's source prefix length */
261 fib_prefix_t pfx6 = {
262 .fp_proto = FIB_PROTOCOL_IP6,
263 .fp_len = d->ip6_src_len,
269 fib_table_entry_special_remove (0, &pfx6, FIB_SOURCE_MAP);
/* NOTE(review): whether this free is guarded by a NULL check on d->rules
 * is not visible in this extract -- confirm. */
273 clib_mem_free (d->rules);
275 pool_put (mm->domains, d);
/*
 * map_add_del_psid: set or clear the per-PSID rule (an IPv6 address) of a
 * MAP domain.  The rule table holds (1 << psid_length) ip6_address_t
 * entries indexed by PSID and is allocated zero-filled by this function.
 * NOTE(review): the trailing parameter(s) after `tep` and the return
 * statements are not visible in this extract.
 */
281 map_add_del_psid (u32 map_domain_index, u16 psid, ip6_address_t * tep,
285 map_main_t *mm = &map_main;
287 if (pool_is_free_index (mm->domains, map_domain_index))
289 clib_warning ("MAP rule: domain does not exist: %d", map_domain_index);
292 d = pool_elt_at_index (mm->domains, map_domain_index);
294 /* Rules are only used in 1:1 independent case */
295 if (d->ea_bits_len > 0)
/* Size in bytes of a rule table with one slot per possible PSID */
300 u32 l = (0x1 << d->psid_length) * sizeof (ip6_address_t);
301 d->rules = clib_mem_alloc_aligned (l, CLIB_CACHE_LINE_BYTES);
304 memset (d->rules, 0, l);
/* PSID must index inside the rule table */
307 if (psid >= (0x1 << d->psid_length))
309 clib_warning ("MAP rule: PSID outside bounds: %d [%d]", psid,
310 0x1 << d->psid_length);
/* Store the rule ... */
316 d->rules[psid] = *tep;
/* ... or clear it back to the all-zero address */
320 memset (&d->rules[psid], 0, sizeof (ip6_address_t));
325 #ifdef MAP_SKIP_IP6_LOOKUP
327 * Pre-resolved per-protocol global next-hops
/* One slot per FIB protocol; indexed with FIB_PROTOCOL_IP4 / FIB_PROTOCOL_IP6 */
329 map_main_pre_resolved_t pre_resolved[FIB_PROTOCOL_MAX];
/*
 * map_pre_resolve_init: put a pre-resolved slot into its "not tracking
 * anything" state (invalid FIB entry index) and initialise its embedded
 * FIB node as type FIB_NODE_TYPE_MAP_E.
 */
332 map_pre_resolve_init (map_main_pre_resolved_t * pr)
334 pr->fei = FIB_NODE_INDEX_INVALID;
335 fib_node_init (&pr->node, FIB_NODE_TYPE_MAP_E);
/*
 * format_map_pre_resolve: format() helper (used with %U) that renders a
 * pre-resolved next-hop.  Prints the prefix address of the tracked FIB
 * entry followed by the index of the stacked DPO, or "un-set" when no FIB
 * entry is being tracked.
 *
 * The argument list is received as a pointer (va_list *) and read with
 * va_arg (*ap, ...), like the other format helpers in this file
 * (format_map_domain, format_map_trace, ...).  Receiving va_list by value
 * only works on ABIs where va_list is an array type.
 */
339 format_map_pre_resolve (u8 * s, va_list * ap)
341 map_main_pre_resolved_t *pr = va_arg (*ap, map_main_pre_resolved_t *);
/* A valid fei means a FIB entry is currently being tracked */
343 if (FIB_NODE_INDEX_INVALID != pr->fei)
347 fib_entry_get_prefix (pr->fei, &pfx);
349 return (format (s, "%U (%u)",
350 format_ip46_address, &pfx.fp_addr, IP46_TYPE_ANY,
351 pr->dpo.dpoi_index));
355 return (format (s, "un-set"));
361 * Function definition to inform the FIB node that its last lock has gone.
/* fnv_last_lock callback of map_vft; see the remark below on why it is not
 * expected to fire. */
364 map_last_lock_gone (fib_node_t * node)
367 * The MAP is a root of the graph. As such
368 * it never has children and thus is never locked.
/*
 * map_from_fib_node: recover the enclosing map_main_pre_resolved_t from a
 * pointer to its embedded `node` member, using the member's offset within
 * the structure.  Asserts that the node is of type FIB_NODE_TYPE_MAP_E.
 */
373 static map_main_pre_resolved_t *
374 map_from_fib_node (fib_node_t * node)
377 ASSERT (FIB_NODE_TYPE_MAP_E == node->fn_type);
379 return ((map_main_pre_resolved_t *)
381 STRUCT_OFFSET_OF (map_main_pre_resolved_t, node)));
/*
 * map_stack: refresh pr->dpo with a copy of the IP forwarding DPO that the
 * tracked FIB entry (pr->fei) currently contributes.
 */
385 map_stack (map_main_pre_resolved_t * pr)
389 dpo = fib_entry_contribute_ip_forwarding (pr->fei);
391 dpo_copy (&pr->dpo, dpo);
395 * Function definition to backwalk a FIB node
/*
 * map_back_walk: fnv_back_walk callback of map_vft.  Re-stacks the
 * pre-resolved slot that owns `node` and lets the walk continue.  `ctx` is
 * not used on the visible lines.
 */
397 static fib_node_back_walk_rc_t
398 map_back_walk (fib_node_t * node, fib_node_back_walk_ctx_t * ctx)
400 map_stack (map_from_fib_node (node));
402 return (FIB_NODE_BACK_WALK_CONTINUE);
406 * Function definition to get a FIB node from its index
/*
 * map_fib_node_get: fnv_get callback of map_vft.  Returns the FIB node
 * embedded in pre_resolved[index].  No bounds check on `index` is visible
 * here.
 */
409 map_fib_node_get (fib_node_index_t index)
411 return (&pre_resolved[index].node);
415 * Virtual function table registered by the MAP pre-resolved next-hops
416 * for participation in the FIB object graph.
/* Callbacks: node lookup by index, last-lock notification and back-walk */
418 const static fib_node_vft_t map_vft = {
419 .fnv_get = map_fib_node_get,
420 .fnv_last_lock = map_last_lock_gone,
421 .fnv_back_walk = map_back_walk,
/*
 * map_fib_resolve: start tracking a next-hop.  Adds a FIB_SOURCE_RR special
 * entry in the default FIB, stores its index in pr->fei, and registers the
 * slot as a child of that entry (child type FIB_NODE_TYPE_MAP_E, child
 * index `proto`), keeping the sibling handle in pr->sibling.
 * NOTE(review): construction of the prefix from proto/len/addr is on lines
 * not visible in this extract.
 */
425 map_fib_resolve (map_main_pre_resolved_t * pr,
426 fib_protocol_t proto, u8 len, const ip46_address_t * addr)
434 pr->fei = fib_table_entry_special_add (0, // default fib
436 FIB_SOURCE_RR, FIB_ENTRY_FLAG_NONE);
437 pr->sibling = fib_entry_child_add (pr->fei, FIB_NODE_TYPE_MAP_E, proto);
/*
 * map_fib_unresolve: stop tracking a next-hop.  Detaches the slot from the
 * FIB entry, removes the FIB_SOURCE_RR special entry from the default FIB,
 * drops the stacked DPO and marks fei / sibling as invalid again.
 */
442 map_fib_unresolve (map_main_pre_resolved_t * pr,
443 fib_protocol_t proto, u8 len, const ip46_address_t * addr)
/* Detach from the entry before the entry itself is removed */
451 fib_entry_child_remove (pr->fei, pr->sibling);
453 fib_table_entry_special_remove (0, // default fib
454 &pfx, FIB_SOURCE_RR);
455 dpo_reset (&pr->dpo);
457 pr->fei = FIB_NODE_INDEX_INVALID;
458 pr->sibling = FIB_NODE_INDEX_INVALID;
/*
 * map_pre_resolve: add or remove the pre-resolved IPv6 and/or IPv4
 * next-hops.  An address is acted on only when its pointer is non-NULL and
 * the address is non-zero; IPv6 uses a /128 and IPv4 a /32.
 * NOTE(review): the branch choosing unresolve vs. resolve is not visible
 * in this extract; presumably it tests is_del -- confirm.
 */
462 map_pre_resolve (ip4_address_t * ip4, ip6_address_t * ip6, int is_del)
464 if (ip6 && (ip6->as_u64[0] != 0 || ip6->as_u64[1] != 0))
466 ip46_address_t addr = {
470 map_fib_unresolve (&pre_resolved[FIB_PROTOCOL_IP6],
471 FIB_PROTOCOL_IP6, 128, &addr);
473 map_fib_resolve (&pre_resolved[FIB_PROTOCOL_IP6],
474 FIB_PROTOCOL_IP6, 128, &addr);
476 if (ip4 && (ip4->as_u32 != 0))
478 ip46_address_t addr = {
482 map_fib_unresolve (&pre_resolved[FIB_PROTOCOL_IP4],
483 FIB_PROTOCOL_IP4, 32, &addr);
485 map_fib_resolve (&pre_resolved[FIB_PROTOCOL_IP4],
486 FIB_PROTOCOL_IP4, 32, &addr);
/*
 * CLI handler: parses one line of input and sets mm->sec_check to false on
 * "off" or true on "on".  Any other token produces an "unknown input"
 * error.  The line input is released with unformat_free().
 */
491 static clib_error_t *
492 map_security_check_command_fn (vlib_main_t * vm,
493 unformat_input_t * input,
494 vlib_cli_command_t * cmd)
496 unformat_input_t _line_input, *line_input = &_line_input;
497 map_main_t *mm = &map_main;
498 clib_error_t *error = NULL;
500 /* Get a line of input. */
501 if (!unformat_user (input, unformat_line_input, line_input))
504 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
506 if (unformat (line_input, "off"))
507 mm->sec_check = false;
508 else if (unformat (line_input, "on"))
509 mm->sec_check = true;
512 error = clib_error_return (0, "unknown input `%U'",
513 format_unformat_error, line_input);
519 unformat_free (line_input);
/*
 * CLI handler: parses one line of input and sets mm->sec_check_frag to
 * false on "off" or true on "on".  Any other token produces an "unknown
 * input" error.  The line input is released with unformat_free().
 */
524 static clib_error_t *
525 map_security_check_frag_command_fn (vlib_main_t * vm,
526 unformat_input_t * input,
527 vlib_cli_command_t * cmd)
529 unformat_input_t _line_input, *line_input = &_line_input;
530 map_main_t *mm = &map_main;
531 clib_error_t *error = NULL;
533 /* Get a line of input. */
534 if (!unformat_user (input, unformat_line_input, line_input))
537 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
539 if (unformat (line_input, "off"))
540 mm->sec_check_frag = false;
541 else if (unformat (line_input, "on"))
542 mm->sec_check_frag = true;
545 error = clib_error_return (0, "unknown input `%U'",
546 format_unformat_error, line_input);
552 unformat_free (line_input);
/*
 * CLI handler that creates a MAP domain.  Recognised keywords:
 *   ip4-pfx <addr>/<len>, ip6-pfx <addr>/<len>, ip6-src <addr>[/<len>],
 *   ea-bits-len <n>, psid-offset <n>, psid-len <n>, mtu <n>, map-t
 * "map-t" sets MAP_DOMAIN_TRANSLATION in the flags handed to
 * map_create_domain().  Unknown tokens and missing mandatory arguments are
 * reported as errors.
 */
557 static clib_error_t *
558 map_add_domain_command_fn (vlib_main_t * vm,
559 unformat_input_t * input, vlib_cli_command_t * cmd)
561 unformat_input_t _line_input, *line_input = &_line_input;
562 ip4_address_t ip4_prefix;
563 ip6_address_t ip6_prefix;
564 ip6_address_t ip6_src;
/* NOTE(review): map_domain_index and ip6_src_len have no initialiser on
 * this line; any later default assignment is not visible in this extract. */
565 u32 ip6_prefix_len = 0, ip4_prefix_len = 0, map_domain_index, ip6_src_len;
567 /* Optional arguments */
568 u32 ea_bits_len = 0, psid_offset = 0, psid_length = 0;
572 clib_error_t *error = NULL;
574 /* Get a line of input. */
575 if (!unformat_user (input, unformat_line_input, line_input))
578 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
581 (line_input, "ip4-pfx %U/%d", unformat_ip4_address, &ip4_prefix,
586 (line_input, "ip6-pfx %U/%d", unformat_ip6_address, &ip6_prefix,
591 (line_input, "ip6-src %U/%d", unformat_ip6_address, &ip6_src,
596 (line_input, "ip6-src %U", unformat_ip6_address, &ip6_src))
598 else if (unformat (line_input, "ea-bits-len %d", &ea_bits_len))
600 else if (unformat (line_input, "psid-offset %d", &psid_offset))
602 else if (unformat (line_input, "psid-len %d", &psid_length))
604 else if (unformat (line_input, "mtu %d", &mtu))
606 else if (unformat (line_input, "map-t"))
607 flags |= MAP_DOMAIN_TRANSLATION;
610 error = clib_error_return (0, "unknown input `%U'",
611 format_unformat_error, line_input);
618 error = clib_error_return (0, "mandatory argument(s) missing");
/* NOTE(review): the result of map_create_domain() is not used on the
 * visible lines, so a rejected domain may not be reported to the CLI user
 * -- confirm against the full source. */
622 map_create_domain (&ip4_prefix, ip4_prefix_len,
623 &ip6_prefix, ip6_prefix_len, &ip6_src, ip6_src_len,
624 ea_bits_len, psid_offset, psid_length, &map_domain_index,
628 unformat_free (line_input);
/*
 * CLI handler that deletes a MAP domain: parses "index <n>" and passes the
 * index to map_delete_domain().  Unknown tokens and a missing index are
 * reported as errors.
 */
633 static clib_error_t *
634 map_del_domain_command_fn (vlib_main_t * vm,
635 unformat_input_t * input, vlib_cli_command_t * cmd)
637 unformat_input_t _line_input, *line_input = &_line_input;
639 u32 map_domain_index;
640 clib_error_t *error = NULL;
642 /* Get a line of input. */
643 if (!unformat_user (input, unformat_line_input, line_input))
646 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
648 if (unformat (line_input, "index %d", &map_domain_index))
652 error = clib_error_return (0, "unknown input `%U'",
653 format_unformat_error, line_input);
660 error = clib_error_return (0, "mandatory argument(s) missing");
664 map_delete_domain (map_domain_index);
667 unformat_free (line_input);
/*
 * CLI handler that adds a mapping rule: parses "index <n>", "psid <n>" and
 * "ip6-dst <addr>" and calls map_add_del_psid() with a final argument of 1.
 * A non-zero result from map_add_del_psid() is reported as an error, as
 * are unknown tokens and missing mandatory arguments.
 */
672 static clib_error_t *
673 map_add_rule_command_fn (vlib_main_t * vm,
674 unformat_input_t * input, vlib_cli_command_t * cmd)
676 unformat_input_t _line_input, *line_input = &_line_input;
679 u32 psid = 0, map_domain_index;
680 clib_error_t *error = NULL;
682 /* Get a line of input. */
683 if (!unformat_user (input, unformat_line_input, line_input))
686 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
688 if (unformat (line_input, "index %d", &map_domain_index))
690 else if (unformat (line_input, "psid %d", &psid))
693 if (unformat (line_input, "ip6-dst %U", unformat_ip6_address, &tep))
697 error = clib_error_return (0, "unknown input `%U'",
698 format_unformat_error, line_input);
705 error = clib_error_return (0, "mandatory argument(s) missing");
/* psid is parsed as u32 and narrowed to the u16 parameter here */
709 if (map_add_del_psid (map_domain_index, psid, &tep, 1) != 0)
711 error = clib_error_return (0, "Failing to add Mapping Rule");
716 unformat_free (line_input);
721 #if MAP_SKIP_IP6_LOOKUP
/*
 * CLI handler for the pre-resolved next-hops: parses "ip4-nh <addr>",
 * "ip6-nh <addr>" and "del", then calls map_pre_resolve() with the
 * collected pointers and the delete flag.  Both addresses start zeroed and
 * both pointers start NULL.
 * NOTE(review): the assignments to p_v4 / p_v6 / is_del are on lines not
 * visible in this extract.
 */
722 static clib_error_t *
723 map_pre_resolve_command_fn (vlib_main_t * vm,
724 unformat_input_t * input,
725 vlib_cli_command_t * cmd)
727 unformat_input_t _line_input, *line_input = &_line_input;
728 ip4_address_t ip4nh, *p_v4 = NULL;
729 ip6_address_t ip6nh, *p_v6 = NULL;
730 clib_error_t *error = NULL;
733 memset (&ip4nh, 0, sizeof (ip4nh));
734 memset (&ip6nh, 0, sizeof (ip6nh));
736 /* Get a line of input. */
737 if (!unformat_user (input, unformat_line_input, line_input))
740 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
742 if (unformat (line_input, "ip4-nh %U", unformat_ip4_address, &ip4nh))
745 if (unformat (line_input, "ip6-nh %U", unformat_ip6_address, &ip6nh))
747 else if (unformat (line_input, "del"))
751 error = clib_error_return (0, "unknown input `%U'",
752 format_unformat_error, line_input);
757 map_pre_resolve (p_v4, p_v6, is_del);
760 unformat_free (line_input);
/*
 * CLI handler that sets the IPv4 source address stored in
 * mm->icmp4_src_address.  The stored address is reset to 0 first and then
 * overwritten by an IPv4 address parsed from the input line, if any.
 * NOTE(review): because the reset happens before parsing, invoking the
 * command with no or invalid input leaves the address cleared -- confirm
 * that this is intended.
 */
766 static clib_error_t *
767 map_icmp_relay_source_address_command_fn (vlib_main_t * vm,
768 unformat_input_t * input,
769 vlib_cli_command_t * cmd)
771 unformat_input_t _line_input, *line_input = &_line_input;
772 ip4_address_t icmp_src_address;
773 map_main_t *mm = &map_main;
774 clib_error_t *error = NULL;
776 mm->icmp4_src_address.as_u32 = 0;
778 /* Get a line of input. */
779 if (!unformat_user (input, unformat_line_input, line_input))
782 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
785 (line_input, "%U", unformat_ip4_address, &icmp_src_address))
786 mm->icmp4_src_address = icmp_src_address;
789 error = clib_error_return (0, "unknown input `%U'",
790 format_unformat_error, line_input);
796 unformat_free (line_input);
/*
 * CLI handler: sets mm->icmp6_enabled to true on "on" or false on "off".
 * Unknown tokens and missing mandatory arguments are reported as errors.
 */
801 static clib_error_t *
802 map_icmp_unreachables_command_fn (vlib_main_t * vm,
803 unformat_input_t * input,
804 vlib_cli_command_t * cmd)
806 unformat_input_t _line_input, *line_input = &_line_input;
807 map_main_t *mm = &map_main;
809 clib_error_t *error = NULL;
811 /* Get a line of input. */
812 if (!unformat_user (input, unformat_line_input, line_input))
815 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
818 if (unformat (line_input, "on"))
819 mm->icmp6_enabled = true;
820 else if (unformat (line_input, "off"))
821 mm->icmp6_enabled = false;
824 error = clib_error_return (0, "unknown input `%U'",
825 format_unformat_error, line_input);
832 error = clib_error_return (0, "mandatory argument(s) missing");
835 unformat_free (line_input);
/*
 * CLI handler: "inner" sets mm->frag_inner to true, "outer" sets it to
 * false.  Any other token produces an "unknown input" error.
 */
840 static clib_error_t *
841 map_fragment_command_fn (vlib_main_t * vm,
842 unformat_input_t * input, vlib_cli_command_t * cmd)
844 unformat_input_t _line_input, *line_input = &_line_input;
845 map_main_t *mm = &map_main;
846 clib_error_t *error = NULL;
848 /* Get a line of input. */
849 if (!unformat_user (input, unformat_line_input, line_input))
852 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
854 if (unformat (line_input, "inner"))
855 mm->frag_inner = true;
856 else if (unformat (line_input, "outer"))
857 mm->frag_inner = false;
860 error = clib_error_return (0, "unknown input `%U'",
861 format_unformat_error, line_input);
867 unformat_free (line_input);
/*
 * CLI handler: "on" sets mm->frag_ignore_df to true, "off" sets it to
 * false.  Any other token produces an "unknown input" error.
 */
872 static clib_error_t *
873 map_fragment_df_command_fn (vlib_main_t * vm,
874 unformat_input_t * input,
875 vlib_cli_command_t * cmd)
877 unformat_input_t _line_input, *line_input = &_line_input;
878 map_main_t *mm = &map_main;
879 clib_error_t *error = NULL;
881 /* Get a line of input. */
882 if (!unformat_user (input, unformat_line_input, line_input))
885 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
887 if (unformat (line_input, "on"))
888 mm->frag_ignore_df = true;
889 else if (unformat (line_input, "off"))
890 mm->frag_ignore_df = false;
893 error = clib_error_return (0, "unknown input `%U'",
894 format_unformat_error, line_input);
900 unformat_free (line_input);
/*
 * CLI handler for the traffic-class setting: accepts either the keyword
 * "copy" or a hexadecimal value parsed into `tc`.  Any other token
 * produces an "unknown input" error.
 * NOTE(review): the statements that store the parsed setting are on lines
 * not visible in this extract.
 */
905 static clib_error_t *
906 map_traffic_class_command_fn (vlib_main_t * vm,
907 unformat_input_t * input,
908 vlib_cli_command_t * cmd)
910 unformat_input_t _line_input, *line_input = &_line_input;
911 map_main_t *mm = &map_main;
913 clib_error_t *error = NULL;
917 /* Get a line of input. */
918 if (!unformat_user (input, unformat_line_input, line_input))
921 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
923 if (unformat (line_input, "copy"))
925 else if (unformat (line_input, "%x", &tc))
929 error = clib_error_return (0, "unknown input `%U'",
930 format_unformat_error, line_input);
936 unformat_free (line_input);
/*
 * format_map_domain: format() helper taking (map_domain_t *, int counters).
 * Emits one line describing the domain (index, prefixes, EA/PSID
 * parameters, MTU, "map-t" marker), optional TX/RX packet/byte counters,
 * and the configured rules, skipping rules whose address is all-zero.
 */
942 format_map_domain (u8 * s, va_list * args)
944 map_domain_t *d = va_arg (*args, map_domain_t *);
/* bool is promoted to int through varargs, hence va_arg (..., int) */
945 bool counters = va_arg (*args, int);
946 map_main_t *mm = &map_main;
947 ip6_address_t ip6_prefix;
950 memset (&ip6_prefix, 0, sizeof (ip6_prefix));
952 ip6_prefix = d->ip6_prefix;
955 "[%d] ip4-pfx %U/%d ip6-pfx %U/%d ip6-src %U/%d ea_bits_len %d psid-offset %d psid-len %d mtu %d %s",
957 format_ip4_address, &d->ip4_prefix, d->ip4_prefix_len,
958 format_ip6_address, &ip6_prefix, d->ip6_prefix_len,
959 format_ip6_address, &d->ip6_src, d->ip6_src_len,
960 d->ea_bits_len, d->psid_offset, d->psid_length, d->mtu,
961 (d->flags & MAP_DOMAIN_TRANSLATION) ? "map-t" : "");
/* Counters are read under the domain counter lock; the counter index is
 * the domain's pool index (d - mm->domains). */
965 map_domain_counter_lock (mm);
967 vlib_get_combined_counter (&mm->domain_counters[MAP_DOMAIN_COUNTER_TX],
968 d - mm->domains, &v);
969 s = format (s, " TX: %lld/%lld", v.packets, v.bytes);
970 vlib_get_combined_counter (&mm->domain_counters[MAP_DOMAIN_COUNTER_RX],
971 d - mm->domains, &v);
972 s = format (s, " RX: %lld/%lld", v.packets, v.bytes);
973 map_domain_counter_unlock (mm);
975 s = format (s, "\n");
/* One rule slot per possible PSID value */
981 for (i = 0; i < (0x1 << d->psid_length); i++)
984 if (dst.as_u64[0] == 0 && dst.as_u64[1] == 0)
987 " rule psid: %d ip6-dst %U\n", i, format_ip6_address,
/*
 * format_map_ip4_reass: format() helper taking a map_ip4_reass_t *.
 * Prints the reassembly key (src, dst, protocol, fragment id), the port
 * (or -1 when r->port is negative) and the remaining lifetime in seconds,
 * which is -1 once the entry has expired.
 */
995 format_map_ip4_reass (u8 * s, va_list * args)
997 map_main_t *mm = &map_main;
998 map_ip4_reass_t *r = va_arg (*args, map_ip4_reass_t *);
999 map_ip4_reass_key_t *k = &r->key;
1000 f64 now = vlib_time_now (mm->vlib_main);
/* Configured lifetime is in milliseconds; convert to seconds */
1001 f64 lifetime = (((f64) mm->ip4_reass_conf_lifetime_ms) / 1000);
1002 f64 dt = (r->ts + lifetime > now) ? (r->ts + lifetime - now) : -1;
1004 "ip4-reass src=%U dst=%U protocol=%d identifier=%d port=%d lifetime=%.3lf\n",
1005 format_ip4_address, &k->src.as_u8, format_ip4_address,
1006 &k->dst.as_u8, k->protocol,
1007 clib_net_to_host_u16 (k->fragment_id),
1008 (r->port >= 0) ? clib_net_to_host_u16 (r->port) : -1, dt);
/*
 * format_map_ip6_reass: format() helper taking a map_ip6_reass_t *.
 * Prints the reassembly key (src, dst, protocol, 32-bit fragment id) and
 * the remaining lifetime in seconds, which is -1 once the entry has
 * expired.
 */
1013 format_map_ip6_reass (u8 * s, va_list * args)
1015 map_main_t *mm = &map_main;
1016 map_ip6_reass_t *r = va_arg (*args, map_ip6_reass_t *);
1017 map_ip6_reass_key_t *k = &r->key;
1018 f64 now = vlib_time_now (mm->vlib_main);
/* Configured lifetime is in milliseconds; convert to seconds */
1019 f64 lifetime = (((f64) mm->ip6_reass_conf_lifetime_ms) / 1000);
1020 f64 dt = (r->ts + lifetime > now) ? (r->ts + lifetime - now) : -1;
1022 "ip6-reass src=%U dst=%U protocol=%d identifier=%d lifetime=%.3lf\n",
1023 format_ip6_address, &k->src.as_u8, format_ip6_address,
1024 &k->dst.as_u8, k->protocol,
1025 clib_net_to_host_u32 (k->fragment_id), dt);
/*
 * CLI handler that prints MAP domains.  Accepts "counters" and
 * "index <n>".  With no index (map_domain_index left at ~0) every domain in
 * the pool is printed; otherwise only the requested one, after checking
 * that the index is in use.
 */
1029 static clib_error_t *
1030 show_map_domain_command_fn (vlib_main_t * vm, unformat_input_t * input,
1031 vlib_cli_command_t * cmd)
1033 unformat_input_t _line_input, *line_input = &_line_input;
1034 map_main_t *mm = &map_main;
1036 bool counters = false;
/* ~0 means "no index given" */
1037 u32 map_domain_index = ~0;
1038 clib_error_t *error = NULL;
1040 /* Get a line of input. */
1041 if (!unformat_user (input, unformat_line_input, line_input))
1044 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1046 if (unformat (line_input, "counters"))
1048 else if (unformat (line_input, "index %d", &map_domain_index))
1052 error = clib_error_return (0, "unknown input `%U'",
1053 format_unformat_error, line_input);
1058 if (pool_elts (mm->domains) == 0)
1059 vlib_cli_output (vm, "No MAP domains are configured...");
1061 if (map_domain_index == ~0)
1064 pool_foreach(d, mm->domains, ({vlib_cli_output(vm, "%U", format_map_domain, d, counters);}));
1069 if (pool_is_free_index (mm->domains, map_domain_index))
1071 error = clib_error_return (0, "MAP domain does not exists %d",
1076 d = pool_elt_at_index (mm->domains, map_domain_index);
1077 vlib_cli_output (vm, "%U", format_map_domain, d, counters);
1081 unformat_free (line_input);
/*
 * CLI handler that prints every entry of the IPv4 and IPv6 reassembly
 * pools using format_map_ip4_reass / format_map_ip6_reass.
 */
1086 static clib_error_t *
1087 show_map_fragments_command_fn (vlib_main_t * vm, unformat_input_t * input,
1088 vlib_cli_command_t * cmd)
1090 map_main_t *mm = &map_main;
1091 map_ip4_reass_t *f4;
1092 map_ip6_reass_t *f6;
1095 pool_foreach(f4, mm->ip4_reass_pool, ({vlib_cli_output (vm, "%U", format_map_ip4_reass, f4);}));
1098 pool_foreach(f6, mm->ip6_reass_pool, ({vlib_cli_output (vm, "%U", format_map_ip6_reass, f6);}));
/*
 * map_error_counter_get: return the current value of error counter
 * `map_error` of graph node `node_index`.  The node-local error code is
 * turned into an index into the global counter vector by adding the node's
 * error_heap_index.
 */
1104 map_error_counter_get (u32 node_index, map_error_t map_error)
1106 vlib_main_t *vm = vlib_get_main ();
1107 vlib_node_runtime_t *error_node = vlib_node_get_runtime (vm, node_index);
1108 vlib_error_main_t *em = &vm->error_main;
1109 vlib_error_t e = error_node->errors[map_error];
1110 vlib_node_t *n = vlib_get_node (vm, node_index);
/* Node-local code, checked against the node's error count ... */
1113 ci = vlib_error_get_code (e);
1114 ASSERT (ci < n->n_errors);
/* ... then rebased into the global counter vector */
1115 ci += n->error_heap_index;
1117 return (em->counters[ci]);
/*
 * CLI handler that prints MAP statistics: memory used by domains and rule
 * tables, the pre-resolved next-hops (when MAP_SKIP_IP6_LOOKUP is set),
 * the global feature switches, and packet/byte totals summed over all
 * domains for each combined counter.
 */
1120 static clib_error_t *
1121 show_map_stats_command_fn (vlib_main_t * vm, unformat_input_t * input,
1122 vlib_cli_command_t * cmd)
1124 map_main_t *mm = &map_main;
1126 int domains = 0, rules = 0, domaincount = 0, rulecount = 0;
1127 if (pool_elts (mm->domains) == 0)
1128 vlib_cli_output (vm, "No MAP domains are configured...");
1131 pool_foreach(d, mm->domains, ({
1133 rulecount+= 0x1 << d->psid_length;
1134 rules += sizeof(ip6_address_t) * (0x1 << d->psid_length);
1136 domains += sizeof(*d);
/* sizeof yields size_t; cast so that the argument matches %d */
1141 vlib_cli_output (vm, "MAP domains structure: %d\n", (int) sizeof (map_domain_t));
1142 vlib_cli_output (vm, "MAP domains: %d (%d bytes)\n", domaincount, domains);
1143 vlib_cli_output (vm, "MAP rules: %d (%d bytes)\n", rulecount, rules);
1144 vlib_cli_output (vm, "Total: %d bytes\n", rules + domains);
1146 #if MAP_SKIP_IP6_LOOKUP
1147 vlib_cli_output (vm,
1148 "MAP pre-resolve: IP6 next-hop: %U, IP4 next-hop: %U\n",
1149 format_map_pre_resolve, &pre_resolved[FIB_PROTOCOL_IP6],
1150 format_map_pre_resolve, &pre_resolved[FIB_PROTOCOL_IP4]);
1155 vlib_cli_output (vm, "MAP traffic-class: copy");
1157 vlib_cli_output (vm, "MAP traffic-class: %x", mm->tc);
1159 vlib_cli_output (vm,
1160 "MAP IPv6 inbound security check: %s, fragmented packet security check: %s",
1161 mm->sec_check ? "enabled" : "disabled",
1162 mm->sec_check_frag ? "enabled" : "disabled");
1164 vlib_cli_output (vm, "ICMP-relay IPv4 source address: %U\n",
1165 format_ip4_address, &mm->icmp4_src_address);
1166 vlib_cli_output (vm, "ICMP6 unreachables sent for unmatched packets: %s\n",
1167 mm->icmp6_enabled ? "enabled" : "disabled");
1168 vlib_cli_output (vm, "Inner fragmentation: %s\n",
1169 mm->frag_inner ? "enabled" : "disabled");
1170 vlib_cli_output (vm, "Fragment packets regardless of DF flag: %s\n",
1171 mm->frag_ignore_df ? "enabled" : "disabled");
1176 vlib_combined_counter_main_t *cm = mm->domain_counters;
1177 u64 total_pkts[MAP_N_DOMAIN_COUNTER];
1178 u64 total_bytes[MAP_N_DOMAIN_COUNTER];
1182 memset (total_pkts, 0, sizeof (total_pkts));
1183 memset (total_bytes, 0, sizeof (total_bytes));
/* Sum each combined counter over all of its per-domain slots */
1185 map_domain_counter_lock (mm);
1186 vec_foreach (cm, mm->domain_counters)
/* Position of this counter within the vector (TX, RX, ...) */
1188 which = cm - mm->domain_counters;
1190 for (i = 0; i < vlib_combined_counter_n_counters (cm); i++)
1192 vlib_get_combined_counter (cm, i, &v);
1193 total_pkts[which] += v.packets;
1194 total_bytes[which] += v.bytes;
1197 map_domain_counter_unlock (mm);
1199 vlib_cli_output (vm, "Encapsulated packets: %lld bytes: %lld\n",
1200 total_pkts[MAP_DOMAIN_COUNTER_TX],
1201 total_bytes[MAP_DOMAIN_COUNTER_TX]);
1202 vlib_cli_output (vm, "Decapsulated packets: %lld bytes: %lld\n",
1203 total_pkts[MAP_DOMAIN_COUNTER_RX],
1204 total_bytes[MAP_DOMAIN_COUNTER_RX]);
/* NOTE(review): confirm that %d matches the return type of
 * vlib_get_simple_counter(). */
1206 vlib_cli_output (vm, "ICMP relayed packets: %d\n",
1207 vlib_get_simple_counter (&mm->icmp_relayed, 0));
/*
 * CLI handler that tunes the fragment reassembly parameters.  Recognised
 * keywords: lifetime <n>, ht-ratio <f>, pool-size <n>, buffers <n>, ip4,
 * ip6.  At least one of ip4 / ip6 must be given.  Each tunable starts at a
 * "not specified" sentinel (~0 for the integers, HT_RATIO_MAX + 1 for
 * ht_ratio) and is only range-checked and applied when it differs from
 * that sentinel.  All range checks run before any setting is applied.
 */
1212 static clib_error_t *
1213 map_params_reass_command_fn (vlib_main_t * vm, unformat_input_t * input,
1214 vlib_cli_command_t * cmd)
1216 unformat_input_t _line_input, *line_input = &_line_input;
/* Sentinel: one above the IPv4 maximum means "ht-ratio not specified" */
1218 f64 ht_ratio = (MAP_IP4_REASS_CONF_HT_RATIO_MAX + 1);
1220 u64 buffers = ~(0ull);
1221 u8 ip4 = 0, ip6 = 0;
1223 if (!unformat_user (input, unformat_line_input, line_input))
1226 while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT)
1228 if (unformat (line_input, "lifetime %u", &lifetime))
1230 else if (unformat (line_input, "ht-ratio %lf", &ht_ratio))
1232 else if (unformat (line_input, "pool-size %u", &pool_size))
1234 else if (unformat (line_input, "buffers %llu", &buffers))
1236 else if (unformat (line_input, "ip4"))
1238 else if (unformat (line_input, "ip6"))
1242 unformat_free (line_input);
1243 return clib_error_return (0, "invalid input");
1246 unformat_free (line_input);
1249 return clib_error_return (0, "must specify ip4 and/or ip6");
/* Range checks against the IPv4 limits */
1253 if (pool_size != ~0 && pool_size > MAP_IP4_REASS_CONF_POOL_SIZE_MAX)
1254 return clib_error_return (0, "invalid ip4-reass pool-size ( > %d)",
1255 MAP_IP4_REASS_CONF_POOL_SIZE_MAX);
1256 if (ht_ratio != (MAP_IP4_REASS_CONF_HT_RATIO_MAX + 1)
1257 && ht_ratio > MAP_IP4_REASS_CONF_HT_RATIO_MAX)
1258 return clib_error_return (0, "invalid ip4-reass ht-ratio ( > %d)",
1259 MAP_IP4_REASS_CONF_HT_RATIO_MAX);
1260 if (lifetime != ~0 && lifetime > MAP_IP4_REASS_CONF_LIFETIME_MAX)
1261 return clib_error_return (0, "invalid ip4-reass lifetime ( > %d)",
1262 MAP_IP4_REASS_CONF_LIFETIME_MAX);
1263 if (buffers != ~(0ull) && buffers > MAP_IP4_REASS_CONF_BUFFERS_MAX)
1264 return clib_error_return (0, "invalid ip4-reass buffers ( > %ld)",
1265 MAP_IP4_REASS_CONF_BUFFERS_MAX);
/* Range checks against the IPv6 limits.  The "not specified" test still
 * compares against the IPv4-based sentinel used to initialise ht_ratio. */
1270 if (pool_size != ~0 && pool_size > MAP_IP6_REASS_CONF_POOL_SIZE_MAX)
1271 return clib_error_return (0, "invalid ip6-reass pool-size ( > %d)",
1272 MAP_IP6_REASS_CONF_POOL_SIZE_MAX);
1273 if (ht_ratio != (MAP_IP4_REASS_CONF_HT_RATIO_MAX + 1)
1274 && ht_ratio > MAP_IP6_REASS_CONF_HT_RATIO_MAX)
/* NOTE(review): this message says "ht-log2len" while the option being
 * checked is ht-ratio (the IPv4 message says "ht-ratio"). */
1275 return clib_error_return (0, "invalid ip6-reass ht-log2len ( > %d)",
1276 MAP_IP6_REASS_CONF_HT_RATIO_MAX);
1277 if (lifetime != ~0 && lifetime > MAP_IP6_REASS_CONF_LIFETIME_MAX)
1278 return clib_error_return (0, "invalid ip6-reass lifetime ( > %d)",
1279 MAP_IP6_REASS_CONF_LIFETIME_MAX);
1280 if (buffers != ~(0ull) && buffers > MAP_IP6_REASS_CONF_BUFFERS_MAX)
1281 return clib_error_return (0, "invalid ip6-reass buffers ( > %ld)",
1282 MAP_IP6_REASS_CONF_BUFFERS_MAX);
/* Apply the IPv4 settings; reass / packets receive the counts that are
 * reported as destroyed-reassembly / dropped-fragments */
1287 u32 reass = 0, packets = 0;
1288 if (pool_size != ~0)
1290 if (map_ip4_reass_conf_pool_size (pool_size, &reass, &packets))
1292 vlib_cli_output (vm, "Could not set ip4-reass pool-size");
1296 vlib_cli_output (vm,
1297 "Setting ip4-reass pool-size (destroyed-reassembly=%u , dropped-fragments=%u)",
1301 if (ht_ratio != (MAP_IP4_REASS_CONF_HT_RATIO_MAX + 1))
1303 if (map_ip4_reass_conf_ht_ratio (ht_ratio, &reass, &packets))
/* NOTE(review): these messages say "ht-log2len" for the ht-ratio setting */
1305 vlib_cli_output (vm, "Could not set ip4-reass ht-log2len");
1309 vlib_cli_output (vm,
1310 "Setting ip4-reass ht-log2len (destroyed-reassembly=%u , dropped-fragments=%u)",
1316 if (map_ip4_reass_conf_lifetime (lifetime))
1317 vlib_cli_output (vm, "Could not set ip4-reass lifetime");
1319 vlib_cli_output (vm, "Setting ip4-reass lifetime");
1321 if (buffers != ~(0ull))
1323 if (map_ip4_reass_conf_buffers (buffers))
1324 vlib_cli_output (vm, "Could not set ip4-reass buffers");
1326 vlib_cli_output (vm, "Setting ip4-reass buffers");
/* Informational only: more buffers configured than the pool can use */
1329 if (map_main.ip4_reass_conf_buffers >
1330 map_main.ip4_reass_conf_pool_size *
1331 MAP_IP4_REASS_MAX_FRAGMENTS_PER_REASSEMBLY)
1333 vlib_cli_output (vm,
1334 "Note: 'ip4-reass buffers' > pool-size * max-fragments-per-reassembly.");
/* Apply the IPv6 settings, mirroring the IPv4 sequence */
1340 u32 reass = 0, packets = 0;
1341 if (pool_size != ~0)
1343 if (map_ip6_reass_conf_pool_size (pool_size, &reass, &packets))
1345 vlib_cli_output (vm, "Could not set ip6-reass pool-size");
1349 vlib_cli_output (vm,
1350 "Setting ip6-reass pool-size (destroyed-reassembly=%u , dropped-fragments=%u)",
1354 if (ht_ratio != (MAP_IP4_REASS_CONF_HT_RATIO_MAX + 1))
1356 if (map_ip6_reass_conf_ht_ratio (ht_ratio, &reass, &packets))
1358 vlib_cli_output (vm, "Could not set ip6-reass ht-log2len");
1362 vlib_cli_output (vm,
1363 "Setting ip6-reass ht-log2len (destroyed-reassembly=%u , dropped-fragments=%u)",
1369 if (map_ip6_reass_conf_lifetime (lifetime))
1370 vlib_cli_output (vm, "Could not set ip6-reass lifetime");
1372 vlib_cli_output (vm, "Setting ip6-reass lifetime");
1374 if (buffers != ~(0ull))
1376 if (map_ip6_reass_conf_buffers (buffers))
1377 vlib_cli_output (vm, "Could not set ip6-reass buffers");
1379 vlib_cli_output (vm, "Setting ip6-reass buffers");
1382 if (map_main.ip6_reass_conf_buffers >
1383 map_main.ip6_reass_conf_pool_size *
1384 MAP_IP6_REASS_MAX_FRAGMENTS_PER_REASSEMBLY)
1386 vlib_cli_output (vm,
1387 "Note: 'ip6-reass buffers' > pool-size * max-fragments-per-reassembly.");
1396 * packet trace format function
/*
 * format_map_trace: packet-trace format() helper.  Consumes the vlib_main_t
 * and vlib_node_t arguments without using them, then prints the MAP domain
 * index and the L4 port (converted from network byte order) recorded in
 * the map_trace_t.
 * NOTE(review): the declaration of `port` is on a line not visible in this
 * extract.
 */
1399 format_map_trace (u8 * s, va_list * args)
1401 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
1402 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
1403 map_trace_t *t = va_arg (*args, map_trace_t *);
1404 u32 map_domain_index = t->map_domain_index;
1408 format (s, "MAP domain index: %d L4 port: %u", map_domain_index,
1409 clib_net_to_host_u16 (port));
/*
 * map_ip4_reass_lookup: walk the chain of hash bucket `bucket` looking for
 * a reassembly whose 128-bit key equals *k and whose lifetime has not yet
 * elapsed at time `now`.  Chain links are pool indices terminated by
 * MAP_REASS_INDEX_NONE.
 */
1414 static_always_inline map_ip4_reass_t *
1415 map_ip4_reass_lookup (map_ip4_reass_key_t * k, u32 bucket, f64 now)
1417 map_main_t *mm = &map_main;
1418 u32 ri = mm->ip4_reass_hash_table[bucket];
1419 while (ri != MAP_REASS_INDEX_NONE)
1421 map_ip4_reass_t *r = pool_elt_at_index (mm->ip4_reass_pool, ri);
/* Match on both key words and require the entry to be unexpired */
1422 if (r->key.as_u64[0] == k->as_u64[0] &&
1423 r->key.as_u64[1] == k->as_u64[1] &&
1424 now < r->ts + (((f64) mm->ip4_reass_conf_lifetime_ms) / 1000))
1428 ri = r->bucket_next;
/*
 * Index of reassembly entry r inside map_main.ip4_reass_pool, computed as a
 * pointer difference. The argument is parenthesised so that any pointer
 * expression (not only a plain identifier) expands correctly.
 */
1433 #define map_ip4_reass_pool_index(r) ((r) - map_main.ip4_reass_pool)
/*
 * Release IPv4 reassembly entry r: pass it, together with the pi_to_drop
 * vector, to map_ip4_reass_get_fragments() (presumably to collect its
 * buffered fragments for dropping - confirm against that helper), unlink it
 * from its hash bucket chain and from the FIFO list, return it to the pool
 * and decrement the allocation counter.
 */
1436 map_ip4_reass_free (map_ip4_reass_t * r, u32 ** pi_to_drop)
1438 map_main_t *mm = &map_main;
1439 map_ip4_reass_get_fragments (r, pi_to_drop);
1441 // Unlink in hash bucket
/* Search the bucket chain for r; r2 ends up as r's predecessor, or stays NULL when r is the chain head. */
1442 map_ip4_reass_t *r2 = NULL;
1443 u32 r2i = mm->ip4_reass_hash_table[r->bucket];
1444 while (r2i != map_ip4_reass_pool_index (r))
/* r must be reachable from its own bucket; hitting the end of the chain is a logic error. */
1446 ASSERT (r2i != MAP_REASS_INDEX_NONE);
1447 r2 = pool_elt_at_index (mm->ip4_reass_pool, r2i);
1448 r2i = r2->bucket_next;
/* Bypass r: either through its predecessor or by updating the bucket head. */
1452 r2->bucket_next = r->bucket_next;
1456 mm->ip4_reass_hash_table[r->bucket] = r->bucket_next;
/* FIFO unlink: an entry whose fifo_next is itself is the only element of the list. */
1460 if (r->fifo_next == map_ip4_reass_pool_index (r))
1462 mm->ip4_reass_fifo_last = MAP_REASS_INDEX_NONE;
/* If r is the entry referenced by ip4_reass_fifo_last, move that reference to r's predecessor. */
1466 if (mm->ip4_reass_fifo_last == map_ip4_reass_pool_index (r))
1467 mm->ip4_reass_fifo_last = r->fifo_prev;
1468 pool_elt_at_index (mm->ip4_reass_pool, r->fifo_prev)->fifo_next =
1470 pool_elt_at_index (mm->ip4_reass_pool, r->fifo_next)->fifo_prev =
/* Give the entry back to the pool and account for it. */
1474 pool_put (mm->ip4_reass_pool, r);
1475 mm->ip4_reass_allocated--;
/*
 * Find or create the IPv4 reassembly entry for the flow identified by
 * (src, dst, fragment_id, protocol).
 *
 * The four 32-bit words of the key are folded with crc_u32() and the top
 * ip4_reass_ht_log2len bits of the result select the hash bucket. Before the
 * lookup, entries at ip4_reass_fifo_last whose lifetime has elapsed are
 * freed, with pi_to_drop handed on to map_ip4_reass_free(). A new entry is
 * only allocated while ip4_reass_allocated is below ip4_reass_conf_pool_size.
 */
1479 map_ip4_reass_get (u32 src, u32 dst, u16 fragment_id,
1480 u8 protocol, u32 ** pi_to_drop)
1483 map_main_t *mm = &map_main;
1484 map_ip4_reass_key_t k = {.src.data_u32 = src,
1485 .dst.data_u32 = dst,
1486 .fragment_id = fragment_id,
1487 .protocol = protocol
/* Hash the whole key, one 32-bit word at a time. */
1491 h = crc_u32 (k.as_u32[0], h);
1492 h = crc_u32 (k.as_u32[1], h);
1493 h = crc_u32 (k.as_u32[2], h);
1494 h = crc_u32 (k.as_u32[3], h);
/* Keep only the most significant ip4_reass_ht_log2len bits as the bucket index. */
1495 h = h >> (32 - mm->ip4_reass_ht_log2len);
1497 f64 now = vlib_time_now (mm->vlib_main);
1499 //Cache garbage collection
1500 while (mm->ip4_reass_fifo_last != MAP_REASS_INDEX_NONE)
1502 map_ip4_reass_t *last =
1503 pool_elt_at_index (mm->ip4_reass_pool, mm->ip4_reass_fifo_last);
/* Expired when creation time plus the configured lifetime (ms -> s) lies in the past. */
1504 if (last->ts + (((f64) mm->ip4_reass_conf_lifetime_ms) / 1000) < now)
1505 map_ip4_reass_free (last, pi_to_drop);
/* Prefer an existing, still-valid entry for this key. */
1510 if ((r = map_ip4_reass_lookup (&k, h, now)))
/* Enforce the configured limit on concurrently allocated reassemblies. */
1513 if (mm->ip4_reass_allocated >= mm->ip4_reass_conf_pool_size)
1516 pool_get (mm->ip4_reass_pool, r);
1517 mm->ip4_reass_allocated++;
/* ~0 marks an unused fragment slot. */
1519 for (i = 0; i < MAP_IP4_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1520 r->fragments[i] = ~0;
1522 u32 ri = map_ip4_reass_pool_index (r);
1524 //Link in new bucket
/* Push the new entry at the head of the bucket chain. */
1526 r->bucket_next = mm->ip4_reass_hash_table[h];
1527 mm->ip4_reass_hash_table[h] = ri;
/* Non-empty FIFO: splice the new entry in right after the current fifo_last entry. */
1530 if (mm->ip4_reass_fifo_last != MAP_REASS_INDEX_NONE)
1533 pool_elt_at_index (mm->ip4_reass_pool,
1534 mm->ip4_reass_fifo_last)->fifo_next;
1535 r->fifo_prev = mm->ip4_reass_fifo_last;
1536 pool_elt_at_index (mm->ip4_reass_pool, r->fifo_prev)->fifo_next = ri;
1537 pool_elt_at_index (mm->ip4_reass_pool, r->fifo_next)->fifo_prev = ri;
/* Empty FIFO: the new entry links to itself and becomes fifo_last. */
1541 r->fifo_next = r->fifo_prev = ri;
1542 mm->ip4_reass_fifo_last = ri;
/* Only when byte counting is compiled in: 0xffff is the initial expected_total. */
1549 #ifdef MAP_IP4_REASS_COUNT_BYTES
1550 r->expected_total = 0xffff;
/*
 * Remember buffer index pi as a fragment of reassembly r. The buffer is
 * stored in the first free slot of r->fragments (a slot holding ~0) and the
 * global buffered-fragment counter is incremented.
 */
1558 map_ip4_reass_add_fragment (map_ip4_reass_t * r, u32 pi)
/* Global cap on buffered fragments, checked before any slot is taken. */
1560 if (map_main.ip4_reass_buffered_counter >= map_main.ip4_reass_conf_buffers)
1564 for (i = 0; i < MAP_IP4_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1565 if (r->fragments[i] == ~0)
1567 r->fragments[i] = pi;
1568 map_main.ip4_reass_buffered_counter++;
/*
 * Walk the chain of IPv6 reassembly entries attached to hash bucket `bucket`
 * (linked through bucket_next and terminated by MAP_REASS_INDEX_NONE).
 * An entry is a candidate when its lifetime, counted from r->ts, has not yet
 * elapsed at `now` and all five 64-bit words of its key equal those of *k.
 */
1574 static_always_inline map_ip6_reass_t *
1575 map_ip6_reass_lookup (map_ip6_reass_key_t * k, u32 bucket, f64 now)
1577 map_main_t *mm = &map_main;
1578 u32 ri = mm->ip6_reass_hash_table[bucket];
1579 while (ri != MAP_REASS_INDEX_NONE)
1581 map_ip6_reass_t *r = pool_elt_at_index (mm->ip6_reass_pool, ri);
/* The configured lifetime is in milliseconds; /1000 puts it on the scale of now and r->ts. */
1582 if (now < r->ts + (((f64) mm->ip6_reass_conf_lifetime_ms) / 1000) &&
1583 r->key.as_u64[0] == k->as_u64[0] &&
1584 r->key.as_u64[1] == k->as_u64[1] &&
1585 r->key.as_u64[2] == k->as_u64[2] &&
1586 r->key.as_u64[3] == k->as_u64[3] &&
1587 r->key.as_u64[4] == k->as_u64[4])
/* Advance to the next entry chained in the same bucket. */
1589 ri = r->bucket_next;
/*
 * Index of reassembly entry r inside map_main.ip6_reass_pool, computed as a
 * pointer difference. The argument is parenthesised so that any pointer
 * expression (not only a plain identifier) expands correctly.
 */
1594 #define map_ip6_reass_pool_index(r) ((r) - map_main.ip6_reass_pool)
/*
 * Release IPv6 reassembly entry r: append the buffer index of every buffered
 * fragment to the *pi_to_drop vector, unlink r from its hash bucket chain and
 * from the FIFO list, return it to the pool and decrement the allocation
 * counter.
 */
1597 map_ip6_reass_free (map_ip6_reass_t * r, u32 ** pi_to_drop)
1599 map_main_t *mm = &map_main;
/* Hand every occupied slot (pi != ~0) to the caller and mark the slot free again. */
1601 for (i = 0; i < MAP_IP6_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1602 if (r->fragments[i].pi != ~0)
1604 vec_add1 (*pi_to_drop, r->fragments[i].pi);
1605 r->fragments[i].pi = ~0;
1606 map_main.ip6_reass_buffered_counter--;
1609 // Unlink in hash bucket
/* Search the bucket chain for r; r2 ends up as r's predecessor, or stays NULL when r is the chain head. */
1610 map_ip6_reass_t *r2 = NULL;
1611 u32 r2i = mm->ip6_reass_hash_table[r->bucket];
1612 while (r2i != map_ip6_reass_pool_index (r))
/* r must be reachable from its own bucket; hitting the end of the chain is a logic error. */
1614 ASSERT (r2i != MAP_REASS_INDEX_NONE);
1615 r2 = pool_elt_at_index (mm->ip6_reass_pool, r2i);
1616 r2i = r2->bucket_next;
/* Bypass r: either through its predecessor or by updating the bucket head. */
1620 r2->bucket_next = r->bucket_next;
1624 mm->ip6_reass_hash_table[r->bucket] = r->bucket_next;
1628 if (r->fifo_next == map_ip6_reass_pool_index (r))
1630 //Single element in the list, list is now empty
1631 mm->ip6_reass_fifo_last = MAP_REASS_INDEX_NONE;
1635 if (mm->ip6_reass_fifo_last == map_ip6_reass_pool_index (r)) //First element
1636 mm->ip6_reass_fifo_last = r->fifo_prev;
1637 pool_elt_at_index (mm->ip6_reass_pool, r->fifo_prev)->fifo_next =
1639 pool_elt_at_index (mm->ip6_reass_pool, r->fifo_next)->fifo_prev =
1643 // Free from pool if necessary
1644 pool_put (mm->ip6_reass_pool, r);
1645 mm->ip6_reass_allocated--;
/*
 * Find or create the IPv6 reassembly entry for the flow identified by
 * (src, dst, fragment_id, protocol).
 *
 * The ten 32-bit words of the key are folded with crc_u32() and the top
 * ip6_reass_ht_log2len bits of the result select the hash bucket. Before the
 * lookup, entries at ip6_reass_fifo_last whose lifetime has elapsed are
 * freed, with pi_to_drop handed on to map_ip6_reass_free(). A new entry is
 * only allocated while ip6_reass_allocated is below ip6_reass_conf_pool_size.
 */
1649 map_ip6_reass_get (ip6_address_t * src, ip6_address_t * dst, u32 fragment_id,
1650 u8 protocol, u32 ** pi_to_drop)
1653 map_main_t *mm = &map_main;
1654 map_ip6_reass_key_t k = {
1657 .fragment_id = fragment_id,
1658 .protocol = protocol
/* Hash the whole key, one 32-bit word at a time. */
1663 for (i = 0; i < 10; i++)
1664 h = crc_u32 (k.as_u32[i], h);
/* Keep only the most significant ip6_reass_ht_log2len bits as the bucket index. */
1665 h = h >> (32 - mm->ip6_reass_ht_log2len);
1667 f64 now = vlib_time_now (mm->vlib_main);
1669 //Cache garbage collection
1670 while (mm->ip6_reass_fifo_last != MAP_REASS_INDEX_NONE)
1672 map_ip6_reass_t *last =
1673 pool_elt_at_index (mm->ip6_reass_pool, mm->ip6_reass_fifo_last);
/* Expired when creation time plus the configured lifetime (ms -> s) lies in the past. */
1674 if (last->ts + (((f64) mm->ip6_reass_conf_lifetime_ms) / 1000) < now)
1675 map_ip6_reass_free (last, pi_to_drop);
/* Prefer an existing, still-valid entry for this key. */
1680 if ((r = map_ip6_reass_lookup (&k, h, now)))
/* Enforce the configured limit on concurrently allocated reassemblies. */
1683 if (mm->ip6_reass_allocated >= mm->ip6_reass_conf_pool_size)
1686 pool_get (mm->ip6_reass_pool, r);
1687 mm->ip6_reass_allocated++;
/* Reset every fragment slot: ~0 means no buffer, and offset/length 0 means nothing recorded. */
1688 for (i = 0; i < MAP_IP6_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1690 r->fragments[i].pi = ~0;
1691 r->fragments[i].next_data_len = 0;
1692 r->fragments[i].next_data_offset = 0;
1695 u32 ri = map_ip6_reass_pool_index (r);
1697 //Link in new bucket
/* Push the new entry at the head of the bucket chain. */
1699 r->bucket_next = mm->ip6_reass_hash_table[h];
1700 mm->ip6_reass_hash_table[h] = ri;
/* Non-empty FIFO: splice the new entry in right after the current fifo_last entry. */
1703 if (mm->ip6_reass_fifo_last != MAP_REASS_INDEX_NONE)
1706 pool_elt_at_index (mm->ip6_reass_pool,
1707 mm->ip6_reass_fifo_last)->fifo_next;
1708 r->fifo_prev = mm->ip6_reass_fifo_last;
1709 pool_elt_at_index (mm->ip6_reass_pool, r->fifo_prev)->fifo_next = ri;
1710 pool_elt_at_index (mm->ip6_reass_pool, r->fifo_next)->fifo_prev = ri;
/* Empty FIFO: the new entry links to itself and becomes fifo_last. */
1714 r->fifo_next = r->fifo_prev = ri;
1715 mm->ip6_reass_fifo_last = ri;
/* A zero version/IHL byte marks the cached inner IPv4 header as not yet captured. */
1721 r->ip4_header.ip_version_and_header_length = 0;
/* Only when byte counting is compiled in: 0xffff is the initial expected_total. */
1722 #ifdef MAP_IP6_REASS_COUNT_BYTES
1723 r->expected_total = 0xffff;
/*
 * Record buffer pi as one fragment of IPv6 reassembly r.
 *
 * data_offset / next_data_offset delimit the payload carried by this
 * fragment, and data_start / data_len describe its leading bytes. Up to 20 of
 * those bytes are copied into the slot of the preceding fragment (next_data)
 * when such a slot is found. The global buffered-fragment counter is
 * incremented once the fragment has been stored.
 */
1730 map_ip6_reass_add_fragment (map_ip6_reass_t * r, u32 pi,
1731 u16 data_offset, u16 next_data_offset,
1732 u8 * data_start, u16 data_len)
1734 map_ip6_fragment_t *f = NULL, *prev_f = NULL;
/* Never keep more than 20 leading bytes of a fragment. */
1735 u16 copied_len = (data_len > 20) ? 20 : data_len;
/* Global cap on buffered fragments, checked before any slot is taken. */
1737 if (map_main.ip6_reass_buffered_counter >= map_main.ip6_reass_conf_buffers)
1740 //Lookup for fragments for the current buffer
1741 //and the one before that
1743 for (i = 0; i < MAP_IP6_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
/* A slot that ends exactly where this fragment starts belongs to the preceding fragment. */
1745 if (data_offset && r->fragments[i].next_data_offset == data_offset)
1747 prev_f = &r->fragments[i]; // This is buffer for previous packet
1749 else if (r->fragments[i].next_data_offset == next_data_offset)
1751 f = &r->fragments[i]; // This is a buffer for the current packet
/* next_data_offset == 0 is the initial (unused) state of a slot. */
1753 else if (r->fragments[i].next_data_offset == 0)
1756 f = &r->fragments[i];
1757 else if (prev_f == NULL)
1758 prev_f = &r->fragments[i];
/* No usable slot, or the chosen slot already holds a buffer. */
1762 if (!f || f->pi != ~0)
/* Stash this fragment's leading bytes in the preceding fragment's slot. */
1770 clib_memcpy (prev_f->next_data, data_start, copied_len);
1771 prev_f->next_data_len = copied_len;
1772 prev_f->next_data_offset = data_offset;
/* 0x45 is IPv4 with a 5-word (option-less) header. */
1776 if (((ip4_header_t *) data_start)->ip_version_and_header_length != 0x45)
/* Cache the inner IPv4 header the first time it is seen for this reassembly. */
1779 if (r->ip4_header.ip_version_and_header_length == 0)
1780 clib_memcpy (&r->ip4_header, data_start, sizeof (ip4_header_t));
1785 f->next_data_offset = next_data_offset;
1787 map_main.ip6_reass_buffered_counter++;
/*
 * Discard all IPv4 virtual-reassembly state and rebuild it from the current
 * configuration. The number of buffered fragments and of allocated
 * reassemblies before the reset is reported through dropped_packets and
 * trashed_reass.
 *
 * Every entry reachable through the FIFO list has its buffered fragments
 * dropped and is returned to the pool. The hash table is then recreated with
 * 1 << ip4_reass_ht_log2len empty buckets, the pool is freed and
 * preallocated for ip4_reass_conf_pool_size entries, and the counters are
 * zeroed.
 */
1793 map_ip4_reass_reinit (u32 * trashed_reass, u32 * dropped_packets)
1795 map_main_t *mm = &map_main;
1798 if (dropped_packets)
1799 *dropped_packets = mm->ip4_reass_buffered_counter;
1801 *trashed_reass = mm->ip4_reass_allocated;
1802 if (mm->ip4_reass_fifo_last != MAP_REASS_INDEX_NONE)
1804 u16 ri = mm->ip4_reass_fifo_last;
1807 map_ip4_reass_t *r = pool_elt_at_index (mm->ip4_reass_pool, ri);
/* Drop every buffer still held by this reassembly (~0 marks an empty slot). */
1808 for (i = 0; i < MAP_IP4_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1809 if (r->fragments[i] != ~0)
1810 map_ip4_drop_pi (r->fragments[i]);
1813 pool_put (mm->ip4_reass_pool, r);
/* Stop once the walk is back at the entry it started from. */
1815 while (ri != mm->ip4_reass_fifo_last);
/* Rebuild the hash table with every bucket empty. */
1818 vec_free (mm->ip4_reass_hash_table);
1819 vec_resize (mm->ip4_reass_hash_table, 1 << mm->ip4_reass_ht_log2len);
1820 for (i = 0; i < (1 << mm->ip4_reass_ht_log2len); i++)
1821 mm->ip4_reass_hash_table[i] = MAP_REASS_INDEX_NONE;
/* Recreate the pool at the configured size. */
1822 pool_free (mm->ip4_reass_pool);
1823 pool_alloc (mm->ip4_reass_pool, mm->ip4_reass_conf_pool_size);
1825 mm->ip4_reass_allocated = 0;
1826 mm->ip4_reass_fifo_last = MAP_REASS_INDEX_NONE;
1827 mm->ip4_reass_buffered_counter = 0;
/*
 * Derive the log2 size of a reassembly hash table from the pool size and the
 * hash-table ratio: search i = 1..30 for the first power of two (1 << i)
 * that is at least pool_size * ht_ratio (truncated to u32).
 */
1831 map_get_ht_log2len (f32 ht_ratio, u16 pool_size)
1833 u32 desired_size = (u32) (pool_size * ht_ratio);
1835 for (i = 1; i < 31; i++)
1836 if ((1 << i) >= desired_size)
/*
 * Set the IPv4 reassembly hash-table ratio. Values above
 * MAP_IP4_REASS_CONF_HT_RATIO_MAX are checked for first. Under the IPv4
 * reassembly lock the ratio is stored, the table's log2 length is recomputed
 * from the ratio and the configured pool size, and all reassembly state is
 * rebuilt; the discarded reassemblies and fragments are reported through
 * trashed_reass and dropped_packets.
 */
1842 map_ip4_reass_conf_ht_ratio (f32 ht_ratio, u32 * trashed_reass,
1843 u32 * dropped_packets)
1845 map_main_t *mm = &map_main;
1846 if (ht_ratio > MAP_IP4_REASS_CONF_HT_RATIO_MAX)
1849 map_ip4_reass_lock ();
1850 mm->ip4_reass_conf_ht_ratio = ht_ratio;
1851 mm->ip4_reass_ht_log2len =
1852 map_get_ht_log2len (ht_ratio, mm->ip4_reass_conf_pool_size);
1853 map_ip4_reass_reinit (trashed_reass, dropped_packets);
1854 map_ip4_reass_unlock ();
/*
 * Set the IPv4 reassembly pool size. Values above
 * MAP_IP4_REASS_CONF_POOL_SIZE_MAX are checked for first. Under the IPv4
 * reassembly lock the new size is stored and all reassembly state is
 * rebuilt; the discarded reassemblies and fragments are reported through
 * trashed_reass and dropped_packets.
 *
 * NOTE(review): ip4_reass_ht_log2len is not recomputed here, so the hash
 * table keeps the length derived from the previous pool size - confirm this
 * is intended.
 */
1859 map_ip4_reass_conf_pool_size (u16 pool_size, u32 * trashed_reass,
1860 u32 * dropped_packets)
1862 map_main_t *mm = &map_main;
1863 if (pool_size > MAP_IP4_REASS_CONF_POOL_SIZE_MAX)
1866 map_ip4_reass_lock ();
1867 mm->ip4_reass_conf_pool_size = pool_size;
1868 map_ip4_reass_reinit (trashed_reass, dropped_packets);
1869 map_ip4_reass_unlock ();
/*
 * Set the lifetime, in milliseconds, of IPv4 reassembly entries. The value
 * is stored directly; existing reassembly state is not rebuilt.
 */
1874 map_ip4_reass_conf_lifetime (u16 lifetime_ms)
1876 map_main.ip4_reass_conf_lifetime_ms = lifetime_ms;
/*
 * Set the global limit on buffered IPv4 fragments (the limit checked by
 * map_ip4_reass_add_fragment). The value is stored directly; existing
 * reassembly state is not rebuilt.
 */
1881 map_ip4_reass_conf_buffers (u32 buffers)
1883 map_main.ip4_reass_conf_buffers = buffers;
/*
 * Discard all IPv6 virtual-reassembly state and rebuild it from the current
 * configuration. The number of buffered fragments and of allocated
 * reassemblies before the reset is reported through dropped_packets and
 * trashed_reass.
 *
 * Every entry reachable through the FIFO list has its buffered fragments
 * dropped and is returned to the pool. The hash table is then recreated with
 * 1 << ip6_reass_ht_log2len empty buckets, the pool is freed and
 * preallocated for ip6_reass_conf_pool_size entries, and the counters are
 * zeroed.
 */
1888 map_ip6_reass_reinit (u32 * trashed_reass, u32 * dropped_packets)
1890 map_main_t *mm = &map_main;
1891 if (dropped_packets)
1892 *dropped_packets = mm->ip6_reass_buffered_counter;
1894 *trashed_reass = mm->ip6_reass_allocated;
1896 if (mm->ip6_reass_fifo_last != MAP_REASS_INDEX_NONE)
1898 u16 ri = mm->ip6_reass_fifo_last;
1901 map_ip6_reass_t *r = pool_elt_at_index (mm->ip6_reass_pool, ri);
/* Drop every buffer still held by this reassembly (~0 marks an empty slot). */
1902 for (i = 0; i < MAP_IP6_REASS_MAX_FRAGMENTS_PER_REASSEMBLY; i++)
1903 if (r->fragments[i].pi != ~0)
1904 map_ip6_drop_pi (r->fragments[i].pi);
1907 pool_put (mm->ip6_reass_pool, r);
/* Stop once the walk is back at the entry it started from. */
1909 while (ri != mm->ip6_reass_fifo_last);
1910 mm->ip6_reass_fifo_last = MAP_REASS_INDEX_NONE;
/* Rebuild the hash table with every bucket empty. */
1913 vec_free (mm->ip6_reass_hash_table);
1914 vec_resize (mm->ip6_reass_hash_table, 1 << mm->ip6_reass_ht_log2len);
1915 for (i = 0; i < (1 << mm->ip6_reass_ht_log2len); i++)
1916 mm->ip6_reass_hash_table[i] = MAP_REASS_INDEX_NONE;
1917 pool_free (mm->ip6_reass_pool);
/*
 * Preallocate from the IPv6 pool-size setting: that is the limit
 * map_ip6_reass_get() enforces on ip6_reass_allocated, and it is configured
 * independently of the IPv4 pool size.
 */
1918 pool_alloc (mm->ip6_reass_pool, mm->ip6_reass_conf_pool_size);
1920 mm->ip6_reass_allocated = 0;
1921 mm->ip6_reass_buffered_counter = 0;
/*
 * Set the IPv6 reassembly hash-table ratio. Values above
 * MAP_IP6_REASS_CONF_HT_RATIO_MAX are checked for first. Under the IPv6
 * reassembly lock the ratio is stored, the table's log2 length is recomputed
 * from the ratio and the configured pool size, and all reassembly state is
 * rebuilt; the discarded reassemblies and fragments are reported through
 * trashed_reass and dropped_packets.
 */
1925 map_ip6_reass_conf_ht_ratio (f32 ht_ratio, u32 * trashed_reass,
1926 u32 * dropped_packets)
1928 map_main_t *mm = &map_main;
1929 if (ht_ratio > MAP_IP6_REASS_CONF_HT_RATIO_MAX)
1932 map_ip6_reass_lock ();
1933 mm->ip6_reass_conf_ht_ratio = ht_ratio;
1934 mm->ip6_reass_ht_log2len =
1935 map_get_ht_log2len (ht_ratio, mm->ip6_reass_conf_pool_size);
1936 map_ip6_reass_reinit (trashed_reass, dropped_packets);
1937 map_ip6_reass_unlock ();
/*
 * Set the IPv6 reassembly pool size. Values above
 * MAP_IP6_REASS_CONF_POOL_SIZE_MAX are checked for first. Under the IPv6
 * reassembly lock the new size is stored and all reassembly state is
 * rebuilt; the discarded reassemblies and fragments are reported through
 * trashed_reass and dropped_packets.
 *
 * NOTE(review): ip6_reass_ht_log2len is not recomputed here, so the hash
 * table keeps the length derived from the previous pool size - confirm this
 * is intended.
 */
1942 map_ip6_reass_conf_pool_size (u16 pool_size, u32 * trashed_reass,
1943 u32 * dropped_packets)
1945 map_main_t *mm = &map_main;
1946 if (pool_size > MAP_IP6_REASS_CONF_POOL_SIZE_MAX)
1949 map_ip6_reass_lock ();
1950 mm->ip6_reass_conf_pool_size = pool_size;
1951 map_ip6_reass_reinit (trashed_reass, dropped_packets);
1952 map_ip6_reass_unlock ();
/*
 * Set the lifetime, in milliseconds, of IPv6 reassembly entries. The value
 * is stored directly; existing reassembly state is not rebuilt.
 */
1957 map_ip6_reass_conf_lifetime (u16 lifetime_ms)
1959 map_main.ip6_reass_conf_lifetime_ms = lifetime_ms;
/*
 * Set the global limit on buffered IPv6 fragments (the limit checked by
 * map_ip6_reass_add_fragment). The value is stored directly; existing
 * reassembly state is not rebuilt.
 */
1964 map_ip6_reass_conf_buffers (u32 buffers)
1966 map_main.ip6_reass_conf_buffers = buffers;
1973 * Configure MAP reassembly behaviour
1976 * @cliexstart{map params reassembly}
/*
 * CLI registration for "map params reassembly", handled by
 * map_params_reass_command_fn. Despite the ip4-specific variable name, the
 * command takes either ip4 or ip6 (see short_help).
 */
1979 VLIB_CLI_COMMAND(map_ip4_reass_lifetime_command, static) = {
1980 .path = "map params reassembly",
1981 .short_help = "map params reassembly [ip4 | ip6] [lifetime <lifetime-ms>] "
1982 "[pool-size <pool-size>] [buffers <buffers>] "
1983 "[ht-ratio <ht-ratio>]",
1984 .function = map_params_reass_command_fn,
1988 * Set or copy the IP TOS/Traffic Class field
1991 * @cliexstart{map params traffic-class}
1993 * This command is used to set the traffic-class field in translated
1994 * or encapsulated packets. If copy is specified (the default) then the
1995 * traffic-class/TOS field is copied from the original packet to the
1996 * translated / encapsulating header.
/* CLI registration for "map params traffic-class", handled by map_traffic_class_command_fn. */
1999 VLIB_CLI_COMMAND(map_traffic_class_command, static) = {
2000 .path = "map params traffic-class",
2001 .short_help = "map params traffic-class {0x0-0xff | copy}",
2002 .function = map_traffic_class_command_fn,
2006 * Bypass IP4/IP6 lookup
2009 * @cliexstart{map params pre-resolve}
2011 * Bypass a second FIB lookup of the translated or encapsulated
2012 * packet, and forward the packet directly to the specified
2013 * next-hop. This optimization trades forwarding flexibility for
/*
 * CLI registration for "map params pre-resolve", handled by
 * map_pre_resolve_command_fn. The help text offers an IPv4 or an IPv6
 * next-hop address.
 */
2017 VLIB_CLI_COMMAND(map_pre_resolve_command, static) = {
2018 .path = "map params pre-resolve",
2019 .short_help = " map params pre-resolve {ip4-nh <address>} "
2020 "| {ip6-nh <address>}",
2021 .function = map_pre_resolve_command_fn,
2025 * Enable or disable the MAP-E inbound security check
2028 * @cliexstart{map params security-check}
2030 * By default, a decapsulated packet's IPv4 source address will be
2031 * verified against the outer header's IPv6 source address. Disabling
2032 * this feature will allow IPv4 source address spoofing.
/* CLI registration for "map params security-check", handled by map_security_check_command_fn. */
2035 VLIB_CLI_COMMAND(map_security_check_command, static) = {
2036 .path = "map params security-check",
2037 .short_help = "map params security-check on|off",
2038 .function = map_security_check_command_fn,
2042 * Specify the IPv4 source address used for relayed ICMP error messages
2045 * @cliexstart{map params icmp source-address}
2047 * This command specifies which IPv4 source address (must be local to
2048 * the system), that is used for relayed received IPv6 ICMP error
/* CLI registration for "map params icmp source-address", handled by map_icmp_relay_source_address_command_fn. */
2052 VLIB_CLI_COMMAND(map_icmp_relay_source_address_command, static) = {
2053 .path = "map params icmp source-address",
2054 .short_help = "map params icmp source-address <ip4-address>",
2055 .function = map_icmp_relay_source_address_command_fn,
2059 * Send IPv6 ICMP unreachables
2062 * @cliexstart{map params icmp6 unreachables}
2064 * Send IPv6 ICMP unreachable messages back if security check fails or
2065 * no MAP domain exists.
/* CLI registration for "map params icmp6 unreachables", handled by map_icmp_unreachables_command_fn. */
2068 VLIB_CLI_COMMAND(map_icmp_unreachables_command, static) = {
2069 .path = "map params icmp6 unreachables",
2070 .short_help = "map params icmp6 unreachables {on|off}",
2071 .function = map_icmp_unreachables_command_fn,
2075 * Configure MAP fragmentation behaviour
2078 * @cliexstart{map params fragment}
/* CLI registration for "map params fragment" (inner or outer fragmentation), handled by map_fragment_command_fn. */
2081 VLIB_CLI_COMMAND(map_fragment_command, static) = {
2082 .path = "map params fragment",
2083 .short_help = "map params fragment inner|outer",
2084 .function = map_fragment_command_fn,
2088 * Ignore the IPv4 Don't fragment bit
2091 * @cliexstart{map params fragment ignore-df}
2093 * Allows fragmentation of the IPv4 packet even if the DF bit is
2094 * set. The choice between inner or outer fragmentation of tunnel
2095 * packets is complicated. The benefit of inner fragmentation is that
2096 * the ultimate endpoint must reassemble, instead of the tunnel
/* CLI registration for "map params fragment ignore-df", handled by map_fragment_df_command_fn. */
2100 VLIB_CLI_COMMAND(map_fragment_df_command, static) = {
2101 .path = "map params fragment ignore-df",
2102 .short_help = "map params fragment ignore-df on|off",
2103 .function = map_fragment_df_command_fn,
2107 * Specify if the inbound security check should be done on fragments
2110 * @cliexstart{map params security-check fragments}
2112 * Typically the inbound on-decapsulation security check is only done
2113 * on the first packet, i.e. the packet that contains the L4
2114 * information. While a security check on every fragment is possible,
2115 * it has a cost. State must be created on the first fragment.
/* CLI registration for "map params security-check fragments", handled by map_security_check_frag_command_fn. */
2118 VLIB_CLI_COMMAND(map_security_check_frag_command, static) = {
2119 .path = "map params security-check fragments",
2120 .short_help = "map params security-check fragments on|off",
2121 .function = map_security_check_frag_command_fn,
2128 * @cliexstart{map add domain}
/*
 * CLI registration for "map add domain", handled by
 * map_add_domain_command_fn. Per the help text, map-t and mtu are optional
 * and the remaining parameters are expected.
 */
2131 VLIB_CLI_COMMAND(map_add_domain_command, static) = {
2132 .path = "map add domain",
2133 .short_help = "map add domain ip4-pfx <ip4-pfx> ip6-pfx <ip6-pfx> "
2134 "ip6-src <ip6-pfx> ea-bits-len <n> psid-offset <n> psid-len <n> "
2135 "[map-t] [mtu <mtu>]",
2136 .function = map_add_domain_command_fn,
2140 * Add MAP rule to a domain
2143 * @cliexstart{map add rule}
/* CLI registration for "map add rule" (domain index, PSID and IPv6 destination), handled by map_add_rule_command_fn. */
2146 VLIB_CLI_COMMAND(map_add_rule_command, static) = {
2147 .path = "map add rule",
2148 .short_help = "map add rule index <domain> psid <psid> ip6-dst <ip6-addr>",
2149 .function = map_add_rule_command_fn,
2156 * @cliexstart{map del domain}
/* CLI registration for "map del domain" (by domain index), handled by map_del_domain_command_fn. */
2159 VLIB_CLI_COMMAND(map_del_command, static) = {
2160 .path = "map del domain",
2161 .short_help = "map del domain index <domain>",
2162 .function = map_del_domain_command_fn,
2169 * @cliexstart{show map domain}
/* CLI registration for "show map domain" (optional counters keyword), handled by show_map_domain_command_fn. */
2172 VLIB_CLI_COMMAND(show_map_domain_command, static) = {
2173 .path = "show map domain",
2174 .short_help = "show map domain index <n> [counters]",
2175 .function = show_map_domain_command_fn,
2179 * Show MAP statistics
2182 * @cliexstart{show map stats}
/* CLI registration for "show map stats", handled by show_map_stats_command_fn. */
2185 VLIB_CLI_COMMAND(show_map_stats_command, static) = {
2186 .path = "show map stats",
2187 .short_help = "show map stats",
2188 .function = show_map_stats_command_fn,
2192 * Show MAP fragmentation information
2195 * @cliexstart{show map fragments}
/* CLI registration for "show map fragments", handled by show_map_fragments_command_fn. */
2198 VLIB_CLI_COMMAND(show_map_fragments_command, static) = {
2199 .path = "show map fragments",
2200 .short_help = "show map fragments",
2201 .function = show_map_fragments_command_fn,
2209 map_init (vlib_main_t * vm)
2211 map_main_t *mm = &map_main;
2212 mm->vnet_main = vnet_get_main ();
2215 #ifdef MAP_SKIP_IP6_LOOKUP
2216 fib_protocol_t proto;
2218 FOR_EACH_FIB_PROTOCOL (proto)
2220 map_pre_resolve_init (&pre_resolved[proto]);
2228 /* Inbound security check */
2229 mm->sec_check = true;
2230 mm->sec_check_frag = false;
2232 /* ICMP6 Type 1, Code 5 for security check failure */
2233 mm->icmp6_enabled = false;
2235 /* Inner or outer fragmentation */
2236 mm->frag_inner = false;
2237 mm->frag_ignore_df = false;
2239 vec_validate (mm->domain_counters, MAP_N_DOMAIN_COUNTER - 1);
2240 mm->domain_counters[MAP_DOMAIN_COUNTER_RX].name = "rx";
2241 mm->domain_counters[MAP_DOMAIN_COUNTER_TX].name = "tx";
2243 vlib_validate_simple_counter (&mm->icmp_relayed, 0);
2244 vlib_zero_simple_counter (&mm->icmp_relayed, 0);
2246 /* IP4 virtual reassembly */
2247 mm->ip4_reass_hash_table = 0;
2248 mm->ip4_reass_pool = 0;
2249 mm->ip4_reass_lock =
2250 clib_mem_alloc_aligned (CLIB_CACHE_LINE_BYTES, CLIB_CACHE_LINE_BYTES);
2251 mm->ip4_reass_conf_ht_ratio = MAP_IP4_REASS_HT_RATIO_DEFAULT;
2252 mm->ip4_reass_conf_lifetime_ms = MAP_IP4_REASS_LIFETIME_DEFAULT;
2253 mm->ip4_reass_conf_pool_size = MAP_IP4_REASS_POOL_SIZE_DEFAULT;
2254 mm->ip4_reass_conf_buffers = MAP_IP4_REASS_BUFFERS_DEFAULT;
2255 mm->ip4_reass_ht_log2len =
2256 map_get_ht_log2len (mm->ip4_reass_conf_ht_ratio,
2257 mm->ip4_reass_conf_pool_size);
2258 mm->ip4_reass_fifo_last = MAP_REASS_INDEX_NONE;
2259 map_ip4_reass_reinit (NULL, NULL);
2261 /* IP6 virtual reassembly */
2262 mm->ip6_reass_hash_table = 0;
2263 mm->ip6_reass_pool = 0;
2264 mm->ip6_reass_lock =
2265 clib_mem_alloc_aligned (CLIB_CACHE_LINE_BYTES, CLIB_CACHE_LINE_BYTES);
2266 mm->ip6_reass_conf_ht_ratio = MAP_IP6_REASS_HT_RATIO_DEFAULT;
2267 mm->ip6_reass_conf_lifetime_ms = MAP_IP6_REASS_LIFETIME_DEFAULT;
2268 mm->ip6_reass_conf_pool_size = MAP_IP6_REASS_POOL_SIZE_DEFAULT;
2269 mm->ip6_reass_conf_buffers = MAP_IP6_REASS_BUFFERS_DEFAULT;
2270 mm->ip6_reass_ht_log2len =
2271 map_get_ht_log2len (mm->ip6_reass_conf_ht_ratio,
2272 mm->ip6_reass_conf_pool_size);
2273 mm->ip6_reass_fifo_last = MAP_REASS_INDEX_NONE;
2274 map_ip6_reass_reinit (NULL, NULL);
2276 #ifdef MAP_SKIP_IP6_LOOKUP
2277 fib_node_register_type (FIB_NODE_TYPE_MAP_E, &map_vft);
2279 map_dpo_module_init ();
2284 VLIB_INIT_FUNCTION (map_init);
2287 * fd.io coding-style-patch-verification: ON
2290 * eval: (c-set-style "gnu")