2 * Copyright (c) 2018 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #ifndef included_acl_inlines_h
17 #define included_acl_inlines_h
21 #include <vlib/unix/plugin.h>
22 #include <plugins/acl/acl.h>
23 #include <plugins/acl/fa_node.h>
24 #include <plugins/acl/hash_lookup_private.h>
26 #include <plugins/acl/exported_types.h>
/*
 * Helper macros for resolving a symbol exported by another plugin.
 *
 * LOAD_SYMBOL_FROM_PLUGIN_TO(p, s, st) looks up the symbol named `s` in
 * plugin `p` with vlib_get_plugin_symbol() and stores the result in `st`.
 * The error path returns a clib error naming the plugin and the symbol, so
 * the macro is only usable inside a function returning clib_error_t *.
 *
 * LOAD_SYMBOL(s) is the shorthand for "acl_plugin.so" where the destination
 * variable has the same name as the symbol.
 */
28 #define LOAD_SYMBOL_FROM_PLUGIN_TO(p, s, st) \
30 st = vlib_get_plugin_symbol(p, #s); \
32 return clib_error_return(0, \
33 "Plugin %s and/or symbol %s not found.", p, #s); \
36 #define LOAD_SYMBOL(s) LOAD_SYMBOL_FROM_PLUGIN_TO("acl_plugin.so", s, s)
/*
 * Set up the caller-provided ACL plugin method table `m`.
 *
 * Resolves acl_plugin_methods_vtable_init from "acl_plugin.so" into `mvi`;
 * a failed lookup returns the error produced by LOAD_SYMBOL_FROM_PLUGIN_TO.
 * NOTE(review): the statement that passes `m` to `mvi` is not visible in
 * this excerpt - confirm against the full file.
 */
39 static inline clib_error_t * acl_plugin_exports_init (acl_plugin_methods_t *m)
41 acl_plugin_methods_vtable_init_fn_t mvi;
43 LOAD_SYMBOL_FROM_PLUGIN_TO("acl_plugin.so", acl_plugin_methods_vtable_init, mvi);
/*
 * Compute the address `offset` bytes past the buffer's current data pointer
 * (as returned by vlib_buffer_get_current).  No bounds check is visible
 * here; callers are expected to validate the offset themselves.
 */
48 get_ptr_to_offset (vlib_buffer_t * b0, int offset)
50 u8 *p = vlib_buffer_get_current (b0) + offset;
/*
 * Tell whether `offset` is usable for header parsing in buffer b0.
 * Only b0->current_length is consulted.
 */
55 offset_within_packet (vlib_buffer_t * b0, int offset)
57 /* "Within" here means at least 8 bytes of the buffer remain starting at `offset`. */
58 return (offset <= (b0->current_length - 8));
/*
 * Copy the L3 addresses of the packet in b0 into p5tuple_pkt.
 *
 * l3_offset is the distance from the buffer's current data pointer to the
 * start of the IP header.  Two copies are visible below, one for IPv6 and
 * one for IPv4; presumably is_ip6 selects between them (the branch lines
 * are not visible in this excerpt).
 */
63 acl_fill_5tuple_l3_data (acl_main_t * am, vlib_buffer_t * b0, int is_ip6,
64 int l3_offset, fa_5tuple_t * p5tuple_pkt)
/* IPv6: the copy starts at src_address and spans the whole ip6_addr field. */
68 clib_memcpy (&p5tuple_pkt->ip6_addr,
69 get_ptr_to_offset (b0,
70 offsetof (ip6_header_t,
71 src_address) + l3_offset),
72 sizeof (p5tuple_pkt->ip6_addr));
/* IPv4: clear the padding first, then copy starting at src_address for the size of ip4_addr. */
76 memset(p5tuple_pkt->l3_zero_pad, 0, sizeof(p5tuple_pkt->l3_zero_pad));
77 clib_memcpy (&p5tuple_pkt->ip4_addr,
78 get_ptr_to_offset (b0,
79 offsetof (ip4_header_t,
80 src_address) + l3_offset),
81 sizeof (p5tuple_pkt->ip4_addr));
/*
 * Fill the L4 part of the session key (*p5tuple_l4) and the per-packet info
 * (*p5tuple_pkt) from buffer b0, whose IP header starts l3_offset bytes past
 * the current data pointer.
 *
 * Visible behaviour: reads the protocol byte from the IPv6 or IPv4 header,
 * skips IPv6 extension headers flagged in am->fa_ipv6_known_eh_bitmap, marks
 * non-first fragments, and, when the L4 header is within the packet, reads
 * ICMP header bytes or TCP/UDP ports plus one more tcp_header_t byte.
 * Both outputs are assembled in local temporaries and stored as single
 * 64-bit values at the end.
 *
 * NOTE(review): several lines of this function (braces, branch heads, some
 * declarations and assignment targets) are not visible in this excerpt.
 */
86 acl_fill_5tuple_l4_and_pkt_data (acl_main_t * am, u32 sw_if_index0, vlib_buffer_t * b0, int is_ip6, int is_input,
87 int l3_offset, fa_session_l4_key_t *p5tuple_l4, fa_packet_info_t *p5tuple_pkt)
89 /* IP4 and IP6 protocol numbers of ICMP */
90 static u8 icmp_protos_v4v6[] = { IP_PROTOCOL_ICMP, IP_PROTOCOL_ICMP6 };
/* Temporaries: only the low 16 bits of sw_if_index0 are kept in the key. */
96 fa_session_l4_key_t tmp_l4 = { .lsb_of_sw_if_index = sw_if_index0 & 0xffff };
97 fa_packet_info_t tmp_pkt = { .is_ip6 = is_ip6, .mask_type_index_lsb = ~0 };
/* IPv6: protocol byte from the fixed header; L4 tentatively follows it. */
102 *(u8 *) get_ptr_to_offset (b0,
103 offsetof (ip6_header_t,
104 protocol) + l3_offset);
105 l4_offset = l3_offset + sizeof (ip6_header_t);
106 #ifdef FA_NODE_VERBOSE_DEBUG
107 clib_warning ("ACL_FA_NODE_DBG: proto: %d, l4_offset: %d", proto,
110 /* IP6 EH handling is here, increment l4_offset if needs to, update the proto */
111 int need_skip_eh = clib_bitmap_get (am->fa_ipv6_known_eh_bitmap, proto);
112 if (PREDICT_FALSE (need_skip_eh))
/* Keep walking while the current header is a known EH and still within the packet. */
114 while (need_skip_eh && offset_within_packet (b0, l4_offset))
116 /* Fragment header needs special handling */
117 if (PREDICT_FALSE(ACL_EH_FRAGMENT == proto))
/* The first byte of the header is the next-header (protocol) value. */
119 proto = *(u8 *) get_ptr_to_offset (b0, l4_offset);
/* 16-bit field at byte 2; the shift drops its low 3 bits, leaving the fragment offset. */
121 clib_memcpy (&frag_offset, get_ptr_to_offset (b0, 2 + l4_offset), sizeof(frag_offset));
122 frag_offset = clib_net_to_host_u16(frag_offset) >> 3;
125 tmp_pkt.is_nonfirst_fragment = 1;
126 /* invalidate L4 offset so we don't try to find L4 info */
127 l4_offset += b0->current_length;
131 /* First fragment: skip the frag header and move on. */
/* Generic EH: byte 1 is the length in 8-byte units, not counting the first 8 bytes. */
137 u8 nwords = *(u8 *) get_ptr_to_offset (b0, 1 + l4_offset);
138 proto = *(u8 *) get_ptr_to_offset (b0, l4_offset);
139 l4_offset += 8 * (1 + (u16) nwords);
141 #ifdef FA_NODE_VERBOSE_DEBUG
142 clib_warning ("ACL_FA_NODE_DBG: new proto: %d, new offset: %d",
146 clib_bitmap_get (am->fa_ipv6_known_eh_bitmap, proto);
/* IPv4: protocol byte from the header; L4 is assumed to start right after a fixed-size ip4_header_t. */
153 *(u8 *) get_ptr_to_offset (b0,
154 offsetof (ip4_header_t,
155 protocol) + l3_offset);
156 l4_offset = l3_offset + sizeof (ip4_header_t);
157 u16 flags_and_fragment_offset;
/* l3_offset is added to the returned pointer here rather than to the offset argument. */
158 clib_memcpy (&flags_and_fragment_offset,
159 get_ptr_to_offset (b0,
160 offsetof (ip4_header_t,
161 flags_and_fragment_offset)) + l3_offset,
162 sizeof(flags_and_fragment_offset));
163 flags_and_fragment_offset = clib_net_to_host_u16 (flags_and_fragment_offset);
165 /* non-initial fragments have non-zero offset */
/* NOTE(review): 0xfff tests only 12 bits; the IPv4 fragment offset field is 13 bits wide (0x1fff) - confirm. */
166 if ((PREDICT_FALSE(0xfff & flags_and_fragment_offset)))
168 tmp_pkt.is_nonfirst_fragment = 1;
169 /* invalidate L4 offset so we don't try to find L4 info */
170 l4_offset += b0->current_length;
174 tmp_l4.proto = proto;
175 tmp_l4.is_input = is_input;
/* L4 fields are read only when the L4 header lies within the packet. */
177 if (PREDICT_TRUE (offset_within_packet (b0, l4_offset)))
179 tmp_pkt.l4_valid = 1;
/* is_ip6 indexes the table: 0 selects ICMP, 1 selects ICMP6. */
180 if (icmp_protos_v4v6[is_ip6] == proto)
184 *(u8 *) get_ptr_to_offset (b0,
185 l4_offset + offsetof (icmp46_header_t,
189 *(u8 *) get_ptr_to_offset (b0,
190 l4_offset + offsetof (icmp46_header_t,
192 tmp_l4.is_slowpath = 1;
/* TCP and UDP share this branch; tcp_header_t offsets are used for both. */
194 else if ((IP_PROTOCOL_TCP == proto) || (IP_PROTOCOL_UDP == proto))
197 get_ptr_to_offset (b0,
198 l4_offset + offsetof (tcp_header_t,
201 tmp_l4.port[0] = clib_net_to_host_u16 (ports[0]);
202 tmp_l4.port[1] = clib_net_to_host_u16 (ports[1]);
205 *(u8 *) get_ptr_to_offset (b0,
206 l4_offset + offsetof (tcp_header_t,
/* The extra header byte read above is meaningful for TCP only. */
208 tmp_pkt.tcp_flags_valid = (proto == IP_PROTOCOL_TCP);
209 tmp_l4.is_slowpath = 0;
/* Any other protocol is marked slow-path. */
213 tmp_l4.is_slowpath = 1;
/* Publish both results, one 64-bit store each. */
217 p5tuple_pkt->as_u64 = tmp_pkt.as_u64;
218 p5tuple_l4->as_u64 = tmp_l4.as_u64;
/*
 * Build the complete 5-tuple for the packet in b0 into *p5tuple_pkt.
 *
 * First determines l3_offset, the distance from the buffer's current data
 * pointer to the IP header, then delegates to the L3 and L4 fill helpers.
 * Two l3_offset sources are visible: the ethernet header size and the saved
 * rewrite length.  NOTE(review): the conditions choosing between them
 * (presumably based on is_l2_path / is_input) are not visible here.
 */
222 acl_fill_5tuple (acl_main_t * am, u32 sw_if_index0, vlib_buffer_t * b0, int is_ip6,
223 int is_input, int is_l2_path, fa_5tuple_t * p5tuple_pkt)
229 l3_offset = ethernet_buffer_header_size(b0);
236 l3_offset = vnet_buffer(b0)->ip.save_rewrite_length;
239 /* key[0..3] contains src/dst address and is cleared/set below */
240 /* Remainder of the key and per-packet non-key data */
241 acl_fill_5tuple_l3_data(am, b0, is_ip6, l3_offset, p5tuple_pkt);
242 acl_fill_5tuple_l4_and_pkt_data(am, sw_if_index0, b0, is_ip6, is_input, l3_offset, &p5tuple_pkt->l4, &p5tuple_pkt->pkt);
/*
 * Wrapper around acl_fill_5tuple() that takes opaque types.
 *
 * p_acl_main is used as an acl_main_t pointer and p5tuple_pkt is cast to
 * fa_5tuple_t.  The interface index passed down is always 0, and lc_index
 * is not used in the visible lines.
 */
246 acl_plugin_fill_5tuple_inline (void *p_acl_main, u32 lc_index, vlib_buffer_t * b0, int is_ip6,
247 int is_input, int is_l2_path, fa_5tuple_opaque_t * p5tuple_pkt)
249 acl_main_t *am = p_acl_main;
250 acl_fill_5tuple(am, 0, b0, is_ip6, is_input, is_l2_path, (fa_5tuple_t *)p5tuple_pkt);
256 fa_acl_match_ip4_addr (ip4_address_t * addr1, ip4_address_t * addr2,
261 /* match any always succeeds */
264 uint32_t a1 = clib_net_to_host_u32 (addr1->as_u32);
265 uint32_t a2 = clib_net_to_host_u32 (addr2->as_u32);
266 uint32_t mask0 = 0xffffffff - ((1 << (32 - prefixlen)) - 1);
267 return (a1 & mask0) == a2;
271 fa_acl_match_ip6_addr (ip6_address_t * addr1, ip6_address_t * addr2,
276 /* match any always succeeds */
279 if (memcmp (addr1, addr2, prefixlen / 8))
281 /* If the starting full bytes do not match, no point in bittwidling the thumbs further */
286 u8 b1 = *((u8 *) addr1 + 1 + prefixlen / 8);
287 u8 b2 = *((u8 *) addr2 + 1 + prefixlen / 8);
288 u8 mask0 = (0xff - ((1 << (8 - (prefixlen % 8))) - 1));
289 return (b1 & mask0) == b2;
293 /* The prefix fits into integer number of bytes, so nothing left to do */
/*
 * Inclusive range check: true when port_first <= port <= port_last.
 * is_ip6 is not used by the visible expression.
 */
299 fa_acl_match_port (u16 port, u16 port_first, u16 port_last, int is_ip6)
301 return ((port >= port_first) && (port <= port_last));
/*
 * Match a packet 5-tuple against the rules of one ACL, in rule order.
 *
 * am             - ACL plugin main structure holding the ACL pool.
 * acl_index      - index of the ACL to evaluate.
 * pkt_5tuple     - 5-tuple extracted from the packet.
 * is_ip6         - address family of the packet; rules of the other family
 *                  are not considered.
 * r_action       - out: set from the matching rule's is_permit.
 * r_acl_match_p  - out: set to acl_index on a match or when the ACL is missing.
 * r_rule_match_p - out: set to -1 when the ACL does not exist.
 * trace_bitmap   - in/out: bit 0x80000000 is set on a non-first-fragment match.
 *
 * NOTE(review): return statements, `continue`s and some assignments are not
 * visible in this excerpt; the comments below describe only what is shown.
 */
305 single_acl_match_5tuple (acl_main_t * am, u32 acl_index, fa_5tuple_t * pkt_5tuple,
306 int is_ip6, u8 * r_action, u32 * r_acl_match_p,
307 u32 * r_rule_match_p, u32 * trace_bitmap)
/* An ACL index that is free in the pool is handled separately from a normal lookup. */
313 if (pool_is_free_index (am->acls, acl_index))
316 *r_acl_match_p = acl_index;
318 *r_rule_match_p = -1;
319 /* the ACL does not exist but is used for policy. Block traffic. */
322 a = am->acls + acl_index;
323 for (i = 0; i < a->count; i++)
/* Address family of the rule must equal that of the packet. */
326 if (is_ip6 != r->is_ipv6)
/* Addresses: destination is checked before source; index 1 is dst, index 0 is src. */
331 if (!fa_acl_match_ip6_addr
332 (&pkt_5tuple->ip6_addr[1], &r->dst.ip6, r->dst_prefixlen))
334 if (!fa_acl_match_ip6_addr
335 (&pkt_5tuple->ip6_addr[0], &r->src.ip6, r->src_prefixlen))
338 if (!fa_acl_match_ip4_addr
339 (&pkt_5tuple->ip4_addr[1], &r->dst.ip4, r->dst_prefixlen))
341 if (!fa_acl_match_ip4_addr
342 (&pkt_5tuple->ip4_addr[0], &r->src.ip4, r->src_prefixlen))
/* Protocol comparison between the packet and the rule. */
348 if (pkt_5tuple->l4.proto != r->proto)
351 if (PREDICT_FALSE (pkt_5tuple->pkt.is_nonfirst_fragment &&
352 am->l4_match_nonfirst_fragment))
354 /* non-initial fragment with frag match configured - match this rule */
355 *trace_bitmap |= 0x80000000;
356 *r_action = r->is_permit;
358 *r_acl_match_p = acl_index;
364 /* A sanity check just to ensure we are about to match the ports extracted from the packet */
365 if (PREDICT_FALSE (!pkt_5tuple->pkt.l4_valid))
368 #ifdef FA_NODE_VERBOSE_DEBUG
370 ("ACL_FA_NODE_DBG acl %d rule %d pkt proto %d match rule %d",
371 acl_index, i, pkt_5tuple->l4.proto, r->proto);
/* port[0] is checked against the rule's source port / type range. */
374 if (!fa_acl_match_port
375 (pkt_5tuple->l4.port[0], r->src_port_or_type_first,
376 r->src_port_or_type_last, is_ip6))
379 #ifdef FA_NODE_VERBOSE_DEBUG
381 ("ACL_FA_NODE_DBG acl %d rule %d pkt sport %d match rule [%d..%d]",
382 acl_index, i, pkt_5tuple->l4.port[0], r->src_port_or_type_first,
383 r->src_port_or_type_last);
/* port[1] is checked against the rule's destination port / code range. */
386 if (!fa_acl_match_port
387 (pkt_5tuple->l4.port[1], r->dst_port_or_code_first,
388 r->dst_port_or_code_last, is_ip6))
391 #ifdef FA_NODE_VERBOSE_DEBUG
393 ("ACL_FA_NODE_DBG acl %d rule %d pkt dport %d match rule [%d..%d]",
394 acl_index, i, pkt_5tuple->l4.port[1], r->dst_port_or_code_first,
395 r->dst_port_or_code_last);
/* TCP flags take part only when the packet carries valid TCP flags. */
397 if (pkt_5tuple->pkt.tcp_flags_valid
398 && ((pkt_5tuple->pkt.tcp_flags & r->tcp_flags_mask) !=
402 /* everything matches! */
403 #ifdef FA_NODE_VERBOSE_DEBUG
404 clib_warning ("ACL_FA_NODE_DBG acl %d rule %d FULL-MATCH, action %d",
405 acl_index, i, r->is_permit);
407 *r_action = r->is_permit;
409 *r_acl_match_p = acl_index;
/*
 * Wrapper around single_acl_match_5tuple() taking an opaque main pointer.
 * p_acl_main is used as an acl_main_t pointer; all other arguments and the
 * return value are passed through unchanged.
 */
418 acl_plugin_single_acl_match_5tuple (void *p_acl_main, u32 acl_index, fa_5tuple_t * pkt_5tuple,
419 int is_ip6, u8 * r_action, u32 * r_acl_match_p,
420 u32 * r_rule_match_p, u32 * trace_bitmap)
422 acl_main_t * am = p_acl_main;
423 return single_acl_match_5tuple(am, acl_index, pkt_5tuple, is_ip6, r_action,
424 r_acl_match_p, r_rule_match_p, trace_bitmap);
/*
 * Linear matcher: try each ACL of a lookup context in turn.
 *
 * The ACL list is taken from the lookup context at lc_index
 * (acontext->acl_indices), and single_acl_match_5tuple() is called for each
 * entry in vector order.
 * NOTE(review): what is written to r_action / acl_pos_p and what is returned
 * on a hit or a miss is not visible in this excerpt - confirm against the
 * full file.
 */
428 linear_multi_acl_match_5tuple (void *p_acl_main, u32 lc_index, fa_5tuple_t * pkt_5tuple,
429 int is_ip6, u8 *r_action, u32 *acl_pos_p, u32 * acl_match_p,
430 u32 * rule_match_p, u32 * trace_bitmap)
432 acl_main_t *am = p_acl_main;
436 acl_lookup_context_t *acontext = pool_elt_at_index(am->acl_lookup_contexts, lc_index);
438 acl_vector = acontext->acl_indices;
440 for (i = 0; i < vec_len (acl_vector); i++)
442 #ifdef FA_NODE_VERBOSE_DEBUG
443 clib_warning ("ACL_FA_NODE_DBG: Trying to match ACL: %d",
/* The per-rule action lands in the local `action`; match indices go straight to the caller's outputs. */
446 if (single_acl_match_5tuple
447 (am, acl_vector[i], pkt_5tuple, is_ip6, &action,
448 acl_match_p, rule_match_p, trace_bitmap))
/* Reached after the loop: a non-empty ACL list is handled apart from an empty one. */
455 if (vec_len (acl_vector) > 0)
459 #ifdef FA_NODE_VERBOSE_DEBUG
460 clib_warning ("ACL_FA_NODE_DBG: No ACL on lc_index %d", lc_index);
462 /* If there are no ACLs defined we should not be here. */
469 * This returns true if there is indeed a match on the portranges.
470 * With all these levels of indirections, this is not going to be very fast,
471 * so, best use the individual ports or wildcard ports for performance.
/*
 * Port-range check for one applied hash entry.
 *
 * Looks up the applied entry `index` in the per-lookup-context vector
 * selected by match->pkt.lc_index, fetches the ACL rule it refers to
 * (acl_index / ace_index), and tests both ports of `match` against the
 * rule's inclusive ranges.
 */
474 match_portranges(acl_main_t *am, fa_5tuple_t *match, u32 index)
477 applied_hash_ace_entry_t **applied_hash_aces = vec_elt_at_index(am->hash_entry_vec_by_lc_index, match->pkt.lc_index);
478 applied_hash_ace_entry_t *pae = vec_elt_at_index((*applied_hash_aces), index);
480 acl_rule_t *r = &(am->acls[pae->acl_index].rules[pae->ace_index]);
482 #ifdef FA_NODE_VERBOSE_DEBUG
483 clib_warning("PORTMATCH: %d <= %d <= %d && %d <= %d <= %d ?",
484 r->src_port_or_type_first, match->l4.port[0], r->src_port_or_type_last,
485 r->dst_port_or_code_first, match->l4.port[1], r->dst_port_or_code_last);
/* port[0] against the source range, port[1] against the destination range; both must hold. */
488 return ( ((r->src_port_or_type_first <= match->l4.port[0]) && r->src_port_or_type_last >= match->l4.port[0]) &&
489 ((r->dst_port_or_code_first <= match->l4.port[1]) && r->dst_port_or_code_last >= match->l4.port[1]) );
/*
 * Hash-based lookup: find the lowest applied-entry index matching `match`.
 *
 * For every mask type enabled for the lookup context (match->pkt.lc_index),
 * the packet 5-tuple is ANDed with the mask, tagged with the mask type index
 * and searched in am->acl_lookup_hash.  Among the hits, the smallest applied
 * entry index is kept; entries that need a port-range check are confirmed
 * with match_portranges() while walking their chain.
 *
 * Returns the winning applied entry index; the initial value ~0 is returned
 * unchanged when nothing replaced it.
 */
493 multi_acl_match_get_applied_ace_index(acl_main_t *am, fa_5tuple_t *match)
495 clib_bihash_kv_48_8_t kv;
496 clib_bihash_kv_48_8_t result;
/* Typed views over the raw bihash key and value. */
497 fa_5tuple_t *kv_key = (fa_5tuple_t *)kv.key;
498 hash_acl_lookup_value_t *result_val = (hash_acl_lookup_value_t *)&result.value;
499 u64 *pmatch = (u64 *)match;
/* ~0 is the largest u32, so any real index compares lower. */
503 u32 curr_match_index = ~0;
505 u32 lc_index = match->pkt.lc_index;
506 applied_hash_ace_entry_t **applied_hash_aces = vec_elt_at_index(am->hash_entry_vec_by_lc_index, match->pkt.lc_index);
507 applied_hash_acl_info_t **applied_hash_acls = &am->applied_hash_acl_info_by_lc_index;
509 DBG("TRYING TO MATCH: %016llx %016llx %016llx %016llx %016llx %016llx",
510 pmatch[0], pmatch[1], pmatch[2], pmatch[3], pmatch[4], pmatch[5]);
512 for(mask_type_index=0; mask_type_index < pool_len(am->ace_mask_type_pool); mask_type_index++) {
513 if (!clib_bitmap_get(vec_elt_at_index((*applied_hash_acls), lc_index)->mask_type_index_bitmap, mask_type_index)) {
514 /* This bit is not set. Avoid trying to match */
517 ace_mask_type_entry_t *mte = vec_elt_at_index(am->ace_mask_type_pool, mask_type_index);
518 pmatch = (u64 *)match;
519 pmask = (u64 *)&mte->mask;
520 pkey = (u64 *)kv.key;
522 * unrolling the below loop results in a noticeable performance increase.
525 kv.key[i] = pmatch[i] & pmask[i];
529 *pkey++ = *pmatch++ & *pmask++;
530 *pkey++ = *pmatch++ & *pmask++;
531 *pkey++ = *pmatch++ & *pmask++;
532 *pkey++ = *pmatch++ & *pmask++;
533 *pkey++ = *pmatch++ & *pmask++;
534 *pkey++ = *pmatch++ & *pmask++;
/* The mask type index is stored in the key after masking, so it is part of what is searched. */
536 kv_key->pkt.mask_type_index_lsb = mask_type_index;
537 DBG(" KEY %3d: %016llx %016llx %016llx %016llx %016llx %016llx", mask_type_index,
538 kv.key[0], kv.key[1], kv.key[2], kv.key[3], kv.key[4], kv.key[5]);
539 int res = clib_bihash_search_48_8 (&am->acl_lookup_hash, &kv, &result);
541 DBG("ACL-MATCH! result_val: %016llx", result_val->as_u64);
/* Only a hit with a lower index than the current candidate is of interest. */
542 if (result_val->applied_entry_index < curr_match_index) {
543 if (PREDICT_FALSE(result_val->need_portrange_check)) {
545 * This is going to be slow, since we can have multiple superset
546 * entries for narrow-ish portranges, e.g.:
547 * 0..42 100..400, 230..60000,
548 * so we need to walk linearly and check if they match.
551 u32 curr_index = result_val->applied_entry_index;
552 while ((curr_index != ~0) && !match_portranges(am, match, curr_index)) {
553 /* while no match and there are more entries, walk... */
554 applied_hash_ace_entry_t *pae = vec_elt_at_index((*applied_hash_aces),curr_index);
555 DBG("entry %d did not portmatch, advancing to %d", curr_index, pae->next_applied_entry_index);
556 curr_index = pae->next_applied_entry_index;
/* The walk may end at ~0 (no entry matched); ~0 never compares lower than the candidate. */
558 if (curr_index < curr_match_index) {
559 DBG("The index %d is the new candidate in portrange matches.", curr_index);
560 curr_match_index = curr_index;
562 DBG("Curr portmatch index %d is too big vs. current matched one %d", curr_index, curr_match_index);
565 /* The usual path is here. Found an entry in front of the current candidate - so it's a new one */
566 DBG("This match is the new candidate");
567 curr_match_index = result_val->applied_entry_index;
568 if (!result_val->shadowed) {
569 /* new result is known to not be shadowed, so no point to look up further */
576 DBG("MATCH-RESULT: %d", curr_match_index);
577 return curr_match_index;
/*
 * Hash-based matcher for a lookup context.
 *
 * Obtains the best applied entry index from
 * multi_acl_match_get_applied_ace_index() and, when that index is within the
 * applied-entry vector of lc_index, copies the entry's ACL position, ACL
 * index, rule index and action to the output parameters.
 * NOTE(review): the return statements are not visible in this excerpt, and
 * is_ip6 / trace_bitmap are not used in the visible lines.
 */
581 hash_multi_acl_match_5tuple (void *p_acl_main, u32 lc_index, fa_5tuple_t * pkt_5tuple,
582 int is_ip6, u8 *action, u32 *acl_pos_p, u32 * acl_match_p,
583 u32 * rule_match_p, u32 * trace_bitmap)
585 acl_main_t *am = p_acl_main;
586 applied_hash_ace_entry_t **applied_hash_aces = vec_elt_at_index(am->hash_entry_vec_by_lc_index, lc_index);
587 u32 match_index = multi_acl_match_get_applied_ace_index(am, pkt_5tuple);
/* An index at or beyond the vector length (including ~0) is treated as out of range. */
588 if (match_index < vec_len((*applied_hash_aces))) {
589 applied_hash_ace_entry_t *pae = vec_elt_at_index((*applied_hash_aces), match_index);
591 *acl_pos_p = pae->acl_position;
592 *acl_match_p = pae->acl_index;
593 *rule_match_p = pae->ace_index;
594 *action = pae->action;
/*
 * Entry point for matching a 5-tuple against the ACLs of a lookup context.
 *
 * Stores lc_index into the (opaque) 5-tuple, then dispatches to the hash
 * matcher when am->use_hash_acl_matching is set and to the linear matcher
 * otherwise.  The return value and output parameters come from the chosen
 * matcher.
 */
603 acl_plugin_match_5tuple_inline (void *p_acl_main, u32 lc_index,
604 fa_5tuple_opaque_t * pkt_5tuple,
605 int is_ip6, u8 * r_action,
608 u32 * r_rule_match_p,
611 acl_main_t *am = p_acl_main;
612 fa_5tuple_t * pkt_5tuple_internal = (fa_5tuple_t *)pkt_5tuple;
/* The tuple is modified here: the matchers read lc_index back from match->pkt.lc_index. */
613 pkt_5tuple_internal->pkt.lc_index = lc_index;
614 if (am->use_hash_acl_matching) {
615 return hash_multi_acl_match_5tuple(p_acl_main, lc_index, pkt_5tuple_internal, is_ip6, r_action,
616 r_acl_pos_p, r_acl_match_p, r_rule_match_p, trace_bitmap);
618 return linear_multi_acl_match_5tuple(p_acl_main, lc_index, pkt_5tuple_internal, is_ip6, r_action,
619 r_acl_pos_p, r_acl_match_p, r_rule_match_p, trace_bitmap);