5 #include <vppinfra/bihash_40_8.h>
7 // #define FA_NODE_VERBOSE_DEBUG 3
/*
 * TCP header flag bits, one bit per flag.
 */
#define TCP_FLAG_FIN  0x01
#define TCP_FLAG_SYN  0x02
#define TCP_FLAG_RST  0x04
#define TCP_FLAG_PUSH 0x08
#define TCP_FLAG_ACK  0x10
#define TCP_FLAG_URG  0x20
#define TCP_FLAG_ECE  0x40
#define TCP_FLAG_CWR  0x80

/*
 * Combined masks. The flags are distinct bits, so they are merged with
 * bitwise OR, which stays correct even if a flag is listed twice.
 */
#define TCP_FLAGS_RSTFINACKSYN (TCP_FLAG_RST | TCP_FLAG_FIN | TCP_FLAG_SYN | TCP_FLAG_ACK)
#define TCP_FLAGS_ACKSYN (TCP_FLAG_SYN | TCP_FLAG_ACK)
/*
 * Default sizing of the connection table: bucket count, hash memory size
 * and maximum number of entries.
 * NOTE(review): the memory size is presumably in bytes (1 << 30 = 1 GiB) —
 * confirm at the point of use.
 */
#define ACL_FA_CONN_TABLE_DEFAULT_HASH_NUM_BUCKETS (64 * 1024)
#define ACL_FA_CONN_TABLE_DEFAULT_HASH_MEMORY_SIZE (1 << 30)
#define ACL_FA_CONN_TABLE_DEFAULT_MAX_ENTRIES 1000000
/*
 * Members of fa_session_l4_key_t. A compile-time check later in this file
 * requires sizeof(fa_session_l4_key_t) == sizeof(u64).
 */
28 u16 mask_type_index_lsb; /* NOTE(review): presumably the low bits of a mask type index — confirm */
32 u8 is_nonfirst_fragment:1; /* one-bit flag */
48 u16 lsb_of_sw_if_index; /* NOTE(review): presumably the low 16 bits of the sw_if_index — confirm */
53 } fa_session_l4_key_t;
57 ip46_address_t addr[2]; /* two addresses; NOTE(review): presumably source and destination — confirm the order */
58 fa_session_l4_key_t l4; /* L4 part of the key; asserted at compile time to be u64-sized */
59 /* The `pkt` member must sit at the same offset as the u64 value in the bihash_40_8 key/value struct (enforced by a compile-time check) */
62 clib_bihash_kv_40_8_t kv; /* NOTE(review): presumably overlays the fields above as a bihash 40_8 key/value pair — confirm */
66 u8 opaque[sizeof(fa_5tuple_t)]; /* byte buffer exactly as large as fa_5tuple_t */
/*
 * The trailing comments track the running size in bytes. The count restarts
 * after the first 64 bytes, and the two 64-byte halves add up to the 128
 * bytes that the compile-time check on sizeof(fa_session_t) expects.
 * NOTE(review): presumably these are the members of fa_session_t — confirm.
 */
71 fa_5tuple_t info; /* (5+1)*8 = 48 bytes */
72 u64 last_active_time; /* +8 bytes = 56 */
73 u32 sw_if_index; /* +4 bytes = 60 */
77 } tcp_flags_seen; ; /* +2 bytes = 62. NOTE(review): the second ';' is a stray empty declaration */
78 u16 thread_index; /* +2 bytes = 64 */
79 u64 link_enqueue_time; /* 8 bytes = 8 (count restarts for the second 64 bytes) */
80 u32 link_prev_idx; /* +4 bytes = 12 */
81 u32 link_next_idx; /* +4 bytes = 16 */
82 u8 link_list_id; /* +1 byte = 17 */
83 u8 reserved1[7]; /* +7 bytes = 24 */
84 u64 reserved2[5]; /* +5*8 bytes = 64 */
/* Low 15 bits of a 16-bit policy epoch value. */
#define FA_POLICY_EPOCH_MASK 0x7fff
/* Input policy epochs have the MSB (bit 15) set. */
#define FA_POLICY_EPOCH_IS_INPUT 0x8000
92 /* This structure is used to fill in the u64 value in the per-sw-if-index
 * hash table; a compile-time check in this file requires it to be exactly
 * sizeof(u64) bytes. */
100 u16 intf_policy_epoch; /* NOTE(review): presumably the interface policy epoch, see FA_POLICY_EPOCH_* — confirm */
103 } fa_full_session_id_t;
/*
 * A few compile-time constraints on the size and the layout of the union, to ensure
 * it makes sense both for bihash and for us.
 *
 * CT_ASSERT_EQUAL(name, x, y) declares an array typedef whose length is 1
 * when x == y and -1 otherwise. A mismatch is therefore a compile error that
 * mentions "assert_<name>_compile_time_assertion_failed", while the passing
 * case is a valid ISO C declaration (no zero-length array is needed).
 */
#define CT_ASSERT_EQUAL(name, x,y) typedef int assert_ ## name ## _compile_time_assertion_failed[((x) == (y)) ? 1 : -1]
/* `pkt` in fa_5tuple_t must start at the offset of the value in a bihash 40_8 key/value pair */
111 CT_ASSERT_EQUAL(fa_l3_key_size_is_40, offsetof(fa_5tuple_t, pkt), offsetof(clib_bihash_kv_40_8_t, value));
/* Both the L4 key and the packet info must be exactly u64-sized */
112 CT_ASSERT_EQUAL(fa_l4_key_t_is_8, sizeof(fa_session_l4_key_t), sizeof(u64));
113 CT_ASSERT_EQUAL(fa_packet_info_t_is_8, sizeof(fa_packet_info_t), sizeof(u64));
/* The whole 5-tuple must be the same size as a bihash 40_8 key/value pair */
114 CT_ASSERT_EQUAL(fa_l3_kv_size_is_48, sizeof(fa_5tuple_t), sizeof(clib_bihash_kv_40_8_t));
116 /* fa_session_t must be exactly 128 bytes, so that it fits within two cachelines */
117 CT_ASSERT_EQUAL(fa_session_t_size_is_128, sizeof(fa_session_t), 128);
119 /* The session ID MUST be the same size as a u64 */
120 CT_ASSERT_EQUAL(fa_full_session_id_size_is_64, sizeof(fa_full_session_id_t), sizeof(u64));
/* The helper is only needed for the checks above */
121 #undef CT_ASSERT_EQUAL
124 /* The pool of sessions managed by this worker */
125 fa_session_t *fa_sessions_pool;
126 /* Per-worker connection lists, ACL_N_TIMEOUTS of them: list heads and tails */
127 u32 *fa_conn_list_head;
128 u32 *fa_conn_list_tail;
129 /* Session adds and deletes, per worker and per interface */
130 u64 *fa_session_dels_by_sw_if_index;
131 u64 *fa_session_adds_by_sw_if_index;
132 /* Sessions deleted due to an epoch change */
133 u64 *fa_session_epoch_change_by_sw_if_index;
134 /* Vector of expired connections retrieved from lists */
136 /* The earliest next expiry time */
137 u64 next_expiry_time;
138 /* If non-zero, keep looking at list elements until one has an enqueue timestamp later than this value */
139 u64 requeue_until_time;
140 /* Current wait interval between the checks */
141 u64 current_time_wait_interval;
142 /* Count of sessions that were deleted */
143 u64 cnt_deleted_sessions;
144 /* Count of attempts to delete an already deleted session - should not increment unless there is a bug */
145 u64 cnt_already_deleted_sessions;
146 /* Number of times a session was requeued to the head of a list */
147 u64 cnt_session_timer_restarted;
148 /* swipe up to this enqueue time, rather than following the timeouts */
150 /* Bitmap of the sw_if_index values serviced by this worker */
151 uword *serviced_sw_if_index_bitmap;
152 /* Bitmap of the sw_if_index values to clear. Set by the main thread, cleared by the worker */
153 uword *pending_clear_sw_if_index_bitmap;
154 /* Atomic; indicates that the swipe-deletion of connections is in progress */
155 u32 clear_in_process;
156 /* An interrupt from the main thread is pending */
157 int interrupt_is_pending;
159 * Interrupt node on the worker thread sets this if it knows there is
160 * more work to do, but it has to finish to avoid hogging the
163 int interrupt_is_needed;
165 * Set to indicate that the interrupt node wants to get less interrupts
166 * because there is not enough work for the current rate.
168 int interrupt_is_unwanted;
170 * Set to copy of a "generation" counter in main thread so we can sync the interrupts.
172 int interrupt_generation;
173 } acl_fa_per_worker_data_t;
/*
 * Values of acl_fa_cleaner_process_event_e. Numbering starts at 1, so
 * ACL_FA_CLEANER_DELETE_BY_SW_IF_INDEX is 2.
 * NOTE(review): presumably the event codes sent to the cleaner process — confirm.
 */
184 ACL_FA_CLEANER_RESCHEDULE = 1,
185 ACL_FA_CLEANER_DELETE_BY_SW_IF_INDEX,
186 } acl_fa_cleaner_process_event_e;
/*
 * NOTE(review): the descriptions below are inferred from the names and
 * signatures only — confirm against the implementations.
 */
/* Presumably turns session processing on or off for sw_if_index; is_input selects the direction. */
188 void acl_fa_enable_disable(u32 sw_if_index, int is_input, int enable_disable);
/* Presumably prints the sessions hash via vm; verbose selects the level of detail. */
190 void show_fa_sessions_hash(vlib_main_t * vm, u32 verbose);
/* Format-style callback: takes the output vector s and a va_list, returns a u8 vector. */
192 u8 *format_acl_plugin_5tuple (u8 * s, va_list * args);
194 /*
 * Log an elog event carrying one value; nothing is done unless
 * am->trace_sessions is set.
 * The event format is "(%02d) " followed by acl_elog_trace_format_label and
 * the argument spec is "i2" followed by acl_elog_trace_format_args: the first
 * field is the current thread index (os_get_thread_index ()), the second is
 * acl_elog_val1.
 * The static_check array is sized 18 - sizeof(acl_elog_val1).
 * NOTE(review): presumably a compile-time guard on an 18-byte payload
 * budget — confirm.
 *
 * use like: elog_acl_maybe_trace_X1(am, "foobar: %d", "i4", int32_value);
 */
196 #define elog_acl_maybe_trace_X1(am, acl_elog_trace_format_label, acl_elog_trace_format_args, acl_elog_val1) \
198 if (am->trace_sessions) { \
199 CLIB_UNUSED(struct { u8 available_space[18 - sizeof(acl_elog_val1)]; } *static_check); \
200 u16 thread_index = os_get_thread_index (); \
201 vlib_worker_thread_t * w = vlib_worker_threads + thread_index; \
202 ELOG_TYPE_DECLARE (e) = \
204 .format = "(%02d) " acl_elog_trace_format_label, \
205 .format_args = "i2" acl_elog_trace_format_args, \
210 typeof(acl_elog_val1) val1; \
212 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e, w->elog_track); \
213 ed->thread = thread_index; \
214 ed->val1 = acl_elog_val1; \
219 /*
 * Log an elog event carrying two values; nothing is done unless
 * am->trace_sessions is set.
 * The event format is "(%02d) " followed by acl_elog_trace_format_label and
 * the argument spec is "i2" followed by acl_elog_trace_format_args: the first
 * field is the current thread index, then acl_elog_val1 and acl_elog_val2.
 * The static_check array is sized 18 minus the sizes of both values.
 * NOTE(review): presumably a compile-time guard on an 18-byte payload
 * budget — confirm.
 *
 * use like: elog_acl_maybe_trace_X2(am, "foobar: %d some u64: %lu", "i4i8", int32_value, int64_value);
 */
221 #define elog_acl_maybe_trace_X2(am, acl_elog_trace_format_label, acl_elog_trace_format_args, \
222 acl_elog_val1, acl_elog_val2) \
224 if (am->trace_sessions) { \
225 CLIB_UNUSED(struct { u8 available_space[18 - sizeof(acl_elog_val1) - sizeof(acl_elog_val2)]; } *static_check); \
226 u16 thread_index = os_get_thread_index (); \
227 vlib_worker_thread_t * w = vlib_worker_threads + thread_index; \
228 ELOG_TYPE_DECLARE (e) = \
230 .format = "(%02d) " acl_elog_trace_format_label, \
231 .format_args = "i2" acl_elog_trace_format_args, \
236 typeof(acl_elog_val1) val1; \
237 typeof(acl_elog_val2) val2; \
239 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e, w->elog_track); \
240 ed->thread = thread_index; \
241 ed->val1 = acl_elog_val1; \
242 ed->val2 = acl_elog_val2; \
247 /*
 * Log an elog event carrying three values; nothing is done unless
 * am->trace_sessions is set.
 * The event format is "(%02d) " followed by acl_elog_trace_format_label and
 * the argument spec is "i2" followed by acl_elog_trace_format_args: the first
 * field is the current thread index, then acl_elog_val1 .. acl_elog_val3.
 * The static_check array is sized 18 minus the sizes of all three values.
 * NOTE(review): presumably a compile-time guard on an 18-byte payload
 * budget — confirm.
 *
 * use like: elog_acl_maybe_trace_X3(am, "foobar: %d some u64 %lu baz: %d", "i4i8i4", int32_value, u64_value, int_value);
 */
249 #define elog_acl_maybe_trace_X3(am, acl_elog_trace_format_label, acl_elog_trace_format_args, acl_elog_val1, \
250 acl_elog_val2, acl_elog_val3) \
252 if (am->trace_sessions) { \
253 CLIB_UNUSED(struct { u8 available_space[18 - sizeof(acl_elog_val1) - sizeof(acl_elog_val2) \
254 - sizeof(acl_elog_val3)]; } *static_check); \
255 u16 thread_index = os_get_thread_index (); \
256 vlib_worker_thread_t * w = vlib_worker_threads + thread_index; \
257 ELOG_TYPE_DECLARE (e) = \
259 .format = "(%02d) " acl_elog_trace_format_label, \
260 .format_args = "i2" acl_elog_trace_format_args, \
265 typeof(acl_elog_val1) val1; \
266 typeof(acl_elog_val2) val2; \
267 typeof(acl_elog_val3) val3; \
269 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e, w->elog_track); \
270 ed->thread = thread_index; \
271 ed->val1 = acl_elog_val1; \
272 ed->val2 = acl_elog_val2; \
273 ed->val3 = acl_elog_val3; \
278 /* use like: elog_acl_maybe_trace_X4(am, "foobar: %d some int %d baz: %d bar: %d", "i4i4i4i4", int32_value, int32_value2, int_value, int_value); */
280 #define elog_acl_maybe_trace_X4(am, acl_elog_trace_format_label, acl_elog_trace_format_args, acl_elog_val1, \
281 acl_elog_val2, acl_elog_val3, acl_elog_val4) \
283 if (am->trace_sessions) { \
284 CLIB_UNUSED(struct { u8 available_space[18 - sizeof(acl_elog_val1) - sizeof(acl_elog_val2) \
285 - sizeof(acl_elog_val3) -sizeof(acl_elog_val4)]; } *static_check); \
286 u16 thread_index = os_get_thread_index (); \
287 vlib_worker_thread_t * w = vlib_worker_threads + thread_index; \
288 ELOG_TYPE_DECLARE (e) = \
290 .format = "(%02d) " acl_elog_trace_format_label, \
291 .format_args = "i2" acl_elog_trace_format_args, \
296 typeof(acl_elog_val1) val1; \
297 typeof(acl_elog_val2) val2; \
298 typeof(acl_elog_val3) val3; \
299 typeof(acl_elog_val4) val4; \
301 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e, w->elog_track); \
302 ed->thread = thread_index; \
303 ed->val1 = acl_elog_val1; \
304 ed->val2 = acl_elog_val2; \
305 ed->val3 = acl_elog_val3; \
306 ed->val4 = acl_elog_val4; \