448566d93ce7d11237998defa284f1dbf4192924
[vpp.git] / src / plugins / nat / nat44-ei / nat44_ei.c
1 /*
2  * nat44_ei.c - nat44 endpoint dependent plugin
3  *
4  * Copyright (c) 2020 Cisco and/or its affiliates.
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at:
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
13  * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
14  * License for the specific language governing permissions and limitations
15  * under the License.
16  */
17
18 #include <vnet/plugin/plugin.h>
19 #include <vpp/app/version.h>
20
21 #include <vnet/vnet.h>
22 #include <vnet/ip/ip.h>
23 #include <vnet/ip/ip4.h>
24 #include <vnet/ip/ip_table.h>
25 #include <vnet/ip/reass/ip4_sv_reass.h>
26 #include <vnet/fib/fib_table.h>
27 #include <vnet/fib/ip4_fib.h>
28 #include <vnet/plugin/plugin.h>
29
30 // nat lib
31 #include <nat/lib/log.h>
32 #include <nat/lib/nat_syslog.h>
33 #include <nat/lib/nat_inlines.h>
34 #include <nat/lib/ipfix_logging.h>
35
36 #include <nat/nat44-ei/nat44_ei_dpo.h>
37 #include <nat/nat44-ei/nat44_ei_inlines.h>
38 #include <nat/nat44-ei/nat44_ei.h>
39
40 nat44_ei_main_t nat44_ei_main;
41
42 extern vlib_node_registration_t nat44_ei_hairpinning_node;
43 extern vlib_node_registration_t
44   nat44_ei_in2out_hairpinning_finish_ip4_lookup_node;
45 extern vlib_node_registration_t
46   nat44_ei_in2out_hairpinning_finish_interface_output_node;
47
/*
 * Leave the enclosing function (which must return void) when the plugin
 * is not enabled.
 */
#define skip_if_disabled()                                                    \
  do                                                                          \
    {                                                                         \
      if (PREDICT_FALSE (!nat44_ei_main.enabled))                             \
        return;                                                               \
    }                                                                         \
  while (0)
56
/*
 * Guard for operations that are only legal while the plugin is disabled:
 * logs "plugin enabled" and makes the enclosing function return 1 when the
 * plugin is currently enabled.
 */
#define fail_if_enabled()                                                     \
  do                                                                          \
    {                                                                         \
      if (PREDICT_FALSE (nat44_ei_main.enabled))                              \
        {                                                                     \
          nat44_ei_log_err ("plugin enabled");                                \
          return 1;                                                           \
        }                                                                     \
    }                                                                         \
  while (0)
68
/*
 * Guard for operations that require an enabled plugin: logs
 * "plugin disabled" and makes the enclosing function return 1 when the
 * plugin is currently disabled.
 */
#define fail_if_disabled()                                                    \
  do                                                                          \
    {                                                                         \
      if (PREDICT_FALSE (!nat44_ei_main.enabled))                             \
        {                                                                     \
          nat44_ei_log_err ("plugin disabled");                               \
          return 1;                                                           \
        }                                                                     \
    }                                                                         \
  while (0)
80
81 /* Hook up input features */
82 VNET_FEATURE_INIT (ip4_nat_classify, static) = {
83   .arc_name = "ip4-unicast",
84   .node_name = "nat44-ei-classify",
85   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
86                                "ip4-sv-reassembly-feature"),
87 };
88 VNET_FEATURE_INIT (ip4_nat_handoff_classify, static) = {
89   .arc_name = "ip4-unicast",
90   .node_name = "nat44-ei-handoff-classify",
91   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
92                                "ip4-sv-reassembly-feature"),
93 };
94 VNET_FEATURE_INIT (ip4_nat44_ei_in2out, static) = {
95   .arc_name = "ip4-unicast",
96   .node_name = "nat44-ei-in2out",
97   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
98                                "ip4-sv-reassembly-feature"),
99 };
100 VNET_FEATURE_INIT (ip4_nat44_ei_out2in, static) = {
101   .arc_name = "ip4-unicast",
102   .node_name = "nat44-ei-out2in",
103   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
104                                "ip4-sv-reassembly-feature",
105                                "ip4-dhcp-client-detect"),
106 };
107 VNET_FEATURE_INIT (ip4_nat44_ei_in2out_output, static) = {
108   .arc_name = "ip4-output",
109   .node_name = "nat44-ei-in2out-output",
110   .runs_after = VNET_FEATURES ("acl-plugin-out-ip4-fa",
111                                "ip4-sv-reassembly-output-feature"),
112 };
113 VNET_FEATURE_INIT (ip4_nat44_ei_hairpinning, static) = {
114   .arc_name = "ip4-local",
115   .node_name = "nat44-ei-hairpinning",
116   .runs_before = VNET_FEATURES ("ip4-local-end-of-arc"),
117 };
118 VNET_FEATURE_INIT (ip4_nat44_ei_in2out_worker_handoff, static) = {
119   .arc_name = "ip4-unicast",
120   .node_name = "nat44-ei-in2out-worker-handoff",
121   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa"),
122 };
123 VNET_FEATURE_INIT (ip4_nat44_ei_out2in_worker_handoff, static) = {
124   .arc_name = "ip4-unicast",
125   .node_name = "nat44-ei-out2in-worker-handoff",
126   .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
127                                "ip4-dhcp-client-detect"),
128 };
129 VNET_FEATURE_INIT (ip4_nat44_ei_in2out_output_worker_handoff, static) = {
130   .arc_name = "ip4-output",
131   .node_name = "nat44-ei-in2out-output-worker-handoff",
132   .runs_after = VNET_FEATURES ("acl-plugin-out-ip4-fa",
133                                "ip4-sv-reassembly-output-feature"),
134 };
135
136 VLIB_PLUGIN_REGISTER () = {
137   .version = VPP_BUILD_VER,
138   .description = "IPv4 Endpoint-Independent NAT (NAT44 EI)",
139 };
140
/*
 * X-macro list of classify error entries: _ (SYMBOL, "description").
 * It is expanded once into the enum below and once into the string table,
 * which keeps both in the same order.
 */
#define foreach_nat44_ei_classify_error                                       \
  _ (NEXT_IN2OUT, "next in2out")                                              \
  _ (NEXT_OUT2IN, "next out2in")                                              \
  _ (FRAG_CACHED, "fragment cached")

/* One enumerator per list entry, followed by the entry count. */
typedef enum
{
#define _(name, text) NAT44_EI_CLASSIFY_ERROR_##name,
  foreach_nat44_ei_classify_error
#undef _
    NAT44_EI_CLASSIFY_N_ERROR,
} nat44_ei_classify_error_t;

/* Description strings, indexed by nat44_ei_classify_error_t. */
static char *nat44_ei_classify_error_strings[] = {
#define _(name, text) text,
  foreach_nat44_ei_classify_error
#undef _
};
159
/* Next-node slots of the classify node; N_NEXT is the slot count. */
typedef enum
{
  NAT44_EI_CLASSIFY_NEXT_IN2OUT = 0,
  NAT44_EI_CLASSIFY_NEXT_OUT2IN,
  NAT44_EI_CLASSIFY_NEXT_DROP,
  NAT44_EI_CLASSIFY_N_NEXT,
} nat44_ei_classify_next_t;
167
168 typedef struct
169 {
170   u8 next_in2out;
171   u8 cached;
172 } nat44_ei_classify_trace_t;
173
174 void nat44_ei_add_del_addr_to_fib (ip4_address_t *addr, u8 p_len,
175                                    u32 sw_if_index, int is_add);
176
177 static void nat44_ei_worker_db_free (nat44_ei_main_per_thread_data_t *tnm);
178
179 static int nat44_ei_add_static_mapping_internal (
180   ip4_address_t l_addr, ip4_address_t e_addr, u16 l_port, u16 e_port,
181   nat_protocol_t proto, u32 vrf_id, u32 sw_if_index, u32 flags,
182   ip4_address_t pool_addr, u8 *tag);
183
184 static int nat44_ei_del_static_mapping_internal (
185   ip4_address_t l_addr, ip4_address_t e_addr, u16 l_port, u16 e_port,
186   nat_protocol_t proto, u32 vrf_id, u32 sw_if_index, u32 flags);
187
188 always_inline bool
189 nat44_ei_port_is_used (nat44_ei_address_t *a, u8 proto, u16 port)
190 {
191   return clib_bitmap_get (a->busy_port_bitmap[proto], port);
192 }
193
194 always_inline void
195 nat44_ei_port_get (nat44_ei_address_t *a, u8 proto, u16 port)
196 {
197   ASSERT (!nat44_ei_port_is_used (a, proto, port));
198   a->busy_port_bitmap[proto] =
199     clib_bitmap_set (a->busy_port_bitmap[proto], port, 1);
200 }
201
202 always_inline void
203 nat44_ei_port_put (nat44_ei_address_t *a, u8 proto, u16 port)
204 {
205   ASSERT (nat44_ei_port_is_used (a, proto, port));
206   a->busy_port_bitmap[proto] =
207     clib_bitmap_set (a->busy_port_bitmap[proto], port, 0);
208 }
209
210 static u8 *
211 format_nat44_ei_classify_trace (u8 *s, va_list *args)
212 {
213   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
214   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
215   nat44_ei_classify_trace_t *t = va_arg (*args, nat44_ei_classify_trace_t *);
216   char *next;
217
218   if (t->cached)
219     s = format (s, "nat44-ei-classify: fragment cached");
220   else
221     {
222       next = t->next_in2out ? "nat44-ei-in2out" : "nat44-ei-out2in";
223       s = format (s, "nat44-ei-classify: next %s", next);
224     }
225
226   return s;
227 }
228
229 static void nat44_ei_db_init (u32 translations, u32 translation_buckets,
230                               u32 user_buckets);
231
232 static void nat44_ei_ip4_add_del_interface_address_cb (
233   ip4_main_t *im, uword opaque, u32 sw_if_index, ip4_address_t *address,
234   u32 address_length, u32 if_address_index, u32 is_delete);
235
236 static void nat44_ei_ip4_add_del_addr_only_sm_cb (
237   ip4_main_t *im, uword opaque, u32 sw_if_index, ip4_address_t *address,
238   u32 address_length, u32 if_address_index, u32 is_delete);
239
240 static void nat44_ei_update_outside_fib (ip4_main_t *im, uword opaque,
241                                          u32 sw_if_index, u32 new_fib_index,
242                                          u32 old_fib_index);
243
244 void
245 nat44_ei_set_node_indexes (nat44_ei_main_t *nm, vlib_main_t *vm)
246 {
247   vlib_node_t *node;
248   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-out2in");
249   nm->out2in_node_index = node->index;
250   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-in2out");
251   nm->in2out_node_index = node->index;
252   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-in2out-output");
253   nm->in2out_output_node_index = node->index;
254 }
255
256 int
257 nat44_ei_set_workers (uword *bitmap)
258 {
259   nat44_ei_main_t *nm = &nat44_ei_main;
260   int i, j = 0;
261
262   if (nm->num_workers < 2)
263     return VNET_API_ERROR_FEATURE_DISABLED;
264
265   if (clib_bitmap_last_set (bitmap) >= nm->num_workers)
266     return VNET_API_ERROR_INVALID_WORKER;
267
268   vec_free (nm->workers);
269   clib_bitmap_foreach (i, bitmap)
270     {
271       vec_add1 (nm->workers, i);
272       nm->per_thread_data[nm->first_worker_index + i].snat_thread_index = j;
273       nm->per_thread_data[nm->first_worker_index + i].thread_index = i;
274       j++;
275     }
276
277   nm->port_per_thread = (0xffff - 1024) / _vec_len (nm->workers);
278
279   return 0;
280 }
281
/*
 * Validate simple counter 'c' at index 'i' and then zero it at that index.
 *
 * The expansion deliberately has no trailing semicolon, so that
 * "nat_validate_simple_counter (c, i);" is exactly one statement and can be
 * used as the unbraced body of an if/else.
 */
#define nat_validate_simple_counter(c, i)                                     \
  do                                                                          \
    {                                                                         \
      vlib_validate_simple_counter (&(c), (i));                               \
      vlib_zero_simple_counter (&(c), (i));                                   \
    }                                                                         \
  while (0)
289
/*
 * Name simple counter 'c' ('n' is the counter name, 'sn' the stat segment
 * name), then validate and zero it at index 0.
 *
 * The expansion deliberately has no trailing semicolon, so that
 * "nat_init_simple_counter (c, n, sn);" is exactly one statement and can be
 * used as the unbraced body of an if/else.
 */
#define nat_init_simple_counter(c, n, sn)                                     \
  do                                                                          \
    {                                                                         \
      (c).name = (n);                                                         \
      (c).stat_segment_name = (sn);                                           \
      nat_validate_simple_counter ((c), 0);                                   \
    }                                                                         \
  while (0)
298
299 static_always_inline void
300 nat_validate_interface_counters (nat44_ei_main_t *nm, u32 sw_if_index)
301 {
302 #define _(x)                                                                  \
303   nat_validate_simple_counter (nm->counters.fastpath.in2out.x, sw_if_index);  \
304   nat_validate_simple_counter (nm->counters.fastpath.out2in.x, sw_if_index);  \
305   nat_validate_simple_counter (nm->counters.slowpath.in2out.x, sw_if_index);  \
306   nat_validate_simple_counter (nm->counters.slowpath.out2in.x, sw_if_index);
307   foreach_nat_counter;
308 #undef _
309   nat_validate_simple_counter (nm->counters.hairpinning, sw_if_index);
310 }
311
312 static void
313 nat44_ei_add_del_addr_to_fib_foreach_out_if (ip4_address_t *addr, u8 is_add)
314 {
315   nat44_ei_main_t *nm = &nat44_ei_main;
316   nat44_ei_interface_t *i;
317
318   pool_foreach (i, nm->interfaces)
319     {
320       if (nat44_ei_interface_is_outside (i) && !nm->out2in_dpo)
321         {
322           nat44_ei_add_del_addr_to_fib (addr, 32, i->sw_if_index, is_add);
323         }
324     }
325   pool_foreach (i, nm->output_feature_interfaces)
326     {
327       if (nat44_ei_interface_is_outside (i) && !nm->out2in_dpo)
328         {
329           nat44_ei_add_del_addr_to_fib (addr, 32, i->sw_if_index, is_add);
330         }
331     }
332 }
333
334 static_always_inline void
335 nat44_ei_add_del_addr_to_fib_foreach_addr (u32 sw_if_index, u8 is_add)
336 {
337   nat44_ei_main_t *nm = &nat44_ei_main;
338   nat44_ei_address_t *ap;
339
340   vec_foreach (ap, nm->addresses)
341     {
342       nat44_ei_add_del_addr_to_fib (&ap->addr, 32, sw_if_index, is_add);
343     }
344 }
345
346 static_always_inline void
347 nat44_ei_add_del_addr_to_fib_foreach_addr_only_sm (u32 sw_if_index, u8 is_add)
348 {
349   nat44_ei_main_t *nm = &nat44_ei_main;
350   nat44_ei_static_mapping_t *m;
351
352   pool_foreach (m, nm->static_mappings)
353     {
354       if (is_sm_addr_only (m->flags) &&
355           !(m->local_addr.as_u32 == m->external_addr.as_u32))
356         {
357           nat44_ei_add_del_addr_to_fib (&m->external_addr, 32, sw_if_index,
358                                         is_add);
359         }
360     }
361 }
362
363 static int
364 nat44_ei_is_address_used_in_static_mapping (ip4_address_t addr)
365 {
366   nat44_ei_main_t *nm = &nat44_ei_main;
367   nat44_ei_static_mapping_t *m;
368   pool_foreach (m, nm->static_mappings)
369     {
370       if (is_sm_addr_only (m->flags) || is_sm_identity_nat (m->flags))
371         {
372           continue;
373         }
374       if (m->external_addr.as_u32 == addr.as_u32)
375         {
376           return 1;
377         }
378     }
379   return 0;
380 }
381
382 clib_error_t *
383 nat44_ei_init (vlib_main_t *vm)
384 {
385   nat44_ei_main_t *nm = &nat44_ei_main;
386   vlib_thread_main_t *tm = vlib_get_thread_main ();
387   vlib_thread_registration_t *tr;
388   ip4_add_del_interface_address_callback_t cbi = { 0 };
389   ip4_table_bind_callback_t cbt = { 0 };
390   u32 i, num_threads = 0;
391   uword *p, *bitmap = 0;
392
393   clib_memset (nm, 0, sizeof (*nm));
394
395   // required
396   nm->vnet_main = vnet_get_main ();
397   // convenience
398   nm->ip4_main = &ip4_main;
399   nm->api_main = vlibapi_get_main ();
400   nm->ip4_lookup_main = &ip4_main.lookup_main;
401
402   // handoff stuff
403   nm->fq_out2in_index = ~0;
404   nm->fq_in2out_index = ~0;
405   nm->fq_in2out_output_index = ~0;
406
407   nm->log_level = NAT_LOG_ERROR;
408
409   nat44_ei_set_node_indexes (nm, vm);
410   nm->log_class = vlib_log_register_class ("nat44-ei", 0);
411
412   nat_init_simple_counter (nm->total_users, "total-users",
413                            "/nat44-ei/total-users");
414   nat_init_simple_counter (nm->total_sessions, "total-sessions",
415                            "/nat44-ei/total-sessions");
416   nat_init_simple_counter (nm->user_limit_reached, "user-limit-reached",
417                            "/nat44-ei/user-limit-reached");
418
419 #define _(x)                                                                  \
420   nat_init_simple_counter (nm->counters.fastpath.in2out.x, #x,                \
421                            "/nat44-ei/in2out/fastpath/" #x);                  \
422   nat_init_simple_counter (nm->counters.fastpath.out2in.x, #x,                \
423                            "/nat44-ei/out2in/fastpath/" #x);                  \
424   nat_init_simple_counter (nm->counters.slowpath.in2out.x, #x,                \
425                            "/nat44-ei/in2out/slowpath/" #x);                  \
426   nat_init_simple_counter (nm->counters.slowpath.out2in.x, #x,                \
427                            "/nat44-ei/out2in/slowpath/" #x);
428   foreach_nat_counter;
429 #undef _
430   nat_init_simple_counter (nm->counters.hairpinning, "hairpinning",
431                            "/nat44-ei/hairpinning");
432
433   p = hash_get_mem (tm->thread_registrations_by_name, "workers");
434   if (p)
435     {
436       tr = (vlib_thread_registration_t *) p[0];
437       if (tr)
438         {
439           nm->num_workers = tr->count;
440           nm->first_worker_index = tr->first_index;
441         }
442     }
443   num_threads = tm->n_vlib_mains - 1;
444   nm->port_per_thread = 0xffff - 1024;
445   vec_validate (nm->per_thread_data, num_threads);
446
447   /* Use all available workers by default */
448   if (nm->num_workers > 1)
449     {
450       for (i = 0; i < nm->num_workers; i++)
451         bitmap = clib_bitmap_set (bitmap, i, 1);
452       nat44_ei_set_workers (bitmap);
453       clib_bitmap_free (bitmap);
454     }
455   else
456     {
457       nm->per_thread_data[0].snat_thread_index = 0;
458     }
459
460   /* callbacks to call when interface address changes. */
461   cbi.function = nat44_ei_ip4_add_del_interface_address_cb;
462   vec_add1 (nm->ip4_main->add_del_interface_address_callbacks, cbi);
463   cbi.function = nat44_ei_ip4_add_del_addr_only_sm_cb;
464   vec_add1 (nm->ip4_main->add_del_interface_address_callbacks, cbi);
465
466   /* callbacks to call when interface to table biding changes */
467   cbt.function = nat44_ei_update_outside_fib;
468   vec_add1 (nm->ip4_main->table_bind_callbacks, cbt);
469
470   nm->fib_src_low = fib_source_allocate (
471     "nat44-ei-low", FIB_SOURCE_PRIORITY_LOW, FIB_SOURCE_BH_SIMPLE);
472   nm->fib_src_hi = fib_source_allocate ("nat44-ei-hi", FIB_SOURCE_PRIORITY_HI,
473                                         FIB_SOURCE_BH_SIMPLE);
474
475   // used only by out2in-dpo feature
476   nat_dpo_module_init ();
477   nat_ha_init (vm, nm->num_workers, num_threads);
478
479   nm->hairpinning_fq_index =
480     vlib_frame_queue_main_init (nat44_ei_hairpinning_node.index, 0);
481   nm->in2out_hairpinning_finish_ip4_lookup_node_fq_index =
482     vlib_frame_queue_main_init (
483       nat44_ei_in2out_hairpinning_finish_ip4_lookup_node.index, 0);
484   nm->in2out_hairpinning_finish_interface_output_node_fq_index =
485     vlib_frame_queue_main_init (
486       nat44_ei_in2out_hairpinning_finish_interface_output_node.index, 0);
487   return nat44_ei_api_hookup (vm);
488 }
489
490 VLIB_INIT_FUNCTION (nat44_ei_init);
491
492 int
493 nat44_ei_plugin_enable (nat44_ei_config_t c)
494 {
495   nat44_ei_main_t *nm = &nat44_ei_main;
496
497   fail_if_enabled ();
498
499   if (!c.users)
500     c.users = 1024;
501
502   if (!c.sessions)
503     c.sessions = 10 * 1024;
504
505   if (!c.user_sessions)
506     c.user_sessions = c.sessions;
507
508   nm->rconfig = c;
509
510   if (!nm->frame_queue_nelts)
511     nm->frame_queue_nelts = NAT_FQ_NELTS_DEFAULT;
512
513   nm->translations = c.sessions;
514   nm->translation_buckets = nat_calc_bihash_buckets (c.sessions);
515   nm->user_buckets = nat_calc_bihash_buckets (c.users);
516
517   nm->pat = (!c.static_mapping_only ||
518              (c.static_mapping_only && c.connection_tracking));
519
520   nm->static_mapping_only = c.static_mapping_only;
521   nm->static_mapping_connection_tracking = c.connection_tracking;
522   nm->out2in_dpo = c.out2in_dpo;
523   nm->forwarding_enabled = 0;
524   nm->mss_clamping = 0;
525
526   nm->max_users_per_thread = c.users;
527   nm->max_translations_per_thread = c.sessions;
528   nm->max_translations_per_user = c.user_sessions;
529
530   nm->inside_vrf_id = c.inside_vrf;
531   nm->inside_fib_index = fib_table_find_or_create_and_lock (
532     FIB_PROTOCOL_IP4, c.inside_vrf, nm->fib_src_hi);
533
534   nm->outside_vrf_id = c.outside_vrf;
535   nm->outside_fib_index = fib_table_find_or_create_and_lock (
536     FIB_PROTOCOL_IP4, c.outside_vrf, nm->fib_src_hi);
537
538   nat_reset_timeouts (&nm->timeouts);
539   nat44_ei_db_init (nm->translations, nm->translation_buckets,
540                     nm->user_buckets);
541   nat44_ei_set_alloc_default ();
542
543   vlib_zero_simple_counter (&nm->total_users, 0);
544   vlib_zero_simple_counter (&nm->total_sessions, 0);
545   vlib_zero_simple_counter (&nm->user_limit_reached, 0);
546
547   if (nm->num_workers > 1)
548     {
549       if (nm->fq_in2out_index == ~0)
550         {
551           nm->fq_in2out_index = vlib_frame_queue_main_init (
552             nm->in2out_node_index, nm->frame_queue_nelts);
553         }
554       if (nm->fq_out2in_index == ~0)
555         {
556           nm->fq_out2in_index = vlib_frame_queue_main_init (
557             nm->out2in_node_index, nm->frame_queue_nelts);
558         }
559       if (nm->fq_in2out_output_index == ~0)
560         {
561           nm->fq_in2out_output_index = vlib_frame_queue_main_init (
562             nm->in2out_output_node_index, nm->frame_queue_nelts);
563         }
564     }
565
566   nat_ha_enable ();
567   nm->enabled = 1;
568
569   return 0;
570 }
571
572 static_always_inline nat44_ei_outside_fib_t *
573 nat44_ei_get_outside_fib (nat44_ei_outside_fib_t *outside_fibs, u32 fib_index)
574 {
575   nat44_ei_outside_fib_t *f;
576   vec_foreach (f, outside_fibs)
577     {
578       if (f->fib_index == fib_index)
579         {
580           return f;
581         }
582     }
583   return 0;
584 }
585
586 static_always_inline nat44_ei_interface_t *
587 nat44_ei_get_interface (nat44_ei_interface_t *interfaces, u32 sw_if_index)
588 {
589   nat44_ei_interface_t *i;
590   pool_foreach (i, interfaces)
591     {
592       if (i->sw_if_index == sw_if_index)
593         {
594           return i;
595         }
596     }
597   return 0;
598 }
599
600 static_always_inline int
601 nat44_ei_hairpinning_enable (u8 is_enable)
602 {
603   nat44_ei_main_t *nm = &nat44_ei_main;
604   u32 sw_if_index = 0; // local0
605
606   if (is_enable)
607     {
608       nm->hairpin_reg += 1;
609       if (1 == nm->hairpin_reg)
610         {
611           return vnet_feature_enable_disable (
612             "ip4-local", "nat44-ei-hairpinning", sw_if_index, is_enable, 0, 0);
613         }
614     }
615   else
616     {
617       if (0 == nm->hairpin_reg)
618         return 1;
619
620       nm->hairpin_reg -= 1;
621       if (0 == nm->hairpin_reg)
622         {
623           return vnet_feature_enable_disable (
624             "ip4-local", "nat44-ei-hairpinning", sw_if_index, is_enable, 0, 0);
625         }
626     }
627
628   return 0;
629 }
630
631 int
632 nat44_ei_add_interface (u32 sw_if_index, u8 is_inside)
633 {
634   const char *feature_name, *del_feature_name;
635   nat44_ei_main_t *nm = &nat44_ei_main;
636
637   nat44_ei_outside_fib_t *outside_fib;
638   nat44_ei_interface_t *i;
639   u32 fib_index;
640   int rv;
641
642   fail_if_disabled ();
643
644   if (nm->out2in_dpo && !is_inside)
645     {
646       nat44_ei_log_err ("error unsupported");
647       return VNET_API_ERROR_UNSUPPORTED;
648     }
649
650   if (nat44_ei_get_interface (nm->output_feature_interfaces, sw_if_index))
651     {
652       nat44_ei_log_err ("error interface already configured");
653       return VNET_API_ERROR_VALUE_EXIST;
654     }
655
656   i = nat44_ei_get_interface (nm->interfaces, sw_if_index);
657   if (i)
658     {
659       if ((nat44_ei_interface_is_inside (i) && is_inside) ||
660           (nat44_ei_interface_is_outside (i) && !is_inside))
661         {
662           return 0;
663         }
664       if (nm->num_workers > 1)
665         {
666           del_feature_name = !is_inside ? "nat44-ei-in2out-worker-handoff" :
667                                           "nat44-ei-out2in-worker-handoff";
668           feature_name = "nat44-ei-handoff-classify";
669         }
670       else
671         {
672           del_feature_name =
673             !is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
674
675           feature_name = "nat44-ei-classify";
676         }
677
678       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
679       if (rv)
680         {
681           return rv;
682         }
683       rv = vnet_feature_enable_disable ("ip4-unicast", del_feature_name,
684                                         sw_if_index, 0, 0, 0);
685       if (rv)
686         {
687           return rv;
688         }
689       rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
690                                         sw_if_index, 1, 0, 0);
691       if (rv)
692         {
693           return rv;
694         }
695       if (!is_inside)
696         {
697           rv = nat44_ei_hairpinning_enable (0);
698           if (rv)
699             {
700               return rv;
701             }
702         }
703     }
704   else
705     {
706       if (nm->num_workers > 1)
707         {
708           feature_name = is_inside ? "nat44-ei-in2out-worker-handoff" :
709                                      "nat44-ei-out2in-worker-handoff";
710         }
711       else
712         {
713           feature_name = is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
714         }
715       nat_validate_interface_counters (nm, sw_if_index);
716
717       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
718       if (rv)
719         {
720           return rv;
721         }
722       rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
723                                         sw_if_index, 1, 0, 0);
724       if (rv)
725         {
726           return rv;
727         }
728       if (is_inside && !nm->out2in_dpo)
729         {
730           rv = nat44_ei_hairpinning_enable (1);
731           if (rv)
732             {
733               return rv;
734             }
735         }
736
737       pool_get (nm->interfaces, i);
738       i->sw_if_index = sw_if_index;
739       i->flags = 0;
740     }
741
742   fib_index =
743     fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);
744
745   if (!is_inside)
746     {
747       i->flags |= NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;
748
749       outside_fib = nat44_ei_get_outside_fib (nm->outside_fibs, fib_index);
750       if (outside_fib)
751         {
752           outside_fib->refcount++;
753         }
754       else
755         {
756           vec_add2 (nm->outside_fibs, outside_fib, 1);
757           outside_fib->fib_index = fib_index;
758           outside_fib->refcount = 1;
759         }
760
761       nat44_ei_add_del_addr_to_fib_foreach_addr (sw_if_index, 1);
762       nat44_ei_add_del_addr_to_fib_foreach_addr_only_sm (sw_if_index, 1);
763     }
764   else
765     {
766       i->flags |= NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
767     }
768
769   return 0;
770 }
771
772 int
773 nat44_ei_del_interface (u32 sw_if_index, u8 is_inside)
774 {
775   const char *feature_name, *del_feature_name;
776   nat44_ei_main_t *nm = &nat44_ei_main;
777
778   nat44_ei_outside_fib_t *outside_fib;
779   nat44_ei_interface_t *i;
780   u32 fib_index;
781   int rv;
782
783   fail_if_disabled ();
784
785   if (nm->out2in_dpo && !is_inside)
786     {
787       nat44_ei_log_err ("error unsupported");
788       return VNET_API_ERROR_UNSUPPORTED;
789     }
790
791   i = nat44_ei_get_interface (nm->interfaces, sw_if_index);
792   if (i == 0)
793     {
794       nat44_ei_log_err ("error interface couldn't be found");
795       return VNET_API_ERROR_NO_SUCH_ENTRY;
796     }
797
798   if (nat44_ei_interface_is_inside (i) && nat44_ei_interface_is_outside (i))
799     {
800       if (nm->num_workers > 1)
801         {
802           del_feature_name = "nat44-ei-handoff-classify";
803           feature_name = !is_inside ? "nat44-ei-in2out-worker-handoff" :
804                                       "nat44-ei-out2in-worker-handoff";
805         }
806       else
807         {
808           del_feature_name = "nat44-ei-classify";
809           feature_name = !is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
810         }
811
812       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
813       if (rv)
814         {
815           return rv;
816         }
817       rv = vnet_feature_enable_disable ("ip4-unicast", del_feature_name,
818                                         sw_if_index, 0, 0, 0);
819       if (rv)
820         {
821           return rv;
822         }
823       rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
824                                         sw_if_index, 1, 0, 0);
825       if (rv)
826         {
827           return rv;
828         }
829       if (is_inside)
830         {
831           i->flags &= ~NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
832         }
833       else
834         {
835           rv = nat44_ei_hairpinning_enable (1);
836           if (rv)
837             {
838               return rv;
839             }
840           i->flags &= ~NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;
841         }
842     }
843   else
844     {
845       if (nm->num_workers > 1)
846         {
847           feature_name = is_inside ? "nat44-ei-in2out-worker-handoff" :
848                                      "nat44-ei-out2in-worker-handoff";
849         }
850       else
851         {
852           feature_name = is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
853         }
854
855       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
856       if (rv)
857         {
858           return rv;
859         }
860       rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
861                                         sw_if_index, 0, 0, 0);
862       if (rv)
863         {
864           return rv;
865         }
866       if (is_inside)
867         {
868           rv = nat44_ei_hairpinning_enable (0);
869           if (rv)
870             {
871               return rv;
872             }
873         }
874
875       // remove interface
876       pool_put (nm->interfaces, i);
877     }
878
879   if (!is_inside)
880     {
881       fib_index =
882         fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);
883       outside_fib = nat44_ei_get_outside_fib (nm->outside_fibs, fib_index);
884       if (outside_fib)
885         {
886           outside_fib->refcount--;
887           if (!outside_fib->refcount)
888             {
889               vec_del1 (nm->outside_fibs, outside_fib - nm->outside_fibs);
890             }
891         }
892
893       nat44_ei_add_del_addr_to_fib_foreach_addr (sw_if_index, 0);
894       nat44_ei_add_del_addr_to_fib_foreach_addr_only_sm (sw_if_index, 0);
895     }
896
897   return 0;
898 }
899
900 int
901 nat44_ei_add_output_interface (u32 sw_if_index)
902 {
903   nat44_ei_main_t *nm = &nat44_ei_main;
904
905   nat44_ei_outside_fib_t *outside_fib;
906   nat44_ei_interface_t *i;
907   u32 fib_index;
908   int rv;
909
910   fail_if_disabled ();
911
912   if (nat44_ei_get_interface (nm->interfaces, sw_if_index))
913     {
914       nat44_ei_log_err ("error interface already configured");
915       return VNET_API_ERROR_VALUE_EXIST;
916     }
917
918   if (nat44_ei_get_interface (nm->output_feature_interfaces, sw_if_index))
919     {
920       nat44_ei_log_err ("error interface already configured");
921       return VNET_API_ERROR_VALUE_EXIST;
922     }
923
924   if (nm->num_workers > 1)
925     {
926       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
927       if (rv)
928         {
929           return rv;
930         }
931       rv = ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, 1);
932       if (rv)
933         {
934           return rv;
935         }
936       rv = vnet_feature_enable_disable (
937         "ip4-unicast", "nat44-ei-out2in-worker-handoff", sw_if_index, 1, 0, 0);
938       if (rv)
939         {
940           return rv;
941         }
942       rv = vnet_feature_enable_disable (
943         "ip4-output", "nat44-ei-in2out-output-worker-handoff", sw_if_index, 1,
944         0, 0);
945       if (rv)
946         {
947           return rv;
948         }
949     }
950   else
951     {
952       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
953       if (rv)
954         {
955           return rv;
956         }
957       rv = ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, 1);
958       if (rv)
959         {
960           return rv;
961         }
962       rv = vnet_feature_enable_disable ("ip4-unicast", "nat44-ei-out2in",
963                                         sw_if_index, 1, 0, 0);
964       if (rv)
965         {
966           return rv;
967         }
968       rv = vnet_feature_enable_disable ("ip4-output", "nat44-ei-in2out-output",
969                                         sw_if_index, 1, 0, 0);
970       if (rv)
971         {
972           return rv;
973         }
974     }
975
976   nat_validate_interface_counters (nm, sw_if_index);
977
978   pool_get (nm->output_feature_interfaces, i);
979   i->sw_if_index = sw_if_index;
980   i->flags = 0;
981   i->flags |= NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
982   i->flags |= NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;
983
984   fib_index =
985     fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);
986   outside_fib = nat44_ei_get_outside_fib (nm->outside_fibs, fib_index);
987   if (outside_fib)
988     {
989       outside_fib->refcount++;
990     }
991   else
992     {
993       vec_add2 (nm->outside_fibs, outside_fib, 1);
994       outside_fib->fib_index = fib_index;
995       outside_fib->refcount = 1;
996     }
997
998   nat44_ei_add_del_addr_to_fib_foreach_addr (sw_if_index, 1);
999   nat44_ei_add_del_addr_to_fib_foreach_addr_only_sm (sw_if_index, 1);
1000
1001   return 0;
1002 }
1003
1004 int
1005 nat44_ei_del_output_interface (u32 sw_if_index)
1006 {
1007   nat44_ei_main_t *nm = &nat44_ei_main;
1008
1009   nat44_ei_outside_fib_t *outside_fib;
1010   nat44_ei_interface_t *i;
1011   u32 fib_index;
1012   int rv;
1013
1014   fail_if_disabled ();
1015
1016   i = nat44_ei_get_interface (nm->output_feature_interfaces, sw_if_index);
1017   if (!i)
1018     {
1019       nat44_ei_log_err ("error interface couldn't be found");
1020       return VNET_API_ERROR_NO_SUCH_ENTRY;
1021     }
1022
1023   if (nm->num_workers > 1)
1024     {
1025       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
1026       if (rv)
1027         {
1028           return rv;
1029         }
1030       rv = ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, 0);
1031       if (rv)
1032         {
1033           return rv;
1034         }
1035       rv = vnet_feature_enable_disable (
1036         "ip4-unicast", "nat44-ei-out2in-worker-handoff", sw_if_index, 0, 0, 0);
1037       if (rv)
1038         {
1039           return rv;
1040         }
1041       rv = vnet_feature_enable_disable (
1042         "ip4-output", "nat44-ei-in2out-output-worker-handoff", sw_if_index, 0,
1043         0, 0);
1044       if (rv)
1045         {
1046           return rv;
1047         }
1048     }
1049   else
1050     {
1051       rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
1052       if (rv)
1053         {
1054           return rv;
1055         }
1056       rv = ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, 0);
1057       if (rv)
1058         {
1059           return rv;
1060         }
1061       rv = vnet_feature_enable_disable ("ip4-unicast", "nat44-ei-out2in",
1062                                         sw_if_index, 0, 0, 0);
1063       if (rv)
1064         {
1065           return rv;
1066         }
1067       rv = vnet_feature_enable_disable ("ip4-output", "nat44-ei-in2out-output",
1068                                         sw_if_index, 0, 0, 0);
1069       if (rv)
1070         {
1071           return rv;
1072         }
1073     }
1074
1075   pool_put (nm->output_feature_interfaces, i);
1076
1077   fib_index =
1078     fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);
1079   outside_fib = nat44_ei_get_outside_fib (nm->outside_fibs, fib_index);
1080   if (outside_fib)
1081     {
1082       outside_fib->refcount--;
1083       if (!outside_fib->refcount)
1084         {
1085           vec_del1 (nm->outside_fibs, outside_fib - nm->outside_fibs);
1086         }
1087     }
1088
1089   nat44_ei_add_del_addr_to_fib_foreach_addr (sw_if_index, 0);
1090   nat44_ei_add_del_addr_to_fib_foreach_addr_only_sm (sw_if_index, 0);
1091
1092   return 0;
1093 }
1094
1095 int
1096 nat44_ei_add_del_output_interface (u32 sw_if_index, int is_del)
1097 {
1098   if (is_del)
1099     {
1100       return nat44_ei_del_output_interface (sw_if_index);
1101     }
1102   else
1103     {
1104       return nat44_ei_add_output_interface (sw_if_index);
1105     }
1106 }
1107
1108 int
1109 nat44_ei_del_addresses ()
1110 {
1111   nat44_ei_main_t *nm = &nat44_ei_main;
1112   nat44_ei_address_t *a, *vec;
1113   int error = 0;
1114
1115   vec = vec_dup (nm->addresses);
1116   vec_foreach (a, vec)
1117     {
1118       error = nat44_ei_del_address (a->addr, 0);
1119
1120       if (error)
1121         {
1122           nat44_ei_log_err ("error occurred while removing adderess");
1123         }
1124     }
1125   vec_free (vec);
1126   vec_free (nm->addresses);
1127   nm->addresses = 0;
1128
1129   vec_free (nm->auto_add_sw_if_indices);
1130   nm->auto_add_sw_if_indices = 0;
1131   return error;
1132 }
1133
1134 int
1135 nat44_ei_del_interfaces ()
1136 {
1137   nat44_ei_main_t *nm = &nat44_ei_main;
1138   nat44_ei_interface_t *i, *pool;
1139   int error = 0;
1140
1141   pool = pool_dup (nm->interfaces);
1142   pool_foreach (i, pool)
1143     {
1144       if (nat44_ei_interface_is_inside (i))
1145         {
1146           error = nat44_ei_del_interface (i->sw_if_index, 1);
1147         }
1148       if (nat44_ei_interface_is_outside (i))
1149         {
1150           error = nat44_ei_del_interface (i->sw_if_index, 0);
1151         }
1152
1153       if (error)
1154         {
1155           nat44_ei_log_err ("error occurred while removing interface");
1156         }
1157     }
1158   pool_free (pool);
1159   pool_free (nm->interfaces);
1160   nm->interfaces = 0;
1161   return error;
1162 }
1163
1164 int
1165 nat44_ei_del_output_interfaces ()
1166 {
1167   nat44_ei_main_t *nm = &nat44_ei_main;
1168   nat44_ei_interface_t *i, *pool;
1169   int error = 0;
1170
1171   pool = pool_dup (nm->output_feature_interfaces);
1172   pool_foreach (i, pool)
1173     {
1174       error = nat44_ei_del_output_interface (i->sw_if_index);
1175       if (error)
1176         {
1177           nat44_ei_log_err ("error occurred while removing output interface");
1178         }
1179     }
1180   pool_free (pool);
1181   pool_free (nm->output_feature_interfaces);
1182   nm->output_feature_interfaces = 0;
1183   return error;
1184 }
1185
1186 int
1187 nat44_ei_del_static_mappings ()
1188 {
1189   nat44_ei_main_t *nm = &nat44_ei_main;
1190   nat44_ei_static_mapping_t *m, *pool;
1191   int error = 0;
1192
1193   pool = pool_dup (nm->static_mappings);
1194   pool_foreach (m, pool)
1195     {
1196       error = nat44_ei_del_static_mapping_internal (
1197         m->local_addr, m->external_addr, m->local_port, m->external_port,
1198         m->proto, m->vrf_id, ~0, m->flags);
1199       if (error)
1200         {
1201           nat44_ei_log_err ("error occurred while removing mapping");
1202         }
1203     }
1204   pool_free (pool);
1205   pool_free (nm->static_mappings);
1206   nm->static_mappings = 0;
1207
1208   vec_free (nm->to_resolve);
1209   nm->to_resolve = 0;
1210
1211   clib_bihash_free_8_8 (&nm->static_mapping_by_local);
1212   clib_bihash_free_8_8 (&nm->static_mapping_by_external);
1213
1214   return error;
1215 }
1216
1217 int
1218 nat44_ei_plugin_disable ()
1219 {
1220   nat44_ei_main_t *nm = &nat44_ei_main;
1221   nat44_ei_main_per_thread_data_t *tnm;
1222   int rc, error = 0;
1223
1224   nat_ha_disable ();
1225
1226   rc = nat44_ei_del_static_mappings ();
1227   if (rc)
1228     error = 1;
1229
1230   rc = nat44_ei_del_addresses ();
1231   if (rc)
1232     error = 1;
1233
1234   rc = nat44_ei_del_interfaces ();
1235   if (rc)
1236     error = 1;
1237
1238   rc = nat44_ei_del_output_interfaces ();
1239   if (rc)
1240     error = 1;
1241
1242   if (nm->pat)
1243     {
1244       clib_bihash_free_8_8 (&nm->in2out);
1245       clib_bihash_free_8_8 (&nm->out2in);
1246
1247       vec_foreach (tnm, nm->per_thread_data)
1248         {
1249           nat44_ei_worker_db_free (tnm);
1250         }
1251     }
1252
1253   clib_memset (&nm->rconfig, 0, sizeof (nm->rconfig));
1254
1255   nm->forwarding_enabled = 0;
1256   nm->enabled = 0;
1257
1258   return error;
1259 }
1260
1261 int
1262 nat44_ei_set_outside_address_and_port (nat44_ei_address_t *addresses,
1263                                        u32 thread_index, ip4_address_t addr,
1264                                        u16 port, nat_protocol_t protocol)
1265 {
1266   nat44_ei_address_t *a = 0;
1267   u32 address_index;
1268   u16 port_host_byte_order = clib_net_to_host_u16 (port);
1269
1270   for (address_index = 0; address_index < vec_len (addresses); address_index++)
1271     {
1272       if (addresses[address_index].addr.as_u32 != addr.as_u32)
1273         continue;
1274
1275       a = addresses + address_index;
1276       if (nat44_ei_port_is_used (a, protocol, port_host_byte_order))
1277         return VNET_API_ERROR_INSTANCE_IN_USE;
1278
1279       nat44_ei_port_get (a, protocol, port_host_byte_order);
1280       a->busy_ports_per_thread[protocol][thread_index]++;
1281       a->busy_ports[protocol]++;
1282       return 0;
1283     }
1284
1285   return VNET_API_ERROR_NO_SUCH_ENTRY;
1286 }
1287
1288 void
1289 nat44_ei_add_del_address_dpo (ip4_address_t addr, u8 is_add)
1290 {
1291   nat44_ei_main_t *nm = &nat44_ei_main;
1292   dpo_id_t dpo_v4 = DPO_INVALID;
1293   fib_prefix_t pfx = {
1294     .fp_proto = FIB_PROTOCOL_IP4,
1295     .fp_len = 32,
1296     .fp_addr.ip4.as_u32 = addr.as_u32,
1297   };
1298
1299   if (is_add)
1300     {
1301       nat_dpo_create (DPO_PROTO_IP4, 0, &dpo_v4);
1302       fib_table_entry_special_dpo_add (0, &pfx, nm->fib_src_hi,
1303                                        FIB_ENTRY_FLAG_EXCLUSIVE, &dpo_v4);
1304       dpo_reset (&dpo_v4);
1305     }
1306   else
1307     {
1308       fib_table_entry_special_remove (0, &pfx, nm->fib_src_hi);
1309     }
1310 }
1311
1312 void
1313 nat44_ei_free_outside_address_and_port (nat44_ei_address_t *addresses,
1314                                         u32 thread_index, ip4_address_t *addr,
1315                                         u16 port, nat_protocol_t protocol)
1316 {
1317   nat44_ei_address_t *a;
1318   u32 address_index;
1319   u16 port_host_byte_order = clib_net_to_host_u16 (port);
1320
1321   for (address_index = 0; address_index < vec_len (addresses); address_index++)
1322     {
1323       if (addresses[address_index].addr.as_u32 == addr->as_u32)
1324         break;
1325     }
1326
1327   ASSERT (address_index < vec_len (addresses));
1328
1329   a = addresses + address_index;
1330   nat44_ei_port_put (a, protocol, port_host_byte_order);
1331   a->busy_ports[protocol]--;
1332   a->busy_ports_per_thread[protocol][thread_index]--;
1333 }
1334
1335 void
1336 nat44_ei_free_session_data_v2 (nat44_ei_main_t *nm, nat44_ei_session_t *s,
1337                                u32 thread_index, u8 is_ha)
1338 {
1339   clib_bihash_kv_8_8_t kv;
1340
1341   /* session lookup tables */
1342   init_nat_i2o_k (&kv, s);
1343   if (clib_bihash_add_del_8_8 (&nm->in2out, &kv, 0))
1344     nat_elog_warn (nm, "in2out key del failed");
1345   init_nat_o2i_k (&kv, s);
1346   if (clib_bihash_add_del_8_8 (&nm->out2in, &kv, 0))
1347     nat_elog_warn (nm, "out2in key del failed");
1348
1349   if (!is_ha)
1350     nat_syslog_nat44_apmdel (s->user_index, s->in2out.fib_index,
1351                              &s->in2out.addr, s->in2out.port, &s->out2in.addr,
1352                              s->out2in.port, s->nat_proto);
1353
1354   if (nat44_ei_is_unk_proto_session (s))
1355     return;
1356
1357   if (!is_ha)
1358     {
1359       /* log NAT event */
1360       nat_ipfix_logging_nat44_ses_delete (
1361         thread_index, s->in2out.addr.as_u32, s->out2in.addr.as_u32,
1362         nat_proto_to_ip_proto (s->nat_proto), s->in2out.port, s->out2in.port,
1363         s->in2out.fib_index);
1364
1365       nat_ha_sdel (&s->out2in.addr, s->out2in.port, &s->ext_host_addr,
1366                    s->ext_host_port, s->nat_proto, s->out2in.fib_index,
1367                    thread_index);
1368     }
1369
1370   if (nat44_ei_is_session_static (s))
1371     return;
1372
1373   nat44_ei_free_outside_address_and_port (nm->addresses, thread_index,
1374                                           &s->out2in.addr, s->out2in.port,
1375                                           s->nat_proto);
1376 }
1377
1378 nat44_ei_user_t *
1379 nat44_ei_user_get_or_create (nat44_ei_main_t *nm, ip4_address_t *addr,
1380                              u32 fib_index, u32 thread_index)
1381 {
1382   nat44_ei_user_t *u = 0;
1383   nat44_ei_user_key_t user_key;
1384   clib_bihash_kv_8_8_t kv, value;
1385   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1386   dlist_elt_t *per_user_list_head_elt;
1387
1388   user_key.addr.as_u32 = addr->as_u32;
1389   user_key.fib_index = fib_index;
1390   kv.key = user_key.as_u64;
1391
1392   /* Ever heard of the "user" = src ip4 address before? */
1393   if (clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1394     {
1395       if (pool_elts (tnm->users) >= nm->max_users_per_thread)
1396         {
1397           vlib_increment_simple_counter (&nm->user_limit_reached, thread_index,
1398                                          0, 1);
1399           nat_elog_warn (nm, "maximum user limit reached");
1400           return NULL;
1401         }
1402       /* no, make a new one */
1403       pool_get (tnm->users, u);
1404       clib_memset (u, 0, sizeof (*u));
1405
1406       u->addr.as_u32 = addr->as_u32;
1407       u->fib_index = fib_index;
1408
1409       pool_get (tnm->list_pool, per_user_list_head_elt);
1410
1411       u->sessions_per_user_list_head_index =
1412         per_user_list_head_elt - tnm->list_pool;
1413
1414       clib_dlist_init (tnm->list_pool, u->sessions_per_user_list_head_index);
1415
1416       kv.value = u - tnm->users;
1417
1418       /* add user */
1419       if (clib_bihash_add_del_8_8 (&tnm->user_hash, &kv, 1))
1420         {
1421           nat_elog_warn (nm, "user_hash key add failed");
1422           nat44_ei_delete_user_with_no_session (nm, u, thread_index);
1423           return NULL;
1424         }
1425
1426       vlib_set_simple_counter (&nm->total_users, thread_index, 0,
1427                                pool_elts (tnm->users));
1428     }
1429   else
1430     {
1431       u = pool_elt_at_index (tnm->users, value.value);
1432     }
1433
1434   return u;
1435 }
1436
1437 nat44_ei_session_t *
1438 nat44_ei_session_alloc_or_recycle (nat44_ei_main_t *nm, nat44_ei_user_t *u,
1439                                    u32 thread_index, f64 now)
1440 {
1441   nat44_ei_session_t *s;
1442   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1443   u32 oldest_per_user_translation_list_index, session_index;
1444   dlist_elt_t *oldest_per_user_translation_list_elt;
1445   dlist_elt_t *per_user_translation_list_elt;
1446
1447   /* Over quota? Recycle the least recently used translation */
1448   if ((u->nsessions + u->nstaticsessions) >= nm->max_translations_per_user)
1449     {
1450       oldest_per_user_translation_list_index = clib_dlist_remove_head (
1451         tnm->list_pool, u->sessions_per_user_list_head_index);
1452
1453       ASSERT (oldest_per_user_translation_list_index != ~0);
1454
1455       /* Add it back to the end of the LRU list */
1456       clib_dlist_addtail (tnm->list_pool, u->sessions_per_user_list_head_index,
1457                           oldest_per_user_translation_list_index);
1458       /* Get the list element */
1459       oldest_per_user_translation_list_elt = pool_elt_at_index (
1460         tnm->list_pool, oldest_per_user_translation_list_index);
1461
1462       /* Get the session index from the list element */
1463       session_index = oldest_per_user_translation_list_elt->value;
1464
1465       /* Get the session */
1466       s = pool_elt_at_index (tnm->sessions, session_index);
1467
1468       nat44_ei_free_session_data_v2 (nm, s, thread_index, 0);
1469       if (nat44_ei_is_session_static (s))
1470         u->nstaticsessions--;
1471       else
1472         u->nsessions--;
1473       s->flags = 0;
1474       s->total_bytes = 0;
1475       s->total_pkts = 0;
1476       s->state = 0;
1477       s->ext_host_addr.as_u32 = 0;
1478       s->ext_host_port = 0;
1479       s->ext_host_nat_addr.as_u32 = 0;
1480       s->ext_host_nat_port = 0;
1481     }
1482   else
1483     {
1484       pool_get (tnm->sessions, s);
1485       clib_memset (s, 0, sizeof (*s));
1486
1487       /* Create list elts */
1488       pool_get (tnm->list_pool, per_user_translation_list_elt);
1489       clib_dlist_init (tnm->list_pool,
1490                        per_user_translation_list_elt - tnm->list_pool);
1491
1492       per_user_translation_list_elt->value = s - tnm->sessions;
1493       s->per_user_index = per_user_translation_list_elt - tnm->list_pool;
1494       s->per_user_list_head_index = u->sessions_per_user_list_head_index;
1495
1496       clib_dlist_addtail (tnm->list_pool, s->per_user_list_head_index,
1497                           per_user_translation_list_elt - tnm->list_pool);
1498
1499       s->user_index = u - tnm->users;
1500       vlib_set_simple_counter (&nm->total_sessions, thread_index, 0,
1501                                pool_elts (tnm->sessions));
1502     }
1503
1504   s->ha_last_refreshed = now;
1505
1506   return s;
1507 }
1508
1509 void
1510 nat44_ei_free_session_data (nat44_ei_main_t *nm, nat44_ei_session_t *s,
1511                             u32 thread_index, u8 is_ha)
1512 {
1513   clib_bihash_kv_8_8_t kv;
1514
1515   init_nat_i2o_k (&kv, s);
1516   if (clib_bihash_add_del_8_8 (&nm->in2out, &kv, 0))
1517     nat_elog_warn (nm, "in2out key del failed");
1518
1519   init_nat_o2i_k (&kv, s);
1520   if (clib_bihash_add_del_8_8 (&nm->out2in, &kv, 0))
1521     nat_elog_warn (nm, "out2in key del failed");
1522
1523   if (!is_ha)
1524     {
1525       nat_syslog_nat44_apmdel (s->user_index, s->in2out.fib_index,
1526                                &s->in2out.addr, s->in2out.port,
1527                                &s->out2in.addr, s->out2in.port, s->nat_proto);
1528
1529       nat_ipfix_logging_nat44_ses_delete (
1530         thread_index, s->in2out.addr.as_u32, s->out2in.addr.as_u32,
1531         nat_proto_to_ip_proto (s->nat_proto), s->in2out.port, s->out2in.port,
1532         s->in2out.fib_index);
1533
1534       nat_ha_sdel (&s->out2in.addr, s->out2in.port, &s->ext_host_addr,
1535                    s->ext_host_port, s->nat_proto, s->out2in.fib_index,
1536                    thread_index);
1537     }
1538
1539   if (nat44_ei_is_session_static (s))
1540     return;
1541
1542   nat44_ei_free_outside_address_and_port (nm->addresses, thread_index,
1543                                           &s->out2in.addr, s->out2in.port,
1544                                           s->nat_proto);
1545 }
1546
1547 static_always_inline void
1548 nat44_ei_user_del_sessions (nat44_ei_user_t *u, u32 thread_index)
1549 {
1550   dlist_elt_t *elt;
1551   nat44_ei_session_t *s;
1552
1553   nat44_ei_main_t *nm = &nat44_ei_main;
1554   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1555
1556   // get head
1557   elt =
1558     pool_elt_at_index (tnm->list_pool, u->sessions_per_user_list_head_index);
1559   // get first element
1560   elt = pool_elt_at_index (tnm->list_pool, elt->next);
1561
1562   while (elt->value != ~0)
1563     {
1564       s = pool_elt_at_index (tnm->sessions, elt->value);
1565       elt = pool_elt_at_index (tnm->list_pool, elt->next);
1566
1567       nat44_ei_free_session_data (nm, s, thread_index, 0);
1568       nat44_ei_delete_session (nm, s, thread_index);
1569     }
1570 }
1571
1572 int
1573 nat44_ei_user_del (ip4_address_t *addr, u32 fib_index)
1574 {
1575   int rv = 1;
1576
1577   nat44_ei_main_t *nm = &nat44_ei_main;
1578   nat44_ei_main_per_thread_data_t *tnm;
1579
1580   nat44_ei_user_key_t user_key;
1581   clib_bihash_kv_8_8_t kv, value;
1582
1583   user_key.addr.as_u32 = addr->as_u32;
1584   user_key.fib_index = fib_index;
1585   kv.key = user_key.as_u64;
1586
1587   if (nm->num_workers > 1)
1588     {
1589       vec_foreach (tnm, nm->per_thread_data)
1590         {
1591           if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1592             {
1593               nat44_ei_user_del_sessions (
1594                 pool_elt_at_index (tnm->users, value.value),
1595                 tnm->thread_index);
1596               rv = 0;
1597               break;
1598             }
1599         }
1600     }
1601   else
1602     {
1603       tnm = vec_elt_at_index (nm->per_thread_data, nm->num_workers);
1604       if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1605         {
1606           nat44_ei_user_del_sessions (
1607             pool_elt_at_index (tnm->users, value.value), tnm->thread_index);
1608           rv = 0;
1609         }
1610     }
1611   return rv;
1612 }
1613
1614 void
1615 nat44_ei_static_mapping_del_sessions (nat44_ei_main_t *nm,
1616                                       nat44_ei_main_per_thread_data_t *tnm,
1617                                       nat44_ei_user_key_t u_key, int addr_only,
1618                                       ip4_address_t e_addr, u16 e_port)
1619 {
1620   clib_bihash_kv_8_8_t kv, value;
1621   kv.key = u_key.as_u64;
1622   u64 user_index;
1623   dlist_elt_t *head, *elt;
1624   nat44_ei_user_t *u;
1625   nat44_ei_session_t *s;
1626   u32 elt_index, head_index, ses_index;
1627
1628   if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1629     {
1630       user_index = value.value;
1631       u = pool_elt_at_index (tnm->users, user_index);
1632       if (u->nstaticsessions)
1633         {
1634           head_index = u->sessions_per_user_list_head_index;
1635           head = pool_elt_at_index (tnm->list_pool, head_index);
1636           elt_index = head->next;
1637           elt = pool_elt_at_index (tnm->list_pool, elt_index);
1638           ses_index = elt->value;
1639           while (ses_index != ~0)
1640             {
1641               s = pool_elt_at_index (tnm->sessions, ses_index);
1642               elt = pool_elt_at_index (tnm->list_pool, elt->next);
1643               ses_index = elt->value;
1644
1645               if (!addr_only)
1646                 {
1647                   if ((s->out2in.addr.as_u32 != e_addr.as_u32) ||
1648                       (s->out2in.port != e_port))
1649                     continue;
1650                 }
1651
1652               if (!nat44_ei_is_session_static (s))
1653                 continue;
1654
1655               nat44_ei_free_session_data_v2 (nm, s, tnm - nm->per_thread_data,
1656                                              0);
1657               nat44_ei_delete_session (nm, s, tnm - nm->per_thread_data);
1658
1659               if (!addr_only)
1660                 break;
1661             }
1662         }
1663     }
1664 }
1665
1666 u32
1667 nat44_ei_get_in2out_worker_index (ip4_header_t *ip0, u32 rx_fib_index0,
1668                                   u8 is_output)
1669 {
1670   nat44_ei_main_t *nm = &nat44_ei_main;
1671   u32 next_worker_index = 0;
1672   u32 hash;
1673
1674   next_worker_index = nm->first_worker_index;
1675   hash = ip0->src_address.as_u32 + (ip0->src_address.as_u32 >> 8) +
1676          (ip0->src_address.as_u32 >> 16) + (ip0->src_address.as_u32 >> 24);
1677
1678   if (PREDICT_TRUE (is_pow2 (_vec_len (nm->workers))))
1679     next_worker_index += nm->workers[hash & (_vec_len (nm->workers) - 1)];
1680   else
1681     next_worker_index += nm->workers[hash % _vec_len (nm->workers)];
1682
1683   return next_worker_index;
1684 }
1685
1686 u32
1687 nat44_ei_get_thread_idx_by_port (u16 e_port)
1688 {
1689   nat44_ei_main_t *nm = &nat44_ei_main;
1690   u32 thread_idx = nm->num_workers;
1691   if (nm->num_workers > 1)
1692     {
1693       thread_idx = nm->first_worker_index +
1694                    nm->workers[(e_port - 1024) / nm->port_per_thread %
1695                                _vec_len (nm->workers)];
1696     }
1697   return thread_idx;
1698 }
1699
1700 u32
1701 nat44_ei_get_out2in_worker_index (vlib_buffer_t *b, ip4_header_t *ip0,
1702                                   u32 rx_fib_index0, u8 is_output)
1703 {
1704   nat44_ei_main_t *nm = &nat44_ei_main;
1705   udp_header_t *udp;
1706   u16 port;
1707   clib_bihash_kv_8_8_t kv, value;
1708   nat44_ei_static_mapping_t *m;
1709   u32 proto;
1710   u32 next_worker_index = 0;
1711
1712   /* first try static mappings without port */
1713   if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
1714     {
1715       init_nat_k (&kv, ip0->dst_address, 0, rx_fib_index0, 0);
1716       if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
1717                                    &value))
1718         {
1719           m = pool_elt_at_index (nm->static_mappings, value.value);
1720           return m->workers[0];
1721         }
1722     }
1723
1724   proto = ip_proto_to_nat_proto (ip0->protocol);
1725   udp = ip4_next_header (ip0);
1726   port = vnet_buffer (b)->ip.reass.l4_dst_port;
1727
1728   /* unknown protocol */
1729   if (PREDICT_FALSE (proto == NAT_PROTOCOL_OTHER))
1730     {
1731       /* use current thread */
1732       return vlib_get_thread_index ();
1733     }
1734
1735   if (PREDICT_FALSE (ip0->protocol == IP_PROTOCOL_ICMP))
1736     {
1737       icmp46_header_t *icmp = (icmp46_header_t *) udp;
1738       icmp_echo_header_t *echo = (icmp_echo_header_t *) (icmp + 1);
1739       if (!icmp_type_is_error_message (
1740             vnet_buffer (b)->ip.reass.icmp_type_or_tcp_flags))
1741         port = vnet_buffer (b)->ip.reass.l4_src_port;
1742       else
1743         {
1744           /* if error message, then it's not fragmented and we can access it */
1745           ip4_header_t *inner_ip = (ip4_header_t *) (echo + 1);
1746           proto = ip_proto_to_nat_proto (inner_ip->protocol);
1747           void *l4_header = ip4_next_header (inner_ip);
1748           switch (proto)
1749             {
1750             case NAT_PROTOCOL_ICMP:
1751               icmp = (icmp46_header_t *) l4_header;
1752               echo = (icmp_echo_header_t *) (icmp + 1);
1753               port = echo->identifier;
1754               break;
1755             case NAT_PROTOCOL_UDP:
1756             case NAT_PROTOCOL_TCP:
1757               port = ((tcp_udp_header_t *) l4_header)->src_port;
1758               break;
1759             default:
1760               return vlib_get_thread_index ();
1761             }
1762         }
1763     }
1764
1765   /* try static mappings with port */
1766   if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
1767     {
1768       init_nat_k (&kv, ip0->dst_address, port, rx_fib_index0, proto);
1769       if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
1770                                    &value))
1771         {
1772           m = pool_elt_at_index (nm->static_mappings, value.value);
1773           return m->workers[0];
1774         }
1775     }
1776
1777   /* worker by outside port */
1778   next_worker_index =
1779     nat44_ei_get_thread_idx_by_port (clib_net_to_host_u16 (port));
1780   return next_worker_index;
1781 }
1782
1783 static int
1784 nat44_ei_alloc_default_cb (nat44_ei_address_t *addresses, u32 fib_index,
1785                            u32 thread_index, nat_protocol_t proto,
1786                            ip4_address_t s_addr, ip4_address_t *addr,
1787                            u16 *port, u16 port_per_thread,
1788                            u32 snat_thread_index)
1789 {
1790   nat44_ei_main_t *nm = &nat44_ei_main;
1791   nat44_ei_address_t *a, *ga = 0;
1792   u32 portnum;
1793   int i;
1794
1795   if (vec_len (addresses) > 0)
1796     {
1797       int s_addr_offset = s_addr.as_u32 % vec_len (addresses);
1798
1799       for (i = s_addr_offset; i < vec_len (addresses); ++i)
1800         {
1801           a = addresses + i;
1802
1803           if (a->busy_ports_per_thread[proto][thread_index] < port_per_thread)
1804             {
1805               if (a->fib_index == fib_index)
1806                 {
1807                   while (1)
1808                     {
1809                       portnum = (port_per_thread * snat_thread_index) +
1810                                 nat_random_port (&nm->random_seed, 0,
1811                                                  port_per_thread - 1) +
1812                                 1024;
1813                       if (nat44_ei_port_is_used (a, proto, portnum))
1814                         continue;
1815                       nat44_ei_port_get (a, proto, portnum);
1816                       a->busy_ports_per_thread[proto][thread_index]++;
1817                       a->busy_ports[proto]++;
1818                       *addr = a->addr;
1819                       *port = clib_host_to_net_u16 (portnum);
1820                       return 0;
1821                     }
1822                 }
1823               else if (a->fib_index == ~0)
1824                 {
1825                   ga = a;
1826                 }
1827             }
1828         }
1829
1830       for (i = 0; i < s_addr_offset; ++i)
1831         {
1832           a = addresses + i;
1833           if (a->busy_ports_per_thread[proto][thread_index] < port_per_thread)
1834             {
1835               if (a->fib_index == fib_index)
1836                 {
1837                   while (1)
1838                     {
1839                       portnum = (port_per_thread * snat_thread_index) +
1840                                 nat_random_port (&nm->random_seed, 0,
1841                                                  port_per_thread - 1) +
1842                                 1024;
1843                       if (nat44_ei_port_is_used (a, proto, portnum))
1844                         continue;
1845                       nat44_ei_port_get (a, proto, portnum);
1846                       a->busy_ports_per_thread[proto][thread_index]++;
1847                       a->busy_ports[proto]++;
1848                       *addr = a->addr;
1849                       *port = clib_host_to_net_u16 (portnum);
1850                       return 0;
1851                     }
1852                 }
1853               else if (a->fib_index == ~0)
1854                 {
1855                   ga = a;
1856                 }
1857             }
1858         }
1859
1860       if (ga)
1861         {
1862           a = ga;
1863           if (a->busy_ports_per_thread[proto][thread_index] < port_per_thread)
1864             {
1865               if (a->fib_index == ~0)
1866                 {
1867                   while (1)
1868                     {
1869                       portnum = (port_per_thread * snat_thread_index) +
1870                                 nat_random_port (&nm->random_seed, 0,
1871                                                  port_per_thread - 1) +
1872                                 1024;
1873                       if (nat44_ei_port_is_used (a, proto, portnum))
1874                         continue;
1875                       nat44_ei_port_get (a, proto, portnum);
1876                       a->busy_ports_per_thread[proto][thread_index]++;
1877                       a->busy_ports[proto]++;
1878                       *addr = a->addr;
1879                       *port = clib_host_to_net_u16 (portnum);
1880                       return 0;
1881                     }
1882                 }
1883             }
1884         }
1885     }
1886
1887   /* Totally out of translations to use... */
1888   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1889   return 1;
1890 }
1891
1892 static int
1893 nat44_ei_alloc_range_cb (nat44_ei_address_t *addresses, u32 fib_index,
1894                          u32 thread_index, nat_protocol_t proto,
1895                          ip4_address_t s_addr, ip4_address_t *addr, u16 *port,
1896                          u16 port_per_thread, u32 snat_thread_index)
1897 {
1898   nat44_ei_main_t *nm = &nat44_ei_main;
1899   nat44_ei_address_t *a = addresses;
1900   u16 portnum, ports;
1901
1902   ports = nm->end_port - nm->start_port + 1;
1903
1904   if (!vec_len (addresses))
1905     goto exhausted;
1906
1907   if (a->busy_ports[proto] < ports)
1908     {
1909       while (1)
1910         {
1911           portnum =
1912             nat_random_port (&nm->random_seed, nm->start_port, nm->end_port);
1913           if (nat44_ei_port_is_used (a, proto, portnum))
1914             continue;
1915           nat44_ei_port_get (a, proto, portnum);
1916           a->busy_ports[proto]++;
1917           *addr = a->addr;
1918           *port = clib_host_to_net_u16 (portnum);
1919           return 0;
1920         }
1921     }
1922
1923 exhausted:
1924   /* Totally out of translations to use... */
1925   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1926   return 1;
1927 }
1928
1929 static int
1930 nat44_ei_alloc_mape_cb (nat44_ei_address_t *addresses, u32 fib_index,
1931                         u32 thread_index, nat_protocol_t proto,
1932                         ip4_address_t s_addr, ip4_address_t *addr, u16 *port,
1933                         u16 port_per_thread, u32 snat_thread_index)
1934 {
1935   nat44_ei_main_t *nm = &nat44_ei_main;
1936   nat44_ei_address_t *a = addresses;
1937   u16 m, ports, portnum, A, j;
1938   m = 16 - (nm->psid_offset + nm->psid_length);
1939   ports = (1 << (16 - nm->psid_length)) - (1 << m);
1940
1941   if (!vec_len (addresses))
1942     goto exhausted;
1943
1944   if (a->busy_ports[proto] < ports)
1945     {
1946       while (1)
1947         {
1948           A =
1949             nat_random_port (&nm->random_seed, 1, pow2_mask (nm->psid_offset));
1950           j = nat_random_port (&nm->random_seed, 0, pow2_mask (m));
1951           portnum = A | (nm->psid << nm->psid_offset) | (j << (16 - m));
1952           if (nat44_ei_port_is_used (a, proto, portnum))
1953             continue;
1954           nat44_ei_port_get (a, proto, portnum);
1955           a->busy_ports[proto]++;
1956           *addr = a->addr;
1957           *port = clib_host_to_net_u16 (portnum);
1958           return 0;
1959         }
1960     }
1961
1962 exhausted:
1963   /* Totally out of translations to use... */
1964   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1965   return 1;
1966 }
1967
1968 void
1969 nat44_ei_set_alloc_default ()
1970 {
1971   nat44_ei_main_t *nm = &nat44_ei_main;
1972
1973   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_DEFAULT;
1974   nm->alloc_addr_and_port = nat44_ei_alloc_default_cb;
1975 }
1976
1977 void
1978 nat44_ei_set_alloc_range (u16 start_port, u16 end_port)
1979 {
1980   nat44_ei_main_t *nm = &nat44_ei_main;
1981
1982   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_RANGE;
1983   nm->alloc_addr_and_port = nat44_ei_alloc_range_cb;
1984   nm->start_port = start_port;
1985   nm->end_port = end_port;
1986 }
1987
1988 void
1989 nat44_ei_set_alloc_mape (u16 psid, u16 psid_offset, u16 psid_length)
1990 {
1991   nat44_ei_main_t *nm = &nat44_ei_main;
1992
1993   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_MAPE;
1994   nm->alloc_addr_and_port = nat44_ei_alloc_mape_cb;
1995   nm->psid = psid;
1996   nm->psid_offset = psid_offset;
1997   nm->psid_length = psid_length;
1998 }
1999
2000 void
2001 nat44_ei_delete_session (nat44_ei_main_t *nm, nat44_ei_session_t *ses,
2002                          u32 thread_index)
2003 {
2004   nat44_ei_main_per_thread_data_t *tnm =
2005     vec_elt_at_index (nm->per_thread_data, thread_index);
2006   clib_bihash_kv_8_8_t kv, value;
2007   nat44_ei_user_t *u;
2008   const nat44_ei_user_key_t u_key = { .addr = ses->in2out.addr,
2009                                       .fib_index = ses->in2out.fib_index };
2010   const u8 u_static = nat44_ei_is_session_static (ses);
2011
2012   clib_dlist_remove (tnm->list_pool, ses->per_user_index);
2013   pool_put_index (tnm->list_pool, ses->per_user_index);
2014
2015   pool_put (tnm->sessions, ses);
2016   vlib_set_simple_counter (&nm->total_sessions, thread_index, 0,
2017                            pool_elts (tnm->sessions));
2018
2019   kv.key = u_key.as_u64;
2020   if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
2021     {
2022       u = pool_elt_at_index (tnm->users, value.value);
2023       if (u_static)
2024         u->nstaticsessions--;
2025       else
2026         u->nsessions--;
2027
2028       nat44_ei_delete_user_with_no_session (nm, u, thread_index);
2029     }
2030 }
2031
2032 int
2033 nat44_ei_del_session (nat44_ei_main_t *nm, ip4_address_t *addr, u16 port,
2034                       nat_protocol_t proto, u32 vrf_id, int is_in)
2035 {
2036   nat44_ei_main_per_thread_data_t *tnm;
2037   clib_bihash_kv_8_8_t kv, value;
2038   u32 fib_index;
2039   nat44_ei_session_t *s;
2040   clib_bihash_8_8_t *t;
2041
2042   fail_if_disabled ();
2043
2044   fib_index = fib_table_find (FIB_PROTOCOL_IP4, vrf_id);
2045   init_nat_k (&kv, *addr, port, fib_index, proto);
2046   t = is_in ? &nm->in2out : &nm->out2in;
2047   if (!clib_bihash_search_8_8 (t, &kv, &value))
2048     {
2049       // this is called from API/CLI, so the world is stopped here
2050       // it's safe to manipulate arbitrary per-thread data
2051       u32 thread_index = nat_value_get_thread_index (&value);
2052       tnm = vec_elt_at_index (nm->per_thread_data, thread_index);
2053       u32 session_index = nat_value_get_session_index (&value);
2054       if (pool_is_free_index (tnm->sessions, session_index))
2055         return VNET_API_ERROR_UNSPECIFIED;
2056
2057       s = pool_elt_at_index (tnm->sessions, session_index);
2058       nat44_ei_free_session_data_v2 (nm, s, tnm - nm->per_thread_data, 0);
2059       nat44_ei_delete_session (nm, s, tnm - nm->per_thread_data);
2060       return 0;
2061     }
2062
2063   return VNET_API_ERROR_NO_SUCH_ENTRY;
2064 }
2065
2066 void
2067 nat44_ei_add_del_addr_to_fib (ip4_address_t *addr, u8 p_len, u32 sw_if_index,
2068                               int is_add)
2069 {
2070   nat44_ei_main_t *nm = &nat44_ei_main;
2071   fib_prefix_t prefix = {
2072     .fp_len = p_len,
2073     .fp_proto = FIB_PROTOCOL_IP4,
2074     .fp_addr = {
2075                 .ip4.as_u32 = addr->as_u32,
2076                 },
2077   };
2078   u32 fib_index = ip4_fib_table_get_index_for_sw_if_index (sw_if_index);
2079
2080   if (is_add)
2081     {
2082       fib_table_entry_update_one_path (fib_index, &prefix, nm->fib_src_low,
2083                                        (FIB_ENTRY_FLAG_CONNECTED |
2084                                         FIB_ENTRY_FLAG_LOCAL |
2085                                         FIB_ENTRY_FLAG_EXCLUSIVE),
2086                                        DPO_PROTO_IP4, NULL, sw_if_index, ~0, 1,
2087                                        NULL, FIB_ROUTE_PATH_FLAG_NONE);
2088     }
2089   else
2090     {
2091       fib_table_entry_delete (fib_index, &prefix, nm->fib_src_low);
2092     }
2093 }
2094
2095 int
2096 nat44_ei_reserve_port (ip4_address_t addr, u16 port, nat_protocol_t proto)
2097 {
2098   u32 ti = nat44_ei_get_thread_idx_by_port (port);
2099   nat44_ei_main_t *nm = &nat44_ei_main;
2100   nat44_ei_address_t *a = 0;
2101   int i;
2102
2103   for (i = 0; i < vec_len (nm->addresses); i++)
2104     {
2105       a = nm->addresses + i;
2106
2107       if (a->addr.as_u32 != addr.as_u32)
2108         continue;
2109
2110       if (nat44_ei_port_is_used (a, proto, port))
2111         continue;
2112
2113       nat44_ei_port_get (a, proto, port);
2114       if (port > 1024)
2115         {
2116           a->busy_ports[proto]++;
2117           a->busy_ports_per_thread[proto][ti]++;
2118         }
2119       return 0;
2120     }
2121
2122   return 1;
2123 }
2124
2125 int
2126 nat44_ei_free_port (ip4_address_t addr, u16 port, nat_protocol_t proto)
2127 {
2128   u32 ti = nat44_ei_get_thread_idx_by_port (port);
2129   nat44_ei_main_t *nm = &nat44_ei_main;
2130   nat44_ei_address_t *a = 0;
2131   int i;
2132
2133   for (i = 0; i < vec_len (nm->addresses); i++)
2134     {
2135       a = nm->addresses + i;
2136
2137       if (a->addr.as_u32 != addr.as_u32)
2138         continue;
2139
2140       nat44_ei_port_put (a, proto, port);
2141       if (port > 1024)
2142         {
2143           a->busy_ports[proto]--;
2144           a->busy_ports_per_thread[proto][ti]--;
2145         }
2146       return 0;
2147     }
2148
2149   return 1;
2150 }
2151
2152 void
2153 nat44_ei_add_resolve_record (ip4_address_t l_addr, u16 l_port, u16 e_port,
2154                              nat_protocol_t proto, u32 vrf_id, u32 sw_if_index,
2155                              u32 flags, ip4_address_t pool_addr, u8 *tag)
2156 {
2157   nat44_ei_static_map_resolve_t *rp;
2158   nat44_ei_main_t *nm = &nat44_ei_main;
2159
2160   vec_add2 (nm->to_resolve, rp, 1);
2161   rp->l_addr.as_u32 = l_addr.as_u32;
2162   rp->l_port = l_port;
2163   rp->e_port = e_port;
2164   rp->sw_if_index = sw_if_index;
2165   rp->vrf_id = vrf_id;
2166   rp->proto = proto;
2167   rp->flags = flags;
2168   rp->pool_addr = pool_addr;
2169   rp->tag = vec_dup (tag);
2170 }
2171
2172 int
2173 nat44_ei_get_resolve_record (ip4_address_t l_addr, u16 l_port, u16 e_port,
2174                              nat_protocol_t proto, u32 vrf_id, u32 sw_if_index,
2175                              u32 flags, int *out)
2176 {
2177   nat44_ei_static_map_resolve_t *rp;
2178   nat44_ei_main_t *nm = &nat44_ei_main;
2179   int i;
2180
2181   for (i = 0; i < vec_len (nm->to_resolve); i++)
2182     {
2183       rp = nm->to_resolve + i;
2184
2185       if (rp->sw_if_index == sw_if_index && rp->vrf_id == vrf_id)
2186         {
2187           if (is_sm_identity_nat (rp->flags) && is_sm_identity_nat (flags))
2188             {
2189               if (!(is_sm_addr_only (rp->flags) && is_sm_addr_only (flags)))
2190                 {
2191                   if (rp->e_port != e_port || rp->proto != proto)
2192                     {
2193                       continue;
2194                     }
2195                 }
2196             }
2197           else if (rp->l_addr.as_u32 == l_addr.as_u32)
2198             {
2199               if (!(is_sm_addr_only (rp->flags) && is_sm_addr_only (flags)))
2200                 {
2201                   if (rp->l_port != l_port || rp->e_port != e_port ||
2202                       rp->proto != proto)
2203                     {
2204                       continue;
2205                     }
2206                 }
2207             }
2208           else
2209             {
2210               continue;
2211             }
2212           if (out)
2213             {
2214               *out = i;
2215             }
2216           return 0;
2217         }
2218     }
2219   return 1;
2220 }
2221
2222 int
2223 nat44_ei_del_resolve_record (ip4_address_t l_addr, u16 l_port, u16 e_port,
2224                              nat_protocol_t proto, u32 vrf_id, u32 sw_if_index,
2225                              u32 flags)
2226 {
2227   nat44_ei_main_t *nm = &nat44_ei_main;
2228   int i;
2229   if (!nat44_ei_get_resolve_record (l_addr, l_port, e_port, proto, vrf_id,
2230                                     sw_if_index, flags, &i))
2231     {
2232       vec_del1 (nm->to_resolve, i);
2233       return 0;
2234     }
2235   return 1;
2236 }
2237
2238 void
2239 delete_matching_dynamic_sessions (const nat44_ei_static_mapping_t *m,
2240                                   u32 worker_index)
2241 {
2242   nat44_ei_main_t *nm = &nat44_ei_main;
2243   clib_bihash_kv_8_8_t kv, value;
2244   nat44_ei_session_t *s;
2245   nat44_ei_user_key_t u_key;
2246   nat44_ei_user_t *u;
2247   nat44_ei_main_per_thread_data_t *tnm;
2248   dlist_elt_t *head, *elt;
2249   u32 elt_index, head_index;
2250   u32 ses_index;
2251   u64 user_index;
2252
2253   if (nm->static_mapping_only)
2254     return;
2255
2256   tnm = vec_elt_at_index (nm->per_thread_data, worker_index);
2257
2258   u_key.addr = m->local_addr;
2259   u_key.fib_index = m->fib_index;
2260   kv.key = u_key.as_u64;
2261   if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
2262     {
2263       user_index = value.value;
2264       u = pool_elt_at_index (tnm->users, user_index);
2265       if (u->nsessions)
2266         {
2267           head_index = u->sessions_per_user_list_head_index;
2268           head = pool_elt_at_index (tnm->list_pool, head_index);
2269           elt_index = head->next;
2270           elt = pool_elt_at_index (tnm->list_pool, elt_index);
2271           ses_index = elt->value;
2272           while (ses_index != ~0)
2273             {
2274               s = pool_elt_at_index (tnm->sessions, ses_index);
2275               elt = pool_elt_at_index (tnm->list_pool, elt->next);
2276               ses_index = elt->value;
2277
2278               if (nat44_ei_is_session_static (s))
2279                 continue;
2280
2281               if (!is_sm_addr_only (m->flags) &&
2282                   s->in2out.port != m->local_port)
2283                 continue;
2284
2285               nat44_ei_free_session_data_v2 (nm, s, tnm - nm->per_thread_data,
2286                                              0);
2287               nat44_ei_delete_session (nm, s, tnm - nm->per_thread_data);
2288
2289               if (!is_sm_addr_only (m->flags))
2290                 break;
2291             }
2292         }
2293     }
2294 }
2295
2296 int
2297 nat44_ei_add_static_mapping (ip4_address_t l_addr, ip4_address_t e_addr,
2298                              u16 l_port, u16 e_port, nat_protocol_t proto,
2299                              u32 vrf_id, u32 sw_if_index, u32 flags,
2300                              ip4_address_t pool_addr, u8 *tag)
2301
2302 {
2303   nat44_ei_main_t *nm = &nat44_ei_main;
2304
2305   if (is_sm_switch_address (flags))
2306     {
2307       if (!nat44_ei_get_resolve_record (l_addr, l_port, e_port, proto, vrf_id,
2308                                         sw_if_index, flags, 0))
2309         {
2310           return VNET_API_ERROR_VALUE_EXIST;
2311         }
2312
2313       nat44_ei_add_resolve_record (l_addr, l_port, e_port, proto, vrf_id,
2314                                    sw_if_index, flags, pool_addr, tag);
2315
2316       ip4_address_t *first_int_addr =
2317         ip4_interface_first_address (nm->ip4_main, sw_if_index, 0);
2318       if (!first_int_addr)
2319         {
2320           // dhcp resolution required
2321           return 0;
2322         }
2323
2324       e_addr.as_u32 = first_int_addr->as_u32;
2325     }
2326
2327   return nat44_ei_add_static_mapping_internal (l_addr, e_addr, l_port, e_port,
2328                                                proto, vrf_id, sw_if_index,
2329                                                flags, pool_addr, tag);
2330 }
2331
2332 int
2333 nat44_ei_del_static_mapping (ip4_address_t l_addr, ip4_address_t e_addr,
2334                              u16 l_port, u16 e_port, nat_protocol_t proto,
2335                              u32 vrf_id, u32 sw_if_index, u32 flags)
2336 {
2337   nat44_ei_main_t *nm = &nat44_ei_main;
2338
2339   if (is_sm_switch_address (flags))
2340     {
2341
2342       if (nat44_ei_del_resolve_record (l_addr, l_port, e_port, proto, vrf_id,
2343                                        sw_if_index, flags))
2344         {
2345           return VNET_API_ERROR_NO_SUCH_ENTRY;
2346         }
2347
2348       ip4_address_t *first_int_addr =
2349         ip4_interface_first_address (nm->ip4_main, sw_if_index, 0);
2350       if (!first_int_addr)
2351         {
2352           // dhcp resolution required
2353           return 0;
2354         }
2355
2356       e_addr.as_u32 = first_int_addr->as_u32;
2357     }
2358
2359   return nat44_ei_del_static_mapping_internal (
2360     l_addr, e_addr, l_port, e_port, proto, vrf_id, sw_if_index, flags);
2361 }
2362
2363 static int
2364 nat44_ei_add_static_mapping_internal (ip4_address_t l_addr,
2365                                       ip4_address_t e_addr, u16 l_port,
2366                                       u16 e_port, nat_protocol_t proto,
2367                                       u32 vrf_id, u32 sw_if_index, u32 flags,
2368                                       ip4_address_t pool_addr, u8 *tag)
2369 {
2370   nat44_ei_main_t *nm = &nat44_ei_main;
2371   clib_bihash_kv_8_8_t kv, value;
2372   nat44_ei_lb_addr_port_t *local;
2373   nat44_ei_static_mapping_t *m;
2374   u32 fib_index = ~0;
2375   u32 worker_index;
2376
2377   fail_if_disabled ();
2378
2379   if (is_sm_addr_only (flags))
2380     {
2381       e_port = l_port = proto = 0;
2382     }
2383
2384   if (is_sm_identity_nat (flags))
2385     {
2386       l_port = e_port;
2387       l_addr.as_u32 = e_addr.as_u32;
2388     }
2389
2390   // fib index 0
2391   init_nat_k (&kv, e_addr, e_port, 0, proto);
2392
2393   if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv, &value))
2394     {
2395       m = pool_elt_at_index (nm->static_mappings, value.value);
2396       if (!is_sm_identity_nat (m->flags))
2397         {
2398           return VNET_API_ERROR_VALUE_EXIST;
2399         }
2400
2401       // case:
2402       // adding local identity nat record for different vrf table
2403       pool_foreach (local, m->locals)
2404         {
2405           if (local->vrf_id == vrf_id)
2406             {
2407               return VNET_API_ERROR_VALUE_EXIST;
2408             }
2409         }
2410
2411       pool_get (m->locals, local);
2412
2413       local->vrf_id = vrf_id;
2414       local->fib_index = fib_table_find_or_create_and_lock (
2415         FIB_PROTOCOL_IP4, vrf_id, nm->fib_src_low);
2416
2417       init_nat_kv (&kv, m->local_addr, m->local_port, local->fib_index,
2418                    m->proto, 0, m - nm->static_mappings);
2419       clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 1);
2420
2421       return 0;
2422     }
2423
2424   if (vrf_id != ~0)
2425     {
2426       fib_index = fib_table_find_or_create_and_lock (FIB_PROTOCOL_IP4, vrf_id,
2427                                                      nm->fib_src_low);
2428     }
2429   else
2430     {
2431       // fallback to default vrf
2432       vrf_id = nm->inside_vrf_id;
2433       fib_index = nm->inside_fib_index;
2434       fib_table_lock (fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
2435     }
2436
2437   if (!is_sm_identity_nat (flags))
2438     {
2439       init_nat_k (&kv, l_addr, l_port, fib_index, proto);
2440       if (!clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv, &value))
2441         {
2442           return VNET_API_ERROR_VALUE_EXIST;
2443         }
2444     }
2445
2446   if (!(is_sm_addr_only (flags) || nm->static_mapping_only))
2447     {
2448       if (nat44_ei_reserve_port (e_addr, e_port, proto))
2449         {
2450           // remove resolve record
2451           if ((is_sm_switch_address (flags)) && !is_sm_identity_nat (flags))
2452             {
2453               nat44_ei_del_resolve_record (l_addr, l_port, e_port, proto,
2454                                            vrf_id, sw_if_index, flags);
2455             }
2456           return VNET_API_ERROR_NO_SUCH_ENTRY;
2457         }
2458     }
2459
2460   pool_get (nm->static_mappings, m);
2461   clib_memset (m, 0, sizeof (*m));
2462
2463   m->flags = flags;
2464   m->local_addr = l_addr;
2465   m->external_addr = e_addr;
2466
2467   m->tag = vec_dup (tag);
2468
2469   if (!is_sm_addr_only (flags))
2470     {
2471       m->local_port = l_port;
2472       m->external_port = e_port;
2473       m->proto = proto;
2474     }
2475
2476   if (is_sm_identity_nat (flags))
2477     {
2478       pool_get (m->locals, local);
2479
2480       local->vrf_id = vrf_id;
2481       local->fib_index = fib_index;
2482     }
2483   else
2484     {
2485       m->vrf_id = vrf_id;
2486       m->fib_index = fib_index;
2487     }
2488
2489   init_nat_kv (&kv, m->local_addr, m->local_port, fib_index, m->proto, 0,
2490                m - nm->static_mappings);
2491   clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 1);
2492
2493   init_nat_kv (&kv, m->external_addr, m->external_port, 0, m->proto, 0,
2494                m - nm->static_mappings);
2495   clib_bihash_add_del_8_8 (&nm->static_mapping_by_external, &kv, 1);
2496
2497   if (nm->num_workers > 1)
2498     {
2499       // store worker index for this record
2500       ip4_header_t ip = {
2501         .src_address = m->local_addr,
2502       };
2503       worker_index = nat44_ei_get_in2out_worker_index (&ip, m->fib_index, 0);
2504       vec_add1 (m->workers, worker_index);
2505     }
2506   else
2507     {
2508       worker_index = nm->num_workers;
2509     }
2510   delete_matching_dynamic_sessions (m, worker_index);
2511
2512   if (is_sm_addr_only (flags))
2513     {
2514       nat44_ei_add_del_addr_to_fib_foreach_out_if (&e_addr, 1);
2515     }
2516
2517   return 0;
2518 }
2519
2520 static int
2521 nat44_ei_del_static_mapping_internal (ip4_address_t l_addr,
2522                                       ip4_address_t e_addr, u16 l_port,
2523                                       u16 e_port, nat_protocol_t proto,
2524                                       u32 vrf_id, u32 sw_if_index, u32 flags)
2525 {
2526   nat44_ei_main_per_thread_data_t *tnm;
2527   nat44_ei_main_t *nm = &nat44_ei_main;
2528   clib_bihash_kv_8_8_t kv, value;
2529   nat44_ei_lb_addr_port_t *local;
2530   nat44_ei_static_mapping_t *m;
2531   u32 fib_index = ~0;
2532   nat44_ei_user_key_t u_key;
2533
2534   fail_if_disabled ();
2535
2536   if (is_sm_addr_only (flags))
2537     {
2538       e_port = l_port = proto = 0;
2539     }
2540
2541   if (is_sm_identity_nat (flags))
2542     {
2543       l_port = e_port;
2544       l_addr.as_u32 = e_addr.as_u32;
2545     }
2546
2547   // fib index 0
2548   init_nat_k (&kv, e_addr, e_port, 0, proto);
2549
2550   if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv, &value))
2551     {
2552       if (is_sm_switch_address (flags))
2553         {
2554           return 0;
2555         }
2556       return VNET_API_ERROR_NO_SUCH_ENTRY;
2557     }
2558
2559   m = pool_elt_at_index (nm->static_mappings, value.value);
2560
2561   if (is_sm_identity_nat (flags))
2562     {
2563       u8 found = 0;
2564
2565       if (vrf_id == ~0)
2566         {
2567           vrf_id = nm->inside_vrf_id;
2568         }
2569
2570       pool_foreach (local, m->locals)
2571         {
2572           if (local->vrf_id == vrf_id)
2573             {
2574               local = pool_elt_at_index (m->locals, local - m->locals);
2575               fib_index = local->fib_index;
2576               pool_put (m->locals, local);
2577               found = 1;
2578             }
2579         }
2580       if (!found)
2581         {
2582           return VNET_API_ERROR_NO_SUCH_ENTRY;
2583         }
2584     }
2585   else
2586     {
2587       fib_index = m->fib_index;
2588     }
2589
2590   if (!(is_sm_addr_only (flags) || nm->static_mapping_only))
2591     {
2592       if (nat44_ei_free_port (e_addr, e_port, proto))
2593         {
2594           return VNET_API_ERROR_INVALID_VALUE;
2595         }
2596     }
2597
2598   init_nat_k (&kv, l_addr, l_port, fib_index, proto);
2599   clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 0);
2600
2601   if (!nm->static_mapping_only || nm->static_mapping_connection_tracking)
2602     {
2603       // delete sessions for static mapping
2604       if (nm->num_workers > 1)
2605         tnm = vec_elt_at_index (nm->per_thread_data, m->workers[0]);
2606       else
2607         tnm = vec_elt_at_index (nm->per_thread_data, nm->num_workers);
2608
2609       u_key.addr = m->local_addr;
2610       u_key.fib_index = fib_index;
2611       kv.key = u_key.as_u64;
2612       nat44_ei_static_mapping_del_sessions (
2613         nm, tnm, u_key, is_sm_addr_only (flags), e_addr, e_port);
2614     }
2615
2616   fib_table_unlock (fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
2617
2618   if (!pool_elts (m->locals))
2619     {
2620       // this is last record remove all required stuff
2621       // fib_index 0
2622       init_nat_k (&kv, e_addr, e_port, 0, proto);
2623       clib_bihash_add_del_8_8 (&nm->static_mapping_by_external, &kv, 0);
2624
2625       vec_free (m->tag);
2626       vec_free (m->workers);
2627       pool_put (nm->static_mappings, m);
2628
2629       if (is_sm_addr_only (flags) && !is_sm_identity_nat (flags))
2630         {
2631           nat44_ei_add_del_addr_to_fib_foreach_out_if (&e_addr, 0);
2632         }
2633     }
2634
2635   return 0;
2636 }
2637
2638 int
2639 nat44_ei_static_mapping_match (ip4_address_t match_addr, u16 match_port,
2640                                u32 match_fib_index,
2641                                nat_protocol_t match_protocol,
2642                                ip4_address_t *mapping_addr, u16 *mapping_port,
2643                                u32 *mapping_fib_index, u8 by_external,
2644                                u8 *is_addr_only, u8 *is_identity_nat)
2645 {
2646   nat44_ei_main_t *nm = &nat44_ei_main;
2647   clib_bihash_kv_8_8_t kv, value;
2648   nat44_ei_static_mapping_t *m;
2649   u16 port;
2650
2651   if (by_external)
2652     {
2653       init_nat_k (&kv, match_addr, match_port, 0, match_protocol);
2654       if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
2655                                   &value))
2656         {
2657           /* Try address only mapping */
2658           init_nat_k (&kv, match_addr, 0, 0, 0);
2659           if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
2660                                       &value))
2661             return 1;
2662         }
2663       m = pool_elt_at_index (nm->static_mappings, value.value);
2664
2665       *mapping_fib_index = m->fib_index;
2666       *mapping_addr = m->local_addr;
2667       port = m->local_port;
2668     }
2669   else
2670     {
2671       init_nat_k (&kv, match_addr, match_port, match_fib_index,
2672                   match_protocol);
2673       if (clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv, &value))
2674         {
2675           /* Try address only mapping */
2676           init_nat_k (&kv, match_addr, 0, match_fib_index, 0);
2677           if (clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv,
2678                                       &value))
2679             return 1;
2680         }
2681       m = pool_elt_at_index (nm->static_mappings, value.value);
2682
2683       *mapping_fib_index = nm->outside_fib_index;
2684       *mapping_addr = m->external_addr;
2685       port = m->external_port;
2686     }
2687
2688   /* Address only mapping doesn't change port */
2689   if (is_sm_addr_only (m->flags))
2690     *mapping_port = match_port;
2691   else
2692     *mapping_port = port;
2693
2694   if (PREDICT_FALSE (is_addr_only != 0))
2695     *is_addr_only = is_sm_addr_only (m->flags);
2696
2697   if (PREDICT_FALSE (is_identity_nat != 0))
2698     *is_identity_nat = is_sm_identity_nat (m->flags);
2699
2700   return 0;
2701 }
2702
2703 static void
2704 nat44_ei_worker_db_free (nat44_ei_main_per_thread_data_t *tnm)
2705 {
2706   pool_free (tnm->list_pool);
2707   pool_free (tnm->lru_pool);
2708   pool_free (tnm->sessions);
2709   pool_free (tnm->users);
2710
2711   clib_bihash_free_8_8 (&tnm->user_hash);
2712 }
2713
2714 u8 *
2715 format_nat44_ei_key (u8 *s, va_list *args)
2716 {
2717   u64 key = va_arg (*args, u64);
2718
2719   ip4_address_t addr;
2720   u16 port;
2721   nat_protocol_t protocol;
2722   u32 fib_index;
2723
2724   split_nat_key (key, &addr, &port, &fib_index, &protocol);
2725
2726   s = format (s, "%U proto %U port %d fib %d", format_ip4_address, &addr,
2727               format_nat_protocol, protocol, clib_net_to_host_u16 (port),
2728               fib_index);
2729   return s;
2730 }
2731
2732 u8 *
2733 format_nat44_ei_user_kvp (u8 *s, va_list *args)
2734 {
2735   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2736   nat44_ei_user_key_t k;
2737
2738   k.as_u64 = v->key;
2739
2740   s = format (s, "%U fib %d user-index %llu", format_ip4_address, &k.addr,
2741               k.fib_index, v->value);
2742
2743   return s;
2744 }
2745
2746 u8 *
2747 format_nat44_ei_session_kvp (u8 *s, va_list *args)
2748 {
2749   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2750
2751   s = format (s, "%U thread-index %llu session-index %llu",
2752               format_nat44_ei_key, v->key, nat_value_get_thread_index (v),
2753               nat_value_get_session_index (v));
2754
2755   return s;
2756 }
2757
2758 u8 *
2759 format_nat44_ei_static_mapping_kvp (u8 *s, va_list *args)
2760 {
2761   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2762
2763   s = format (s, "%U static-mapping-index %llu", format_nat44_ei_key, v->key,
2764               v->value);
2765
2766   return s;
2767 }
2768
2769 static void
2770 nat44_ei_worker_db_init (nat44_ei_main_per_thread_data_t *tnm,
2771                          u32 translations, u32 translation_buckets,
2772                          u32 user_buckets)
2773 {
2774   dlist_elt_t *head;
2775
2776   pool_alloc (tnm->list_pool, translations);
2777   pool_alloc (tnm->lru_pool, translations);
2778   pool_alloc (tnm->sessions, translations);
2779
2780   clib_bihash_init_8_8 (&tnm->user_hash, "users", user_buckets, 0);
2781
2782   clib_bihash_set_kvp_format_fn_8_8 (&tnm->user_hash,
2783                                      format_nat44_ei_user_kvp);
2784
2785   pool_get (tnm->lru_pool, head);
2786   tnm->tcp_trans_lru_head_index = head - tnm->lru_pool;
2787   clib_dlist_init (tnm->lru_pool, tnm->tcp_trans_lru_head_index);
2788
2789   pool_get (tnm->lru_pool, head);
2790   tnm->tcp_estab_lru_head_index = head - tnm->lru_pool;
2791   clib_dlist_init (tnm->lru_pool, tnm->tcp_estab_lru_head_index);
2792
2793   pool_get (tnm->lru_pool, head);
2794   tnm->udp_lru_head_index = head - tnm->lru_pool;
2795   clib_dlist_init (tnm->lru_pool, tnm->udp_lru_head_index);
2796
2797   pool_get (tnm->lru_pool, head);
2798   tnm->icmp_lru_head_index = head - tnm->lru_pool;
2799   clib_dlist_init (tnm->lru_pool, tnm->icmp_lru_head_index);
2800
2801   pool_get (tnm->lru_pool, head);
2802   tnm->unk_proto_lru_head_index = head - tnm->lru_pool;
2803   clib_dlist_init (tnm->lru_pool, tnm->unk_proto_lru_head_index);
2804 }
2805
2806 static void
2807 nat44_ei_db_init (u32 translations, u32 translation_buckets, u32 user_buckets)
2808 {
2809   nat44_ei_main_t *nm = &nat44_ei_main;
2810   nat44_ei_main_per_thread_data_t *tnm;
2811
2812   u32 static_mapping_buckets = 1024;
2813   u32 static_mapping_memory_size = 64 << 20;
2814
2815   clib_bihash_init_8_8 (&nm->static_mapping_by_local,
2816                         "static_mapping_by_local", static_mapping_buckets,
2817                         static_mapping_memory_size);
2818   clib_bihash_init_8_8 (&nm->static_mapping_by_external,
2819                         "static_mapping_by_external", static_mapping_buckets,
2820                         static_mapping_memory_size);
2821   clib_bihash_set_kvp_format_fn_8_8 (&nm->static_mapping_by_local,
2822                                      format_nat44_ei_static_mapping_kvp);
2823   clib_bihash_set_kvp_format_fn_8_8 (&nm->static_mapping_by_external,
2824                                      format_nat44_ei_static_mapping_kvp);
2825
2826   if (nm->pat)
2827     {
2828       clib_bihash_init_8_8 (&nm->in2out, "in2out", translation_buckets, 0);
2829       clib_bihash_init_8_8 (&nm->out2in, "out2in", translation_buckets, 0);
2830       clib_bihash_set_kvp_format_fn_8_8 (&nm->in2out,
2831                                          format_nat44_ei_session_kvp);
2832       clib_bihash_set_kvp_format_fn_8_8 (&nm->out2in,
2833                                          format_nat44_ei_session_kvp);
2834       vec_foreach (tnm, nm->per_thread_data)
2835         {
2836           nat44_ei_worker_db_init (tnm, translations, translation_buckets,
2837                                    user_buckets);
2838         }
2839     }
2840 }
2841
2842 void
2843 nat44_ei_sessions_clear ()
2844 {
2845   nat44_ei_main_t *nm = &nat44_ei_main;
2846   nat44_ei_main_per_thread_data_t *tnm;
2847
2848   if (nm->pat)
2849     {
2850       clib_bihash_free_8_8 (&nm->in2out);
2851       clib_bihash_free_8_8 (&nm->out2in);
2852       clib_bihash_init_8_8 (&nm->in2out, "in2out", nm->translation_buckets, 0);
2853       clib_bihash_init_8_8 (&nm->out2in, "out2in", nm->translation_buckets, 0);
2854       clib_bihash_set_kvp_format_fn_8_8 (&nm->in2out,
2855                                          format_nat44_ei_session_kvp);
2856       clib_bihash_set_kvp_format_fn_8_8 (&nm->out2in,
2857                                          format_nat44_ei_session_kvp);
2858       vec_foreach (tnm, nm->per_thread_data)
2859         {
2860           nat44_ei_worker_db_free (tnm);
2861           nat44_ei_worker_db_init (tnm, nm->translations,
2862                                    nm->translation_buckets, nm->user_buckets);
2863         }
2864     }
2865
2866   vlib_zero_simple_counter (&nm->total_users, 0);
2867   vlib_zero_simple_counter (&nm->total_sessions, 0);
2868   vlib_zero_simple_counter (&nm->user_limit_reached, 0);
2869 }
2870
2871 static void
2872 nat44_ei_update_outside_fib (ip4_main_t *im, uword opaque, u32 sw_if_index,
2873                              u32 new_fib_index, u32 old_fib_index)
2874 {
2875   nat44_ei_main_t *nm = &nat44_ei_main;
2876   nat44_ei_outside_fib_t *outside_fib;
2877   nat44_ei_interface_t *i;
2878   u8 is_add = 1;
2879   u8 match = 0;
2880
2881   if (!nm->enabled || (new_fib_index == old_fib_index) ||
2882       (!vec_len (nm->outside_fibs)))
2883     {
2884       return;
2885     }
2886
2887   pool_foreach (i, nm->interfaces)
2888     {
2889       if (i->sw_if_index == sw_if_index)
2890         {
2891           if (!(nat44_ei_interface_is_outside (i)))
2892             return;
2893           match = 1;
2894         }
2895     }
2896
2897   pool_foreach (i, nm->output_feature_interfaces)
2898     {
2899       if (i->sw_if_index == sw_if_index)
2900         {
2901           if (!(nat44_ei_interface_is_outside (i)))
2902             return;
2903           match = 1;
2904         }
2905     }
2906
2907   if (!match)
2908     return;
2909
2910   vec_foreach (outside_fib, nm->outside_fibs)
2911     {
2912       if (outside_fib->fib_index == old_fib_index)
2913         {
2914           outside_fib->refcount--;
2915           if (!outside_fib->refcount)
2916             vec_del1 (nm->outside_fibs, outside_fib - nm->outside_fibs);
2917           break;
2918         }
2919     }
2920
2921   vec_foreach (outside_fib, nm->outside_fibs)
2922     {
2923       if (outside_fib->fib_index == new_fib_index)
2924         {
2925           outside_fib->refcount++;
2926           is_add = 0;
2927           break;
2928         }
2929     }
2930
2931   if (is_add)
2932     {
2933       vec_add2 (nm->outside_fibs, outside_fib, 1);
2934       outside_fib->refcount = 1;
2935       outside_fib->fib_index = new_fib_index;
2936     }
2937 }
2938
2939 int
2940 nat44_ei_add_address (ip4_address_t *addr, u32 vrf_id)
2941 {
2942   nat44_ei_main_t *nm = &nat44_ei_main;
2943   vlib_thread_main_t *tm = vlib_get_thread_main ();
2944   nat44_ei_address_t *ap;
2945
2946   fail_if_disabled ();
2947
2948   /* Check if address already exists */
2949   vec_foreach (ap, nm->addresses)
2950     {
2951       if (ap->addr.as_u32 == addr->as_u32)
2952         {
2953           nat44_ei_log_err ("address exist");
2954           return VNET_API_ERROR_VALUE_EXIST;
2955         }
2956     }
2957
2958   vec_add2 (nm->addresses, ap, 1);
2959
2960   ap->fib_index = ~0;
2961   ap->addr = *addr;
2962
2963   if (vrf_id != ~0)
2964     {
2965       ap->fib_index = fib_table_find_or_create_and_lock (
2966         FIB_PROTOCOL_IP4, vrf_id, nm->fib_src_low);
2967     }
2968
2969   nat_protocol_t proto;
2970   for (proto = 0; proto < NAT_N_PROTOCOLS; ++proto)
2971     {
2972       ap->busy_port_bitmap[proto] = 0;
2973       ap->busy_ports[proto] = 0;
2974       ap->busy_ports_per_thread[proto] = 0;
2975       vec_validate_init_empty (ap->busy_ports_per_thread[proto],
2976                                tm->n_vlib_mains - 1, 0);
2977     }
2978
2979     nat44_ei_add_del_addr_to_fib_foreach_out_if (addr, 1);
2980
2981   return 0;
2982 }
2983
2984 int
2985 nat44_ei_del_address (ip4_address_t addr, u8 delete_sm)
2986 {
2987   nat44_ei_main_t *nm = &nat44_ei_main;
2988   nat44_ei_address_t *a = 0;
2989   nat44_ei_session_t *ses;
2990   u32 *ses_to_be_removed = 0, *ses_index;
2991   nat44_ei_main_per_thread_data_t *tnm;
2992   nat44_ei_static_mapping_t *m;
2993   int j;
2994
2995   fail_if_disabled ();
2996
2997   /* Find SNAT address */
2998   for (j = 0; j < vec_len (nm->addresses); j++)
2999     {
3000       if (nm->addresses[j].addr.as_u32 == addr.as_u32)
3001         {
3002           a = nm->addresses + j;
3003           break;
3004         }
3005     }
3006   if (!a)
3007     {
3008       nat44_ei_log_err ("no such address");
3009       return VNET_API_ERROR_NO_SUCH_ENTRY;
3010     }
3011
3012   if (delete_sm)
3013     {
3014       pool_foreach (m, nm->static_mappings)
3015         {
3016           if (m->external_addr.as_u32 == addr.as_u32)
3017             nat44_ei_del_static_mapping_internal (
3018               m->local_addr, m->external_addr, m->local_port, m->external_port,
3019               m->proto, m->vrf_id, ~0, m->flags);
3020         }
3021     }
3022   else
3023     {
3024       /* Check if address is used in some static mapping */
3025       if (nat44_ei_is_address_used_in_static_mapping (addr))
3026         {
3027           nat44_ei_log_err ("address used in static mapping");
3028           return VNET_API_ERROR_UNSPECIFIED;
3029         }
3030     }
3031
3032   /* Delete sessions using address */
3033   if (a->busy_ports[NAT_PROTOCOL_TCP] || a->busy_ports[NAT_PROTOCOL_UDP] ||
3034       a->busy_ports[NAT_PROTOCOL_ICMP])
3035     {
3036       vec_foreach (tnm, nm->per_thread_data)
3037         {
3038           pool_foreach (ses, tnm->sessions)
3039             {
3040               if (ses->out2in.addr.as_u32 == addr.as_u32)
3041                 {
3042                   nat44_ei_free_session_data (nm, ses,
3043                                               tnm - nm->per_thread_data, 0);
3044                   vec_add1 (ses_to_be_removed, ses - tnm->sessions);
3045                 }
3046             }
3047           vec_foreach (ses_index, ses_to_be_removed)
3048             {
3049               ses = pool_elt_at_index (tnm->sessions, ses_index[0]);
3050               nat44_ei_delete_session (nm, ses, tnm - nm->per_thread_data);
3051             }
3052           vec_free (ses_to_be_removed);
3053         }
3054     }
3055
3056   nat44_ei_add_del_addr_to_fib_foreach_out_if (&addr, 0);
3057
3058   if (a->fib_index != ~0)
3059     {
3060       fib_table_unlock (a->fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
3061     }
3062
3063   nat_protocol_t proto;
3064   for (proto = 0; proto < NAT_N_PROTOCOLS; ++proto)
3065     {
3066       vec_free (a->busy_ports_per_thread[proto]);
3067     }
3068
3069   vec_del1 (nm->addresses, j);
3070   return 0;
3071 }
3072
3073 int
3074 nat44_ei_add_interface_address (u32 sw_if_index)
3075 {
3076   nat44_ei_main_t *nm = &nat44_ei_main;
3077   ip4_main_t *ip4_main = nm->ip4_main;
3078   ip4_address_t *first_int_addr;
3079   u32 *auto_add_sw_if_indices = nm->auto_add_sw_if_indices;
3080   int i;
3081
3082   for (i = 0; i < vec_len (auto_add_sw_if_indices); i++)
3083     {
3084       if (auto_add_sw_if_indices[i] == sw_if_index)
3085         {
3086           return VNET_API_ERROR_VALUE_EXIST;
3087         }
3088     }
3089
3090   /* add to the auto-address list */
3091   vec_add1 (nm->auto_add_sw_if_indices, sw_if_index);
3092
3093   // if the address is already bound - or static - add it now
3094   first_int_addr = ip4_interface_first_address (ip4_main, sw_if_index, 0);
3095   if (first_int_addr)
3096     {
3097       (void) nat44_ei_add_address (first_int_addr, ~0);
3098     }
3099
3100   return 0;
3101 }
3102
3103 int
3104 nat44_ei_del_interface_address (u32 sw_if_index)
3105 {
3106   nat44_ei_main_t *nm = &nat44_ei_main;
3107   ip4_main_t *ip4_main = nm->ip4_main;
3108   ip4_address_t *first_int_addr;
3109   nat44_ei_static_map_resolve_t *rp;
3110   u32 *indices_to_delete = 0;
3111   int i, j;
3112   u32 *auto_add_sw_if_indices = nm->auto_add_sw_if_indices;
3113
3114   fail_if_disabled ();
3115
3116   first_int_addr = ip4_interface_first_address (ip4_main, sw_if_index, 0);
3117
3118   for (i = 0; i < vec_len (auto_add_sw_if_indices); i++)
3119     {
3120       if (auto_add_sw_if_indices[i] == sw_if_index)
3121         {
3122           first_int_addr =
3123             ip4_interface_first_address (ip4_main, sw_if_index, 0);
3124           if (first_int_addr)
3125             {
3126               (void) nat44_ei_del_address (first_int_addr[0], 1);
3127             }
3128           else
3129             {
3130               for (j = 0; j < vec_len (nm->to_resolve); j++)
3131                 {
3132                   rp = nm->to_resolve + j;
3133                   if (rp->sw_if_index == sw_if_index)
3134                     {
3135                       vec_add1 (indices_to_delete, j);
3136                     }
3137                 }
3138               if (vec_len (indices_to_delete))
3139                 {
3140                   for (j = vec_len (indices_to_delete) - 1; j >= 0; j--)
3141                     {
3142                       vec_del1 (nm->to_resolve, j);
3143                     }
3144                   vec_free (indices_to_delete);
3145                 }
3146             }
3147
3148           vec_del1 (nm->auto_add_sw_if_indices, i);
3149           return 0;
3150         }
3151     }
3152   return VNET_API_ERROR_NO_SUCH_ENTRY;
3153 }
3154
3155 static_always_inline int
3156 is_sw_if_index_reg_for_auto_resolve (u32 *sw_if_indices, u32 sw_if_index)
3157 {
3158   u32 *i;
3159   vec_foreach (i, sw_if_indices)
3160     {
3161       if (*i == sw_if_index)
3162         {
3163           return 1;
3164         }
3165     }
3166   return 0;
3167 }
3168
3169 static void
3170 nat44_ei_ip4_add_del_interface_address_cb (ip4_main_t *im, uword opaque,
3171                                            u32 sw_if_index,
3172                                            ip4_address_t *address,
3173                                            u32 address_length,
3174                                            u32 if_address_index, u32 is_delete)
3175 {
3176   nat44_ei_main_t *nm = &nat44_ei_main;
3177   nat44_ei_static_map_resolve_t *rp;
3178   nat44_ei_address_t *addresses = nm->addresses;
3179   int rv, i;
3180
3181   if (!nm->enabled)
3182     {
3183       return;
3184     }
3185
3186   if (!is_sw_if_index_reg_for_auto_resolve (nm->auto_add_sw_if_indices,
3187                                             sw_if_index))
3188     {
3189       return;
3190     }
3191
3192   if (!is_delete)
3193     {
3194       /* Don't trip over lease renewal, static config */
3195       for (i = 0; i < vec_len (addresses); i++)
3196         {
3197           if (addresses[i].addr.as_u32 == address->as_u32)
3198             {
3199               return;
3200             }
3201         }
3202
3203       (void) nat44_ei_add_address (address, ~0);
3204
3205       /* Scan static map resolution vector */
3206       for (i = 0; i < vec_len (nm->to_resolve); i++)
3207         {
3208           rp = nm->to_resolve + i;
3209           if (is_sm_addr_only (rp->flags))
3210             {
3211               continue;
3212             }
3213           /* On this interface? */
3214           if (rp->sw_if_index == sw_if_index)
3215             {
3216               rv = nat44_ei_add_static_mapping_internal (
3217                 rp->l_addr, address[0], rp->l_port, rp->e_port, rp->proto,
3218                 rp->vrf_id, ~0, rp->flags, rp->pool_addr, rp->tag);
3219               if (rv)
3220                 {
3221                   nat_elog_notice_X1 (
3222                     nm, "add_static_mapping_internal returned %d", "i4", rv);
3223                 }
3224             }
3225         }
3226     }
3227   else
3228     {
3229       // remove all static mapping records
3230       (void) nat44_ei_del_address (address[0], 1);
3231     }
3232 }
3233
3234 int
3235 nat44_ei_set_frame_queue_nelts (u32 frame_queue_nelts)
3236 {
3237   fail_if_enabled ();
3238   nat44_ei_main_t *nm = &nat44_ei_main;
3239   nm->frame_queue_nelts = frame_queue_nelts;
3240   return 0;
3241 }
3242
3243 static void
3244 nat44_ei_ip4_add_del_addr_only_sm_cb (ip4_main_t *im, uword opaque,
3245                                       u32 sw_if_index, ip4_address_t *address,
3246                                       u32 address_length, u32 if_address_index,
3247                                       u32 is_delete)
3248 {
3249   nat44_ei_main_t *nm = &nat44_ei_main;
3250   nat44_ei_static_map_resolve_t *rp;
3251   nat44_ei_static_mapping_t *m;
3252   clib_bihash_kv_8_8_t kv, value;
3253   int i, rv = 0, match = 0;
3254
3255   if (!nm->enabled)
3256     {
3257       return;
3258     }
3259
3260   for (i = 0; i < vec_len (nm->to_resolve); i++)
3261     {
3262       rp = nm->to_resolve + i;
3263
3264       if (is_sm_addr_only (rp->flags) && rp->sw_if_index == sw_if_index)
3265         {
3266           match = 1;
3267           break;
3268         }
3269     }
3270
3271   if (!match)
3272     {
3273       return;
3274     }
3275
3276   init_nat_k (&kv, *address, is_sm_addr_only (rp->flags) ? 0 : rp->e_port,
3277               nm->outside_fib_index,
3278               is_sm_addr_only (rp->flags) ? 0 : rp->proto);
3279   if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv, &value))
3280     m = 0;
3281   else
3282     m = pool_elt_at_index (nm->static_mappings, value.value);
3283
3284   if (is_delete)
3285     {
3286       if (!m)
3287         return;
3288       rv = nat44_ei_del_static_mapping_internal (
3289         rp->l_addr, address[0], rp->l_port, rp->e_port, rp->proto, rp->vrf_id,
3290         ~0, rp->flags);
3291       if (rv)
3292         {
3293           nat_elog_notice_X1 (nm, "nat44_ei_del_static_mapping returned %d",
3294                               "i4", rv);
3295         }
3296     }
3297   else
3298     {
3299       if (m)
3300         return;
3301       rv = nat44_ei_add_static_mapping_internal (
3302         rp->l_addr, address[0], rp->l_port, rp->e_port, rp->proto, rp->vrf_id,
3303         ~0, rp->flags, rp->pool_addr, rp->tag);
3304
3305       if (rv)
3306         {
3307           nat_elog_notice_X1 (nm, "nat44_ei_add_static_mapping returned %d",
3308                               "i4", rv);
3309         }
3310     }
3311 }
3312
3313 static_always_inline uword
3314 nat44_ei_classify_inline_fn (vlib_main_t *vm, vlib_node_runtime_t *node,
3315                              vlib_frame_t *frame)
3316 {
3317   u32 n_left_from, *from, *to_next;
3318   nat44_ei_classify_next_t next_index;
3319   nat44_ei_main_t *nm = &nat44_ei_main;
3320   nat44_ei_static_mapping_t *m;
3321   u32 next_in2out = 0, next_out2in = 0;
3322
3323   from = vlib_frame_vector_args (frame);
3324   n_left_from = frame->n_vectors;
3325   next_index = node->cached_next_index;
3326
3327   while (n_left_from > 0)
3328     {
3329       u32 n_left_to_next;
3330
3331       vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
3332
3333       while (n_left_from > 0 && n_left_to_next > 0)
3334         {
3335           u32 bi0;
3336           vlib_buffer_t *b0;
3337           u32 next0 = NAT44_EI_CLASSIFY_NEXT_IN2OUT;
3338           ip4_header_t *ip0;
3339           nat44_ei_address_t *ap;
3340           clib_bihash_kv_8_8_t kv0, value0;
3341
3342           /* speculatively enqueue b0 to the current next frame */
3343           bi0 = from[0];
3344           to_next[0] = bi0;
3345           from += 1;
3346           to_next += 1;
3347           n_left_from -= 1;
3348           n_left_to_next -= 1;
3349
3350           b0 = vlib_get_buffer (vm, bi0);
3351           ip0 = vlib_buffer_get_current (b0);
3352
3353           vec_foreach (ap, nm->addresses)
3354             {
3355               if (ip0->dst_address.as_u32 == ap->addr.as_u32)
3356                 {
3357                   next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3358                   goto enqueue0;
3359                 }
3360             }
3361
3362           if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
3363             {
3364               init_nat_k (&kv0, ip0->dst_address, 0, 0, 0);
3365               /* try to classify the fragment based on IP header alone */
3366               if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external,
3367                                            &kv0, &value0))
3368                 {
3369                   m = pool_elt_at_index (nm->static_mappings, value0.value);
3370                   if (m->local_addr.as_u32 != m->external_addr.as_u32)
3371                     next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3372                   goto enqueue0;
3373                 }
3374               init_nat_k (&kv0, ip0->dst_address,
3375                           vnet_buffer (b0)->ip.reass.l4_dst_port, 0,
3376                           ip_proto_to_nat_proto (ip0->protocol));
3377               if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external,
3378                                            &kv0, &value0))
3379                 {
3380                   m = pool_elt_at_index (nm->static_mappings, value0.value);
3381                   if (m->local_addr.as_u32 != m->external_addr.as_u32)
3382                     next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3383                 }
3384             }
3385
3386         enqueue0:
3387           if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE) &&
3388                              (b0->flags & VLIB_BUFFER_IS_TRACED)))
3389             {
3390               nat44_ei_classify_trace_t *t =
3391                 vlib_add_trace (vm, node, b0, sizeof (*t));
3392               t->cached = 0;
3393               t->next_in2out = next0 == NAT44_EI_CLASSIFY_NEXT_IN2OUT ? 1 : 0;
3394             }
3395
3396           next_in2out += next0 == NAT44_EI_CLASSIFY_NEXT_IN2OUT;
3397           next_out2in += next0 == NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3398
3399           /* verify speculative enqueue, maybe switch current next frame */
3400           vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
3401                                            n_left_to_next, bi0, next0);
3402         }
3403
3404       vlib_put_next_frame (vm, node, next_index, n_left_to_next);
3405     }
3406
3407   vlib_node_increment_counter (
3408     vm, node->node_index, NAT44_EI_CLASSIFY_ERROR_NEXT_IN2OUT, next_in2out);
3409   vlib_node_increment_counter (
3410     vm, node->node_index, NAT44_EI_CLASSIFY_ERROR_NEXT_OUT2IN, next_out2in);
3411   return frame->n_vectors;
3412 }
3413
3414 VLIB_NODE_FN (nat44_ei_classify_node)
3415 (vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
3416 {
3417   return nat44_ei_classify_inline_fn (vm, node, frame);
3418 }
3419
3420 VLIB_REGISTER_NODE (nat44_ei_classify_node) = {
3421   .name = "nat44-ei-classify",
3422   .vector_size = sizeof (u32),
3423   .format_trace = format_nat44_ei_classify_trace,
3424   .type = VLIB_NODE_TYPE_INTERNAL,
3425   .n_errors = ARRAY_LEN(nat44_ei_classify_error_strings),
3426   .error_strings = nat44_ei_classify_error_strings,
3427   .n_next_nodes = NAT44_EI_CLASSIFY_N_NEXT,
3428   .next_nodes = {
3429     [NAT44_EI_CLASSIFY_NEXT_IN2OUT] = "nat44-ei-in2out",
3430     [NAT44_EI_CLASSIFY_NEXT_OUT2IN] = "nat44-ei-out2in",
3431     [NAT44_EI_CLASSIFY_NEXT_DROP] = "error-drop",
3432   },
3433 };
3434
3435 VLIB_NODE_FN (nat44_ei_handoff_classify_node)
3436 (vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
3437 {
3438   return nat44_ei_classify_inline_fn (vm, node, frame);
3439 }
3440
3441 VLIB_REGISTER_NODE (nat44_ei_handoff_classify_node) = {
3442   .name = "nat44-ei-handoff-classify",
3443   .vector_size = sizeof (u32),
3444   .format_trace = format_nat44_ei_classify_trace,
3445   .type = VLIB_NODE_TYPE_INTERNAL,
3446   .n_errors = ARRAY_LEN(nat44_ei_classify_error_strings),
3447   .error_strings = nat44_ei_classify_error_strings,
3448   .n_next_nodes = NAT44_EI_CLASSIFY_N_NEXT,
3449   .next_nodes = {
3450     [NAT44_EI_CLASSIFY_NEXT_IN2OUT] = "nat44-ei-in2out-worker-handoff",
3451     [NAT44_EI_CLASSIFY_NEXT_OUT2IN] = "nat44-ei-out2in-worker-handoff",
3452     [NAT44_EI_CLASSIFY_NEXT_DROP] = "error-drop",
3453   },
3454 };
3455
3456 /*
3457  * fd.io coding-style-patch-verification: ON
3458  *
3459  * Local Variables:
3460  * eval: (c-set-style "gnu")
3461  * End:
3462  */