nat: static mappings in flow hash
[vpp.git] / src / plugins / nat / nat44-ei / nat44_ei.c
1 /*
2  * nat44_ei.c - nat44 endpoint independent plugin
3  *
4  * Copyright (c) 2020 Cisco and/or its affiliates.
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at:
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
13  * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
14  * License for the specific language governing permissions and limitations
15  * under the License.
16  */
17
18 #include <vnet/plugin/plugin.h>
19 #include <vpp/app/version.h>
20
21 #include <vnet/vnet.h>
22 #include <vnet/ip/ip.h>
23 #include <vnet/ip/ip4.h>
24 #include <vnet/ip/ip_table.h>
25 #include <vnet/ip/reass/ip4_sv_reass.h>
26 #include <vnet/fib/fib_table.h>
27 #include <vnet/fib/ip4_fib.h>
28 #include <vnet/plugin/plugin.h>
29
30 // nat lib
31 #include <nat/lib/log.h>
32 #include <nat/lib/nat_syslog.h>
33 #include <nat/lib/nat_inlines.h>
34 #include <nat/lib/ipfix_logging.h>
35
36 #include <nat/nat44-ei/nat44_ei_dpo.h>
37 #include <nat/nat44-ei/nat44_ei_inlines.h>
38 #include <nat/nat44-ei/nat44_ei.h>
39
40 nat44_ei_main_t nat44_ei_main;
41
42 extern vlib_node_registration_t nat44_ei_hairpinning_node;
43 extern vlib_node_registration_t nat44_ei_hairpin_dst_node;
44 extern vlib_node_registration_t
45   nat44_ei_in2out_hairpinning_finish_ip4_lookup_node;
46 extern vlib_node_registration_t
47   nat44_ei_in2out_hairpinning_finish_interface_output_node;
48
/* Leave the enclosing void function immediately while the NAT44 EI plugin
 * is not enabled. */
#define skip_if_disabled()                                                    \
  do                                                                          \
    {                                                                         \
      if (PREDICT_FALSE (!nat44_ei_main.enabled))                             \
        return;                                                               \
    }                                                                         \
  while (0)
57
/* Log "plugin enabled" and make the enclosing function return 1 when the
 * NAT44 EI plugin is already enabled; otherwise do nothing. */
#define fail_if_enabled()                                                     \
  do                                                                          \
    {                                                                         \
      nat44_ei_main_t *nm = &nat44_ei_main;                                   \
      int nat44_ei_is_on = (nm->enabled != 0);                                \
      if (PREDICT_FALSE (nat44_ei_is_on))                                     \
        {                                                                     \
          nat44_ei_log_err ("plugin enabled");                                \
          return 1;                                                           \
        }                                                                     \
    }                                                                         \
  while (0)
69
/* Log "plugin disabled" and make the enclosing function return 1 when the
 * NAT44 EI plugin is not enabled; otherwise do nothing. */
#define fail_if_disabled()                                                    \
  do                                                                          \
    {                                                                         \
      nat44_ei_main_t *nm = &nat44_ei_main;                                   \
      int nat44_ei_is_off = !nm->enabled;                                     \
      if (PREDICT_FALSE (nat44_ei_is_off))                                    \
        {                                                                     \
          nat44_ei_log_err ("plugin disabled");                               \
          return 1;                                                           \
        }                                                                     \
    }                                                                         \
  while (0)
81
/*
 * Feature registrations for the NAT44 EI graph nodes.
 *
 * Each entry names the feature arc ("ip4-unicast", "ip4-output" or
 * "ip4-local") a node belongs to and the features it is ordered after
 * (.runs_after) or before (.runs_before).  The per-interface enabling of
 * these features is done elsewhere in this file through
 * vnet_feature_enable_disable ().
 */

/* classification nodes on the ip4-unicast arc */
VNET_FEATURE_INIT (ip4_nat_classify, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-classify",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature"),
};
VNET_FEATURE_INIT (ip4_nat_handoff_classify, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-handoff-classify",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature"),
};
/* in2out / out2in translation nodes; the out2in variants are additionally
 * ordered after "ip4-dhcp-client-detect" */
VNET_FEATURE_INIT (ip4_nat44_ei_in2out, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-in2out",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_out2in, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-out2in",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature",
                               "ip4-dhcp-client-detect"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_in2out_output, static) = {
  .arc_name = "ip4-output",
  .node_name = "nat44-ei-in2out-output",
  .runs_after = VNET_FEATURES ("acl-plugin-out-ip4-fa",
                               "ip4-sv-reassembly-output-feature"),
};
/* "-fast" variants of the translation nodes */
VNET_FEATURE_INIT (ip4_nat44_ei_in2out_fast, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-in2out-fast",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_out2in_fast, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-out2in-fast",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature",
                               "ip4-dhcp-client-detect"),
};
/* hairpinning nodes (ip4-unicast, ip4-output and ip4-local arcs) */
VNET_FEATURE_INIT (ip4_nat44_ei_hairpin_dst, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-hairpin-dst",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-sv-reassembly-feature"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_hairpin_src, static) = {
  .arc_name = "ip4-output",
  .node_name = "nat44-ei-hairpin-src",
  .runs_after = VNET_FEATURES ("acl-plugin-out-ip4-fa",
                               "ip4-sv-reassembly-output-feature"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_hairpinning, static) = {
  .arc_name = "ip4-local",
  .node_name = "nat44-ei-hairpinning",
  .runs_before = VNET_FEATURES ("ip4-local-end-of-arc"),
};
/* worker hand-off nodes; the code in this file selects them instead of the
 * plain translation nodes when more than one worker is configured */
VNET_FEATURE_INIT (ip4_nat44_ei_in2out_worker_handoff, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-in2out-worker-handoff",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_out2in_worker_handoff, static) = {
  .arc_name = "ip4-unicast",
  .node_name = "nat44-ei-out2in-worker-handoff",
  .runs_after = VNET_FEATURES ("acl-plugin-in-ip4-fa",
                               "ip4-dhcp-client-detect"),
};
VNET_FEATURE_INIT (ip4_nat44_ei_in2out_output_worker_handoff, static) = {
  .arc_name = "ip4-output",
  .node_name = "nat44-ei-in2out-output-worker-handoff",
  .runs_after = VNET_FEATURES ("acl-plugin-out-ip4-fa",
                               "ip4-sv-reassembly-output-feature"),
};
161
/* Plugin registration: build version and human-readable description. */
VLIB_PLUGIN_REGISTER () = {
  .version = VPP_BUILD_VER,
  .description = "IPv4 Endpoint-Independent NAT (NAT44 EI)",
};
166
/*
 * X-macro list of the classify error/counter symbols and their display
 * strings.  It is expanded twice below: once to build the enum and once to
 * build the matching string table, so both stay in the same order.
 */
#define foreach_nat44_ei_classify_error                                       \
  _ (NEXT_IN2OUT, "next in2out")                                              \
  _ (NEXT_OUT2IN, "next out2in")                                              \
  _ (FRAG_CACHED, "fragment cached")

/* Enum of NAT44_EI_CLASSIFY_ERROR_<sym> values; N_ERROR is the count. */
typedef enum
{
#define _(sym, str) NAT44_EI_CLASSIFY_ERROR_##sym,
  foreach_nat44_ei_classify_error
#undef _
    NAT44_EI_CLASSIFY_N_ERROR,
} nat44_ei_classify_error_t;

/* Display strings, indexed by nat44_ei_classify_error_t. */
static char *nat44_ei_classify_error_strings[] = {
#define _(sym, string) string,
  foreach_nat44_ei_classify_error
#undef _
};
185
/* Next-node slots for the classify node; N_NEXT is the number of slots. */
typedef enum
{
  NAT44_EI_CLASSIFY_NEXT_IN2OUT,
  NAT44_EI_CLASSIFY_NEXT_OUT2IN,
  NAT44_EI_CLASSIFY_NEXT_DROP,
  NAT44_EI_CLASSIFY_N_NEXT,
} nat44_ei_classify_next_t;
193
/* Per-packet trace record rendered by format_nat44_ei_classify_trace (). */
typedef struct
{
  /* non-zero: formatted as next "nat44-ei-in2out", zero: "nat44-ei-out2in" */
  u8 next_in2out;
  /* non-zero: formatted as "fragment cached" (next_in2out is then ignored) */
  u8 cached;
} nat44_ei_classify_trace_t;
199
/* Declaration only; the definition is not in this part of the file.
 * nat44_ei_interface_add_del () calls it with p_len 32 for every NAT pool
 * address and address-only static mapping, passing is_add = !is_del. */
void nat44_ei_add_del_addr_to_fib (ip4_address_t *addr, u8 p_len,
                                   u32 sw_if_index, int is_add);
202
203 static u8 *
204 format_nat44_ei_classify_trace (u8 *s, va_list *args)
205 {
206   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
207   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
208   nat44_ei_classify_trace_t *t = va_arg (*args, nat44_ei_classify_trace_t *);
209   char *next;
210
211   if (t->cached)
212     s = format (s, "nat44-ei-classify: fragment cached");
213   else
214     {
215       next = t->next_in2out ? "nat44-ei-in2out" : "nat44-ei-out2in";
216       s = format (s, "nat44-ei-classify: next %s", next);
217     }
218
219   return s;
220 }
221
/* Forward declaration; the definition is not in this part of the file.
 * Declared with an explicit (void) so that it is a real prototype and calls
 * with arguments are rejected by the compiler. */
static void nat44_ei_db_free (void);
223
/* Forward declaration; nat44_ei_plugin_enable () calls it with the
 * configured translation count and the two bihash bucket counts. */
static void nat44_ei_db_init (u32 translations, u32 translation_buckets,
                              u32 user_buckets);

/* Interface-address change callback; appended to
 * ip4_main.add_del_interface_address_callbacks in nat44_ei_init (). */
static void nat44_ei_ip4_add_del_interface_address_cb (
  ip4_main_t *im, uword opaque, u32 sw_if_index, ip4_address_t *address,
  u32 address_length, u32 if_address_index, u32 is_delete);

/* Second interface-address change callback, registered right after the one
 * above in nat44_ei_init (). */
static void nat44_ei_ip4_add_del_addr_only_sm_cb (
  ip4_main_t *im, uword opaque, u32 sw_if_index, ip4_address_t *address,
  u32 address_length, u32 if_address_index, u32 is_delete);

/* Interface-to-table binding change callback; appended to
 * ip4_main.table_bind_callbacks in nat44_ei_init (). */
static void nat44_ei_update_outside_fib (ip4_main_t *im, uword opaque,
                                         u32 sw_if_index, u32 new_fib_index,
                                         u32 old_fib_index);
238
239 void
240 nat44_ei_set_node_indexes (nat44_ei_main_t *nm, vlib_main_t *vm)
241 {
242   vlib_node_t *node;
243   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-out2in");
244   nm->out2in_node_index = node->index;
245   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-in2out");
246   nm->in2out_node_index = node->index;
247   node = vlib_get_node_by_name (vm, (u8 *) "nat44-ei-in2out-output");
248   nm->in2out_output_node_index = node->index;
249 }
250
251 int
252 nat44_ei_set_workers (uword *bitmap)
253 {
254   nat44_ei_main_t *nm = &nat44_ei_main;
255   int i, j = 0;
256
257   if (nm->num_workers < 2)
258     return VNET_API_ERROR_FEATURE_DISABLED;
259
260   if (clib_bitmap_last_set (bitmap) >= nm->num_workers)
261     return VNET_API_ERROR_INVALID_WORKER;
262
263   vec_free (nm->workers);
264   clib_bitmap_foreach (i, bitmap)
265     {
266       vec_add1 (nm->workers, i);
267       nm->per_thread_data[nm->first_worker_index + i].snat_thread_index = j;
268       nm->per_thread_data[nm->first_worker_index + i].thread_index = i;
269       j++;
270     }
271
272   nm->port_per_thread = (0xffff - 1024) / _vec_len (nm->workers);
273
274   return 0;
275 }
276
/*
 * Validate simple counter c for index i and then zero that index.
 *
 * c is the counter object itself (its address is taken here), i the index.
 * The expansion deliberately has no trailing semicolon, so the macro acts
 * as a single statement and is safe in an unbraced if/else.
 */
#define nat_validate_simple_counter(c, i)                                     \
  do                                                                          \
    {                                                                         \
      vlib_validate_simple_counter (&(c), (i));                               \
      vlib_zero_simple_counter (&(c), (i));                                   \
    }                                                                         \
  while (0)
284
/*
 * Name simple counter c and validate/zero its index 0.
 *
 * c is the counter object, n its name and sn its stat-segment name.  The
 * expansion deliberately has no trailing semicolon, so the macro acts as a
 * single statement and is safe in an unbraced if/else.
 */
#define nat_init_simple_counter(c, n, sn)                                     \
  do                                                                          \
    {                                                                         \
      (c).name = (n);                                                         \
      (c).stat_segment_name = (sn);                                           \
      nat_validate_simple_counter (c, 0);                                     \
    }                                                                         \
  while (0)
293
294 static_always_inline void
295 nat_validate_interface_counters (nat44_ei_main_t *nm, u32 sw_if_index)
296 {
297 #define _(x)                                                                  \
298   nat_validate_simple_counter (nm->counters.fastpath.in2out.x, sw_if_index);  \
299   nat_validate_simple_counter (nm->counters.fastpath.out2in.x, sw_if_index);  \
300   nat_validate_simple_counter (nm->counters.slowpath.in2out.x, sw_if_index);  \
301   nat_validate_simple_counter (nm->counters.slowpath.out2in.x, sw_if_index);
302   foreach_nat_counter;
303 #undef _
304   nat_validate_simple_counter (nm->counters.hairpinning, sw_if_index);
305 }
306
307 clib_error_t *
308 nat44_ei_init (vlib_main_t *vm)
309 {
310   nat44_ei_main_t *nm = &nat44_ei_main;
311   vlib_thread_main_t *tm = vlib_get_thread_main ();
312   vlib_thread_registration_t *tr;
313   ip4_add_del_interface_address_callback_t cbi = { 0 };
314   ip4_table_bind_callback_t cbt = { 0 };
315   u32 i, num_threads = 0;
316   uword *p, *bitmap = 0;
317
318   clib_memset (nm, 0, sizeof (*nm));
319
320   // required
321   nm->vnet_main = vnet_get_main ();
322   // convenience
323   nm->ip4_main = &ip4_main;
324   nm->api_main = vlibapi_get_main ();
325   nm->ip4_lookup_main = &ip4_main.lookup_main;
326
327   // handoff stuff
328   nm->fq_out2in_index = ~0;
329   nm->fq_in2out_index = ~0;
330   nm->fq_in2out_output_index = ~0;
331
332   nm->log_level = NAT_LOG_ERROR;
333
334   nat44_ei_set_node_indexes (nm, vm);
335   nm->log_class = vlib_log_register_class ("nat44-ei", 0);
336
337   nat_init_simple_counter (nm->total_users, "total-users",
338                            "/nat44-ei/total-users");
339   nat_init_simple_counter (nm->total_sessions, "total-sessions",
340                            "/nat44-ei/total-sessions");
341   nat_init_simple_counter (nm->user_limit_reached, "user-limit-reached",
342                            "/nat44-ei/user-limit-reached");
343
344 #define _(x)                                                                  \
345   nat_init_simple_counter (nm->counters.fastpath.in2out.x, #x,                \
346                            "/nat44-ei/in2out/fastpath/" #x);                  \
347   nat_init_simple_counter (nm->counters.fastpath.out2in.x, #x,                \
348                            "/nat44-ei/out2in/fastpath/" #x);                  \
349   nat_init_simple_counter (nm->counters.slowpath.in2out.x, #x,                \
350                            "/nat44-ei/in2out/slowpath/" #x);                  \
351   nat_init_simple_counter (nm->counters.slowpath.out2in.x, #x,                \
352                            "/nat44-ei/out2in/slowpath/" #x);
353   foreach_nat_counter;
354 #undef _
355   nat_init_simple_counter (nm->counters.hairpinning, "hairpinning",
356                            "/nat44-ei/hairpinning");
357
358   p = hash_get_mem (tm->thread_registrations_by_name, "workers");
359   if (p)
360     {
361       tr = (vlib_thread_registration_t *) p[0];
362       if (tr)
363         {
364           nm->num_workers = tr->count;
365           nm->first_worker_index = tr->first_index;
366         }
367     }
368   num_threads = tm->n_vlib_mains - 1;
369   nm->port_per_thread = 0xffff - 1024;
370   vec_validate (nm->per_thread_data, num_threads);
371
372   /* Use all available workers by default */
373   if (nm->num_workers > 1)
374     {
375
376       for (i = 0; i < nm->num_workers; i++)
377         bitmap = clib_bitmap_set (bitmap, i, 1);
378       nat44_ei_set_workers (bitmap);
379       clib_bitmap_free (bitmap);
380     }
381   else
382     nm->per_thread_data[0].snat_thread_index = 0;
383
384   /* callbacks to call when interface address changes. */
385   cbi.function = nat44_ei_ip4_add_del_interface_address_cb;
386   vec_add1 (nm->ip4_main->add_del_interface_address_callbacks, cbi);
387   cbi.function = nat44_ei_ip4_add_del_addr_only_sm_cb;
388   vec_add1 (nm->ip4_main->add_del_interface_address_callbacks, cbi);
389
390   /* callbacks to call when interface to table biding changes */
391   cbt.function = nat44_ei_update_outside_fib;
392   vec_add1 (nm->ip4_main->table_bind_callbacks, cbt);
393
394   nm->fib_src_low = fib_source_allocate (
395     "nat44-ei-low", FIB_SOURCE_PRIORITY_LOW, FIB_SOURCE_BH_SIMPLE);
396   nm->fib_src_hi = fib_source_allocate ("nat44-ei-hi", FIB_SOURCE_PRIORITY_HI,
397                                         FIB_SOURCE_BH_SIMPLE);
398
399   // used only by out2in-dpo feature
400   nat_dpo_module_init ();
401   nat_ha_init (vm, nm->num_workers, num_threads);
402
403   nm->hairpinning_fq_index =
404     vlib_frame_queue_main_init (nat44_ei_hairpinning_node.index, 0);
405   nm->hairpin_dst_fq_index =
406     vlib_frame_queue_main_init (nat44_ei_hairpin_dst_node.index, 0);
407   nm->in2out_hairpinning_finish_ip4_lookup_node_fq_index =
408     vlib_frame_queue_main_init (
409       nat44_ei_in2out_hairpinning_finish_ip4_lookup_node.index, 0);
410   nm->in2out_hairpinning_finish_interface_output_node_fq_index =
411     vlib_frame_queue_main_init (
412       nat44_ei_in2out_hairpinning_finish_interface_output_node.index, 0);
413   return nat44_ei_api_hookup (vm);
414 }
415
416 VLIB_INIT_FUNCTION (nat44_ei_init);
417
418 int
419 nat44_ei_plugin_enable (nat44_ei_config_t c)
420 {
421   nat44_ei_main_t *nm = &nat44_ei_main;
422
423   fail_if_enabled ();
424
425   if (!c.users)
426     c.users = 1024;
427
428   if (!c.sessions)
429     c.sessions = 10 * 1024;
430
431   if (!c.user_sessions)
432     c.user_sessions = c.sessions;
433
434   nm->rconfig = c;
435
436   if (!nm->frame_queue_nelts)
437     nm->frame_queue_nelts = NAT_FQ_NELTS_DEFAULT;
438
439   nm->translations = c.sessions;
440   nm->translation_buckets = nat_calc_bihash_buckets (c.sessions);
441   nm->user_buckets = nat_calc_bihash_buckets (c.users);
442
443   nm->pat = (!c.static_mapping_only ||
444              (c.static_mapping_only && c.connection_tracking));
445
446   nm->static_mapping_only = c.static_mapping_only;
447   nm->static_mapping_connection_tracking = c.connection_tracking;
448   nm->out2in_dpo = c.out2in_dpo;
449   nm->forwarding_enabled = 0;
450   nm->mss_clamping = 0;
451
452   nm->max_users_per_thread = c.users;
453   nm->max_translations_per_thread = c.sessions;
454   nm->max_translations_per_user = c.user_sessions;
455
456   nm->inside_vrf_id = c.inside_vrf;
457   nm->inside_fib_index = fib_table_find_or_create_and_lock (
458     FIB_PROTOCOL_IP4, c.inside_vrf, nm->fib_src_hi);
459
460   nm->outside_vrf_id = c.outside_vrf;
461   nm->outside_fib_index = fib_table_find_or_create_and_lock (
462     FIB_PROTOCOL_IP4, c.outside_vrf, nm->fib_src_hi);
463
464   nat_reset_timeouts (&nm->timeouts);
465   nat44_ei_db_init (nm->translations, nm->translation_buckets,
466                     nm->user_buckets);
467   nat44_ei_set_alloc_default ();
468
469   // TODO: zero simple counter for all counters missing
470
471   vlib_zero_simple_counter (&nm->total_users, 0);
472   vlib_zero_simple_counter (&nm->total_sessions, 0);
473   vlib_zero_simple_counter (&nm->user_limit_reached, 0);
474
475   nat_ha_enable ();
476   nm->enabled = 1;
477
478   return 0;
479 }
480
481 void
482 nat44_ei_addresses_free (nat44_ei_address_t **addresses)
483 {
484   nat44_ei_address_t *ap;
485   vec_foreach (ap, *addresses)
486     {
487 #define _(N, i, n, s) vec_free (ap->busy_##n##_ports_per_thread);
488       foreach_nat_protocol
489 #undef _
490     }
491   vec_free (*addresses);
492   *addresses = 0;
493 }
494
/*
 * Add or remove the NAT44 EI inside/outside role on an interface.
 *
 * sw_if_index  interface to configure
 * is_inside    non-zero: inside role, zero: outside role
 * is_del       non-zero: remove the role, zero: add it
 *
 * Returns 0 on success, 1 when the plugin is disabled,
 * VNET_API_ERROR_UNSUPPORTED for an outside interface while out2in_dpo is
 * set, VNET_API_ERROR_VALUE_EXIST when the interface is already configured
 * as an output-feature interface, VNET_API_ERROR_NO_SUCH_ENTRY when
 * deleting an interface that is not configured, or the non-zero result of a
 * failing ip4_sv_reass_enable_disable_with_refcnt () /
 * vnet_feature_enable_disable () call.
 *
 * NOTE(review): error returns in the middle of the function do not undo
 * the outside-FIB refcount change or the feature changes already made --
 * confirm whether callers rely on that.
 */
int
nat44_ei_interface_add_del (u32 sw_if_index, u8 is_inside, int is_del)
{
  const char *feature_name, *del_feature_name;
  nat44_ei_main_t *nm = &nat44_ei_main;
  nat44_ei_interface_t *i;
  nat44_ei_address_t *ap;
  nat44_ei_static_mapping_t *m;
  nat44_ei_outside_fib_t *outside_fib;
  u32 fib_index =
    fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);

  fail_if_disabled ();

  if (nm->out2in_dpo && !is_inside)
    {
      nat44_ei_log_err ("error unsupported");
      return VNET_API_ERROR_UNSUPPORTED;
    }

  /* an interface cannot be both a regular and an output-feature interface */
  pool_foreach (i, nm->output_feature_interfaces)
    {
      if (i->sw_if_index == sw_if_index)
        {
          nat44_ei_log_err ("error interface already configured");
          return VNET_API_ERROR_VALUE_EXIST;
        }
    }

  /* pick the graph node for a single-role interface: the "-fast" nodes for
   * static-mapping-only without connection tracking, otherwise the worker
   * hand-off nodes with more than one worker, otherwise the plain nodes */
  if (nm->static_mapping_only && !(nm->static_mapping_connection_tracking))
    feature_name = is_inside ? "nat44-ei-in2out-fast" : "nat44-ei-out2in-fast";
  else
    {
      if (nm->num_workers > 1)
        feature_name = is_inside ? "nat44-ei-in2out-worker-handoff" :
                                   "nat44-ei-out2in-worker-handoff";
      else
        feature_name = is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
    }

  /* create the hand-off frame queues on first use (multi-worker only) */
  if (nm->fq_in2out_index == ~0 && nm->num_workers > 1)
    nm->fq_in2out_index = vlib_frame_queue_main_init (nm->in2out_node_index,
                                                      nm->frame_queue_nelts);

  if (nm->fq_out2in_index == ~0 && nm->num_workers > 1)
    nm->fq_out2in_index = vlib_frame_queue_main_init (nm->out2in_node_index,
                                                      nm->frame_queue_nelts);

  /* outside interfaces: maintain the refcounted list of outside FIBs.
   * NOTE(review): this runs before the interface lookup below, so the
   * refcount also changes when that lookup later returns early (e.g. delete
   * of an unknown interface, or re-adding an existing role) -- confirm. */
  if (!is_inside)
    {
      vec_foreach (outside_fib, nm->outside_fibs)
        {
          if (outside_fib->fib_index == fib_index)
            {
              if (is_del)
                {
                  outside_fib->refcount--;
                  if (!outside_fib->refcount)
                    vec_del1 (nm->outside_fibs,
                              outside_fib - nm->outside_fibs);
                }
              else
                outside_fib->refcount++;
              goto feature_set;
            }
        }
      if (!is_del)
        {
          vec_add2 (nm->outside_fibs, outside_fib, 1);
          outside_fib->refcount = 1;
          outside_fib->fib_index = fib_index;
        }
    }

feature_set:
  /* look for an existing entry for this interface */
  pool_foreach (i, nm->interfaces)
    {
      if (i->sw_if_index == sw_if_index)
        {
          if (is_del)
            {
              if (nat44_ei_interface_is_inside (i) &&
                  nat44_ei_interface_is_outside (i))
                {
                  /* interface has both roles: drop the requested one and
                   * replace the classify node with the node of the role
                   * that remains */
                  if (is_inside)
                    i->flags &= ~NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
                  else
                    i->flags &= ~NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;

                  /* NOTE(review): the clib_warning () calls in this
                   * function look like leftover debug output -- confirm */
                  if (nm->num_workers > 1)
                    {
                      del_feature_name = "nat44-ei-handoff-classify";
                      clib_warning (
                        "del_feature_name = nat44-ei-handoff-classify");
                      feature_name = !is_inside ?
                                       "nat44-ei-in2out-worker-handoff" :
                                       "nat44-ei-out2in-worker-handoff";
                    }
                  else
                    {
                      del_feature_name = "nat44-ei-classify";
                      clib_warning ("del_feature_name = nat44-ei-classify");
                      feature_name =
                        !is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
                    }

                  int rv =
                    ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
                  if (rv)
                    return rv;
                  rv = vnet_feature_enable_disable (
                    "ip4-unicast", del_feature_name, sw_if_index, 0, 0, 0);
                  if (rv)
                    return rv;
                  rv = vnet_feature_enable_disable (
                    "ip4-unicast", feature_name, sw_if_index, 1, 0, 0);
                  if (rv)
                    return rv;
                  /* outside role removed, inside remains: turn hairpinning
                   * on the ip4-local arc back on */
                  if (!is_inside)
                    {
                      rv = vnet_feature_enable_disable ("ip4-local",
                                                        "nat44-ei-hairpinning",
                                                        sw_if_index, 1, 0, 0);
                      if (rv)
                        return rv;
                    }
                }
              else
                {
                  /* interface has a single role: disable its feature and
                   * release the pool entry */
                  int rv =
                    ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 0);
                  if (rv)
                    return rv;
                  rv = vnet_feature_enable_disable (
                    "ip4-unicast", feature_name, sw_if_index, 0, 0, 0);
                  if (rv)
                    return rv;
                  pool_put (nm->interfaces, i);
                  if (is_inside)
                    {
                      rv = vnet_feature_enable_disable ("ip4-local",
                                                        "nat44-ei-hairpinning",
                                                        sw_if_index, 0, 0, 0);
                      if (rv)
                        return rv;
                    }
                }
            }
          else
            {
              /* adding a role the interface already has is a no-op */
              if ((nat44_ei_interface_is_inside (i) && is_inside) ||
                  (nat44_ei_interface_is_outside (i) && !is_inside))
                return 0;

              /* interface gains its second role: replace the node of the
               * existing role with the classify node */
              if (nm->num_workers > 1)
                {
                  del_feature_name = !is_inside ?
                                       "nat44-ei-in2out-worker-handoff" :
                                       "nat44-ei-out2in-worker-handoff";
                  feature_name = "nat44-ei-handoff-classify";
                  clib_warning ("feature_name = nat44-ei-handoff-classify");
                }
              else
                {
                  del_feature_name =
                    !is_inside ? "nat44-ei-in2out" : "nat44-ei-out2in";
                  feature_name = "nat44-ei-classify";
                  clib_warning ("feature_name = nat44-ei-classify");
                }

              int rv =
                ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
              if (rv)
                return rv;
              rv = vnet_feature_enable_disable (
                "ip4-unicast", del_feature_name, sw_if_index, 0, 0, 0);
              if (rv)
                return rv;
              rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
                                                sw_if_index, 1, 0, 0);
              if (rv)
                return rv;
              /* outside role added to an inside interface: hairpinning on
               * the ip4-local arc is switched off */
              if (!is_inside)
                {
                  rv = vnet_feature_enable_disable (
                    "ip4-local", "nat44-ei-hairpinning", sw_if_index, 0, 0, 0);
                  if (rv)
                    return rv;
                }
              goto set_flags;
            }

          /* delete handled; continue with the FIB update */
          goto fib;
        }
    }

  /* no existing entry for this interface */
  if (is_del)
    {
      nat44_ei_log_err ("error interface couldn't be found");
      return VNET_API_ERROR_NO_SUCH_ENTRY;
    }

  /* first role for this interface: create the entry and enable features.
   * NOTE(review): if one of the calls below fails, the new pool entry stays
   * allocated with flags 0 -- confirm this is intended. */
  pool_get (nm->interfaces, i);
  i->sw_if_index = sw_if_index;
  i->flags = 0;
  nat_validate_interface_counters (nm, sw_if_index);

  int rv = vnet_feature_enable_disable ("ip4-unicast", feature_name,
                                        sw_if_index, 1, 0, 0);
  if (rv)
    return rv;

  rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, 1);
  if (rv)
    return rv;

  if (is_inside && !nm->out2in_dpo)
    {
      rv = vnet_feature_enable_disable ("ip4-local", "nat44-ei-hairpinning",
                                        sw_if_index, 1, 0, 0);
      if (rv)
        return rv;
    }

set_flags:
  /* record the new role; adding an inside role needs no FIB update */
  if (is_inside)
    {
      i->flags |= NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
      return 0;
    }
  else
    i->flags |= NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;

  /* Add/delete external addresses to FIB */
fib:
  /* every NAT pool address, as a /32 */
  vec_foreach (ap, nm->addresses)
    nat44_ei_add_del_addr_to_fib (&ap->addr, 32, sw_if_index, !is_del);

  /* external addresses of address-only static mappings, skipping mappings
   * whose local and external addresses are equal */
  pool_foreach (m, nm->static_mappings)
    {
      if (!(nat44_ei_is_addr_only_static_mapping (m)) ||
          (m->local_addr.as_u32 == m->external_addr.as_u32))
        continue;

      nat44_ei_add_del_addr_to_fib (&m->external_addr, 32, sw_if_index,
                                    !is_del);
    }

  return 0;
}
745
746 int
747 nat44_ei_interface_add_del_output_feature (u32 sw_if_index, u8 is_inside,
748                                            int is_del)
749 {
750   nat44_ei_main_t *nm = &nat44_ei_main;
751   nat44_ei_interface_t *i;
752   nat44_ei_address_t *ap;
753   nat44_ei_static_mapping_t *m;
754   nat44_ei_outside_fib_t *outside_fib;
755   u32 fib_index =
756     fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index);
757
758   fail_if_disabled ();
759
760   if (nm->static_mapping_only && !(nm->static_mapping_connection_tracking))
761     {
762       nat44_ei_log_err ("error unsupported");
763       return VNET_API_ERROR_UNSUPPORTED;
764     }
765
766   pool_foreach (i, nm->interfaces)
767     {
768       if (i->sw_if_index == sw_if_index)
769         {
770           nat44_ei_log_err ("error interface already configured");
771           return VNET_API_ERROR_VALUE_EXIST;
772         }
773     }
774
775   if (!is_inside)
776     {
777       vec_foreach (outside_fib, nm->outside_fibs)
778         {
779           if (outside_fib->fib_index == fib_index)
780             {
781               if (is_del)
782                 {
783                   outside_fib->refcount--;
784                   if (!outside_fib->refcount)
785                     vec_del1 (nm->outside_fibs,
786                               outside_fib - nm->outside_fibs);
787                 }
788               else
789                 outside_fib->refcount++;
790               goto feature_set;
791             }
792         }
793       if (!is_del)
794         {
795           vec_add2 (nm->outside_fibs, outside_fib, 1);
796           outside_fib->refcount = 1;
797           outside_fib->fib_index = fib_index;
798         }
799     }
800
801 feature_set:
802   if (is_inside)
803     {
804       int rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, !is_del);
805       if (rv)
806         return rv;
807       rv =
808         ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, !is_del);
809       if (rv)
810         return rv;
811       rv = vnet_feature_enable_disable ("ip4-unicast", "nat44-ei-hairpin-dst",
812                                         sw_if_index, !is_del, 0, 0);
813       if (rv)
814         return rv;
815       rv = vnet_feature_enable_disable ("ip4-output", "nat44-ei-hairpin-src",
816                                         sw_if_index, !is_del, 0, 0);
817       if (rv)
818         return rv;
819       goto fq;
820     }
821
822   if (nm->num_workers > 1)
823     {
824       int rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, !is_del);
825       if (rv)
826         return rv;
827       rv =
828         ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, !is_del);
829       if (rv)
830         return rv;
831       rv = vnet_feature_enable_disable ("ip4-unicast",
832                                         "nat44-ei-out2in-worker-handoff",
833                                         sw_if_index, !is_del, 0, 0);
834       if (rv)
835         return rv;
836       rv = vnet_feature_enable_disable (
837         "ip4-output", "nat44-ei-in2out-output-worker-handoff", sw_if_index,
838         !is_del, 0, 0);
839       if (rv)
840         return rv;
841     }
842   else
843     {
844       int rv = ip4_sv_reass_enable_disable_with_refcnt (sw_if_index, !is_del);
845       if (rv)
846         return rv;
847       rv =
848         ip4_sv_reass_output_enable_disable_with_refcnt (sw_if_index, !is_del);
849       if (rv)
850         return rv;
851       rv = vnet_feature_enable_disable ("ip4-unicast", "nat44-ei-out2in",
852                                         sw_if_index, !is_del, 0, 0);
853       if (rv)
854         return rv;
855       rv = vnet_feature_enable_disable ("ip4-output", "nat44-ei-in2out-output",
856                                         sw_if_index, !is_del, 0, 0);
857       if (rv)
858         return rv;
859     }
860
861 fq:
862   if (nm->fq_in2out_output_index == ~0 && nm->num_workers > 1)
863     nm->fq_in2out_output_index =
864       vlib_frame_queue_main_init (nm->in2out_output_node_index, 0);
865
866   if (nm->fq_out2in_index == ~0 && nm->num_workers > 1)
867     nm->fq_out2in_index =
868       vlib_frame_queue_main_init (nm->out2in_node_index, 0);
869
870   pool_foreach (i, nm->output_feature_interfaces)
871     {
872       if (i->sw_if_index == sw_if_index)
873         {
874           if (is_del)
875             pool_put (nm->output_feature_interfaces, i);
876           else
877             return VNET_API_ERROR_VALUE_EXIST;
878
879           goto fib;
880         }
881     }
882
883   if (is_del)
884     {
885       nat44_ei_log_err ("error interface couldn't be found");
886       return VNET_API_ERROR_NO_SUCH_ENTRY;
887     }
888
889   pool_get (nm->output_feature_interfaces, i);
890   i->sw_if_index = sw_if_index;
891   i->flags = 0;
892   nat_validate_interface_counters (nm, sw_if_index);
893   if (is_inside)
894     i->flags |= NAT44_EI_INTERFACE_FLAG_IS_INSIDE;
895   else
896     i->flags |= NAT44_EI_INTERFACE_FLAG_IS_OUTSIDE;
897
898   /* Add/delete external addresses to FIB */
899 fib:
900   if (is_inside)
901     return 0;
902
903   vec_foreach (ap, nm->addresses)
904     nat44_ei_add_del_addr_to_fib (&ap->addr, 32, sw_if_index, !is_del);
905
906   pool_foreach (m, nm->static_mappings)
907     {
908       if (!((nat44_ei_is_addr_only_static_mapping (m))) ||
909           (m->local_addr.as_u32 == m->external_addr.as_u32))
910         continue;
911
912       nat44_ei_add_del_addr_to_fib (&m->external_addr, 32, sw_if_index,
913                                     !is_del);
914     }
915
916   return 0;
917 }
918
919 int
920 nat44_ei_plugin_disable ()
921 {
922   nat44_ei_main_t *nm = &nat44_ei_main;
923   nat44_ei_interface_t *i, *pool;
924   int error = 0;
925
926   // first unregister all nodes from interfaces
927   pool = pool_dup (nm->interfaces);
928   pool_foreach (i, pool)
929     {
930       if (nat44_ei_interface_is_inside (i))
931         error = nat44_ei_interface_add_del (i->sw_if_index, 1, 1);
932       if (nat44_ei_interface_is_outside (i))
933         error = nat44_ei_interface_add_del (i->sw_if_index, 0, 1);
934
935       if (error)
936         {
937           nat44_ei_log_err ("error occurred while removing interface %u",
938                             i->sw_if_index);
939         }
940     }
941   pool_free (pool);
942   pool_free (nm->interfaces);
943
944   pool = pool_dup (nm->output_feature_interfaces);
945   pool_foreach (i, pool)
946     {
947       if (nat44_ei_interface_is_inside (i))
948         error =
949           nat44_ei_interface_add_del_output_feature (i->sw_if_index, 1, 1);
950       if (nat44_ei_interface_is_outside (i))
951         error =
952           nat44_ei_interface_add_del_output_feature (i->sw_if_index, 0, 1);
953
954       if (error)
955         {
956           nat44_ei_log_err ("error occurred while removing interface %u",
957                             i->sw_if_index);
958         }
959     }
960   pool_free (pool);
961   pool_free (nm->output_feature_interfaces);
962
963   nat_ha_disable ();
964   nat44_ei_db_free ();
965
966   nat44_ei_addresses_free (&nm->addresses);
967
968   vec_free (nm->to_resolve);
969   vec_free (nm->auto_add_sw_if_indices);
970
971   nm->to_resolve = 0;
972   nm->auto_add_sw_if_indices = 0;
973
974   nm->forwarding_enabled = 0;
975
976   nm->enabled = 0;
977   clib_memset (&nm->rconfig, 0, sizeof (nm->rconfig));
978
979   return 0;
980 }
981
982 int
983 nat44_ei_set_outside_address_and_port (nat44_ei_address_t *addresses,
984                                        u32 thread_index, ip4_address_t addr,
985                                        u16 port, nat_protocol_t protocol)
986 {
987   nat44_ei_main_t *nm = &nat44_ei_main;
988   nat44_ei_address_t *a = 0;
989   u32 address_index;
990   u16 port_host_byte_order = clib_net_to_host_u16 (port);
991
992   for (address_index = 0; address_index < vec_len (addresses); address_index++)
993     {
994       if (addresses[address_index].addr.as_u32 != addr.as_u32)
995         continue;
996
997       a = addresses + address_index;
998       switch (protocol)
999         {
1000 #define _(N, j, n, s)                                                         \
1001   case NAT_PROTOCOL_##N:                                                      \
1002     if (a->busy_##n##_port_refcounts[port_host_byte_order])                   \
1003       return VNET_API_ERROR_INSTANCE_IN_USE;                                  \
1004     ++a->busy_##n##_port_refcounts[port_host_byte_order];                     \
1005     a->busy_##n##_ports_per_thread[thread_index]++;                           \
1006     a->busy_##n##_ports++;                                                    \
1007     return 0;
1008           foreach_nat_protocol
1009 #undef _
1010             default : nat_elog_info (nm, "unknown protocol");
1011           return 1;
1012         }
1013     }
1014
1015   return VNET_API_ERROR_NO_SUCH_ENTRY;
1016 }
1017
1018 void
1019 nat44_ei_add_del_address_dpo (ip4_address_t addr, u8 is_add)
1020 {
1021   nat44_ei_main_t *nm = &nat44_ei_main;
1022   dpo_id_t dpo_v4 = DPO_INVALID;
1023   fib_prefix_t pfx = {
1024     .fp_proto = FIB_PROTOCOL_IP4,
1025     .fp_len = 32,
1026     .fp_addr.ip4.as_u32 = addr.as_u32,
1027   };
1028
1029   if (is_add)
1030     {
1031       nat_dpo_create (DPO_PROTO_IP4, 0, &dpo_v4);
1032       fib_table_entry_special_dpo_add (0, &pfx, nm->fib_src_hi,
1033                                        FIB_ENTRY_FLAG_EXCLUSIVE, &dpo_v4);
1034       dpo_reset (&dpo_v4);
1035     }
1036   else
1037     {
1038       fib_table_entry_special_remove (0, &pfx, nm->fib_src_hi);
1039     }
1040 }
1041
1042 void
1043 nat44_ei_free_outside_address_and_port (nat44_ei_address_t *addresses,
1044                                         u32 thread_index, ip4_address_t *addr,
1045                                         u16 port, nat_protocol_t protocol)
1046 {
1047   nat44_ei_main_t *nm = &nat44_ei_main;
1048   nat44_ei_address_t *a;
1049   u32 address_index;
1050   u16 port_host_byte_order = clib_net_to_host_u16 (port);
1051
1052   for (address_index = 0; address_index < vec_len (addresses); address_index++)
1053     {
1054       if (addresses[address_index].addr.as_u32 == addr->as_u32)
1055         break;
1056     }
1057
1058   ASSERT (address_index < vec_len (addresses));
1059
1060   a = addresses + address_index;
1061
1062   switch (protocol)
1063     {
1064 #define _(N, i, n, s)                                                         \
1065   case NAT_PROTOCOL_##N:                                                      \
1066     ASSERT (a->busy_##n##_port_refcounts[port_host_byte_order] >= 1);         \
1067     --a->busy_##n##_port_refcounts[port_host_byte_order];                     \
1068     a->busy_##n##_ports--;                                                    \
1069     a->busy_##n##_ports_per_thread[thread_index]--;                           \
1070     break;
1071       foreach_nat_protocol
1072 #undef _
1073         default : nat_elog_info (nm, "unknown protocol");
1074       return;
1075     }
1076 }
1077
1078 void
1079 nat44_ei_free_session_data_v2 (nat44_ei_main_t *nm, nat44_ei_session_t *s,
1080                                u32 thread_index, u8 is_ha)
1081 {
1082   clib_bihash_kv_8_8_t kv;
1083
1084   /* session lookup tables */
1085   init_nat_i2o_k (&kv, s);
1086   if (clib_bihash_add_del_8_8 (&nm->in2out, &kv, 0))
1087     nat_elog_warn (nm, "in2out key del failed");
1088   init_nat_o2i_k (&kv, s);
1089   if (clib_bihash_add_del_8_8 (&nm->out2in, &kv, 0))
1090     nat_elog_warn (nm, "out2in key del failed");
1091
1092   if (!is_ha)
1093     nat_syslog_nat44_apmdel (s->user_index, s->in2out.fib_index,
1094                              &s->in2out.addr, s->in2out.port, &s->out2in.addr,
1095                              s->out2in.port, s->nat_proto);
1096
1097   if (nat44_ei_is_unk_proto_session (s))
1098     return;
1099
1100   if (!is_ha)
1101     {
1102       /* log NAT event */
1103       nat_ipfix_logging_nat44_ses_delete (
1104         thread_index, s->in2out.addr.as_u32, s->out2in.addr.as_u32,
1105         nat_proto_to_ip_proto (s->nat_proto), s->in2out.port, s->out2in.port,
1106         s->in2out.fib_index);
1107
1108       nat_ha_sdel (&s->out2in.addr, s->out2in.port, &s->ext_host_addr,
1109                    s->ext_host_port, s->nat_proto, s->out2in.fib_index,
1110                    thread_index);
1111     }
1112
1113   if (nat44_ei_is_session_static (s))
1114     return;
1115
1116   nat44_ei_free_outside_address_and_port (nm->addresses, thread_index,
1117                                           &s->out2in.addr, s->out2in.port,
1118                                           s->nat_proto);
1119 }
1120
1121 nat44_ei_user_t *
1122 nat44_ei_user_get_or_create (nat44_ei_main_t *nm, ip4_address_t *addr,
1123                              u32 fib_index, u32 thread_index)
1124 {
1125   nat44_ei_user_t *u = 0;
1126   nat44_ei_user_key_t user_key;
1127   clib_bihash_kv_8_8_t kv, value;
1128   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1129   dlist_elt_t *per_user_list_head_elt;
1130
1131   user_key.addr.as_u32 = addr->as_u32;
1132   user_key.fib_index = fib_index;
1133   kv.key = user_key.as_u64;
1134
1135   /* Ever heard of the "user" = src ip4 address before? */
1136   if (clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1137     {
1138       if (pool_elts (tnm->users) >= nm->max_users_per_thread)
1139         {
1140           vlib_increment_simple_counter (&nm->user_limit_reached, thread_index,
1141                                          0, 1);
1142           nat_elog_warn (nm, "maximum user limit reached");
1143           return NULL;
1144         }
1145       /* no, make a new one */
1146       pool_get (tnm->users, u);
1147       clib_memset (u, 0, sizeof (*u));
1148
1149       u->addr.as_u32 = addr->as_u32;
1150       u->fib_index = fib_index;
1151
1152       pool_get (tnm->list_pool, per_user_list_head_elt);
1153
1154       u->sessions_per_user_list_head_index =
1155         per_user_list_head_elt - tnm->list_pool;
1156
1157       clib_dlist_init (tnm->list_pool, u->sessions_per_user_list_head_index);
1158
1159       kv.value = u - tnm->users;
1160
1161       /* add user */
1162       if (clib_bihash_add_del_8_8 (&tnm->user_hash, &kv, 1))
1163         {
1164           nat_elog_warn (nm, "user_hash key add failed");
1165           nat44_ei_delete_user_with_no_session (nm, u, thread_index);
1166           return NULL;
1167         }
1168
1169       vlib_set_simple_counter (&nm->total_users, thread_index, 0,
1170                                pool_elts (tnm->users));
1171     }
1172   else
1173     {
1174       u = pool_elt_at_index (tnm->users, value.value);
1175     }
1176
1177   return u;
1178 }
1179
1180 nat44_ei_session_t *
1181 nat44_ei_session_alloc_or_recycle (nat44_ei_main_t *nm, nat44_ei_user_t *u,
1182                                    u32 thread_index, f64 now)
1183 {
1184   nat44_ei_session_t *s;
1185   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1186   u32 oldest_per_user_translation_list_index, session_index;
1187   dlist_elt_t *oldest_per_user_translation_list_elt;
1188   dlist_elt_t *per_user_translation_list_elt;
1189
1190   /* Over quota? Recycle the least recently used translation */
1191   if ((u->nsessions + u->nstaticsessions) >= nm->max_translations_per_user)
1192     {
1193       oldest_per_user_translation_list_index = clib_dlist_remove_head (
1194         tnm->list_pool, u->sessions_per_user_list_head_index);
1195
1196       ASSERT (oldest_per_user_translation_list_index != ~0);
1197
1198       /* Add it back to the end of the LRU list */
1199       clib_dlist_addtail (tnm->list_pool, u->sessions_per_user_list_head_index,
1200                           oldest_per_user_translation_list_index);
1201       /* Get the list element */
1202       oldest_per_user_translation_list_elt = pool_elt_at_index (
1203         tnm->list_pool, oldest_per_user_translation_list_index);
1204
1205       /* Get the session index from the list element */
1206       session_index = oldest_per_user_translation_list_elt->value;
1207
1208       /* Get the session */
1209       s = pool_elt_at_index (tnm->sessions, session_index);
1210
1211       nat44_ei_free_session_data_v2 (nm, s, thread_index, 0);
1212       if (nat44_ei_is_session_static (s))
1213         u->nstaticsessions--;
1214       else
1215         u->nsessions--;
1216       s->flags = 0;
1217       s->total_bytes = 0;
1218       s->total_pkts = 0;
1219       s->state = 0;
1220       s->ext_host_addr.as_u32 = 0;
1221       s->ext_host_port = 0;
1222       s->ext_host_nat_addr.as_u32 = 0;
1223       s->ext_host_nat_port = 0;
1224     }
1225   else
1226     {
1227       pool_get (tnm->sessions, s);
1228       clib_memset (s, 0, sizeof (*s));
1229
1230       /* Create list elts */
1231       pool_get (tnm->list_pool, per_user_translation_list_elt);
1232       clib_dlist_init (tnm->list_pool,
1233                        per_user_translation_list_elt - tnm->list_pool);
1234
1235       per_user_translation_list_elt->value = s - tnm->sessions;
1236       s->per_user_index = per_user_translation_list_elt - tnm->list_pool;
1237       s->per_user_list_head_index = u->sessions_per_user_list_head_index;
1238
1239       clib_dlist_addtail (tnm->list_pool, s->per_user_list_head_index,
1240                           per_user_translation_list_elt - tnm->list_pool);
1241
1242       s->user_index = u - tnm->users;
1243       vlib_set_simple_counter (&nm->total_sessions, thread_index, 0,
1244                                pool_elts (tnm->sessions));
1245     }
1246
1247   s->ha_last_refreshed = now;
1248
1249   return s;
1250 }
1251
1252 void
1253 nat44_ei_free_session_data (nat44_ei_main_t *nm, nat44_ei_session_t *s,
1254                             u32 thread_index, u8 is_ha)
1255 {
1256   clib_bihash_kv_8_8_t kv;
1257
1258   init_nat_i2o_k (&kv, s);
1259   if (clib_bihash_add_del_8_8 (&nm->in2out, &kv, 0))
1260     nat_elog_warn (nm, "in2out key del failed");
1261
1262   init_nat_o2i_k (&kv, s);
1263   if (clib_bihash_add_del_8_8 (&nm->out2in, &kv, 0))
1264     nat_elog_warn (nm, "out2in key del failed");
1265
1266   if (!is_ha)
1267     {
1268       nat_syslog_nat44_apmdel (s->user_index, s->in2out.fib_index,
1269                                &s->in2out.addr, s->in2out.port,
1270                                &s->out2in.addr, s->out2in.port, s->nat_proto);
1271
1272       nat_ipfix_logging_nat44_ses_delete (
1273         thread_index, s->in2out.addr.as_u32, s->out2in.addr.as_u32,
1274         nat_proto_to_ip_proto (s->nat_proto), s->in2out.port, s->out2in.port,
1275         s->in2out.fib_index);
1276
1277       nat_ha_sdel (&s->out2in.addr, s->out2in.port, &s->ext_host_addr,
1278                    s->ext_host_port, s->nat_proto, s->out2in.fib_index,
1279                    thread_index);
1280     }
1281
1282   if (nat44_ei_is_session_static (s))
1283     return;
1284
1285   nat44_ei_free_outside_address_and_port (nm->addresses, thread_index,
1286                                           &s->out2in.addr, s->out2in.port,
1287                                           s->nat_proto);
1288 }
1289
1290 static_always_inline void
1291 nat44_ei_user_del_sessions (nat44_ei_user_t *u, u32 thread_index)
1292 {
1293   dlist_elt_t *elt;
1294   nat44_ei_session_t *s;
1295
1296   nat44_ei_main_t *nm = &nat44_ei_main;
1297   nat44_ei_main_per_thread_data_t *tnm = &nm->per_thread_data[thread_index];
1298
1299   // get head
1300   elt =
1301     pool_elt_at_index (tnm->list_pool, u->sessions_per_user_list_head_index);
1302   // get first element
1303   elt = pool_elt_at_index (tnm->list_pool, elt->next);
1304
1305   while (elt->value != ~0)
1306     {
1307       s = pool_elt_at_index (tnm->sessions, elt->value);
1308       elt = pool_elt_at_index (tnm->list_pool, elt->next);
1309
1310       nat44_ei_free_session_data (nm, s, thread_index, 0);
1311       nat44_ei_delete_session (nm, s, thread_index);
1312     }
1313 }
1314
1315 int
1316 nat44_ei_user_del (ip4_address_t *addr, u32 fib_index)
1317 {
1318   int rv = 1;
1319
1320   nat44_ei_main_t *nm = &nat44_ei_main;
1321   nat44_ei_main_per_thread_data_t *tnm;
1322
1323   nat44_ei_user_key_t user_key;
1324   clib_bihash_kv_8_8_t kv, value;
1325
1326   user_key.addr.as_u32 = addr->as_u32;
1327   user_key.fib_index = fib_index;
1328   kv.key = user_key.as_u64;
1329
1330   if (nm->num_workers > 1)
1331     {
1332       vec_foreach (tnm, nm->per_thread_data)
1333         {
1334           if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1335             {
1336               nat44_ei_user_del_sessions (
1337                 pool_elt_at_index (tnm->users, value.value),
1338                 tnm->thread_index);
1339               rv = 0;
1340               break;
1341             }
1342         }
1343     }
1344   else
1345     {
1346       tnm = vec_elt_at_index (nm->per_thread_data, nm->num_workers);
1347       if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1348         {
1349           nat44_ei_user_del_sessions (
1350             pool_elt_at_index (tnm->users, value.value), tnm->thread_index);
1351           rv = 0;
1352         }
1353     }
1354   return rv;
1355 }
1356
1357 void
1358 nat44_ei_static_mapping_del_sessions (nat44_ei_main_t *nm,
1359                                       nat44_ei_main_per_thread_data_t *tnm,
1360                                       nat44_ei_user_key_t u_key, int addr_only,
1361                                       ip4_address_t e_addr, u16 e_port)
1362 {
1363   clib_bihash_kv_8_8_t kv, value;
1364   kv.key = u_key.as_u64;
1365   u64 user_index;
1366   dlist_elt_t *head, *elt;
1367   nat44_ei_user_t *u;
1368   nat44_ei_session_t *s;
1369   u32 elt_index, head_index, ses_index;
1370
1371   if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1372     {
1373       user_index = value.value;
1374       u = pool_elt_at_index (tnm->users, user_index);
1375       if (u->nstaticsessions)
1376         {
1377           head_index = u->sessions_per_user_list_head_index;
1378           head = pool_elt_at_index (tnm->list_pool, head_index);
1379           elt_index = head->next;
1380           elt = pool_elt_at_index (tnm->list_pool, elt_index);
1381           ses_index = elt->value;
1382           while (ses_index != ~0)
1383             {
1384               s = pool_elt_at_index (tnm->sessions, ses_index);
1385               elt = pool_elt_at_index (tnm->list_pool, elt->next);
1386               ses_index = elt->value;
1387
1388               if (!addr_only)
1389                 {
1390                   if ((s->out2in.addr.as_u32 != e_addr.as_u32) ||
1391                       (s->out2in.port != e_port))
1392                     continue;
1393                 }
1394
1395               if (!nat44_ei_is_session_static (s))
1396                 continue;
1397
1398               nat44_ei_free_session_data_v2 (nm, s, tnm - nm->per_thread_data,
1399                                              0);
1400               nat44_ei_delete_session (nm, s, tnm - nm->per_thread_data);
1401
1402               if (!addr_only)
1403                 break;
1404             }
1405         }
1406     }
1407 }
1408
1409 u32
1410 nat44_ei_get_in2out_worker_index (ip4_header_t *ip0, u32 rx_fib_index0,
1411                                   u8 is_output)
1412 {
1413   nat44_ei_main_t *nm = &nat44_ei_main;
1414   u32 next_worker_index = 0;
1415   u32 hash;
1416
1417   next_worker_index = nm->first_worker_index;
1418   hash = ip0->src_address.as_u32 + (ip0->src_address.as_u32 >> 8) +
1419          (ip0->src_address.as_u32 >> 16) + (ip0->src_address.as_u32 >> 24);
1420
1421   if (PREDICT_TRUE (is_pow2 (_vec_len (nm->workers))))
1422     next_worker_index += nm->workers[hash & (_vec_len (nm->workers) - 1)];
1423   else
1424     next_worker_index += nm->workers[hash % _vec_len (nm->workers)];
1425
1426   return next_worker_index;
1427 }
1428
1429 u32
1430 nat44_ei_get_out2in_worker_index (vlib_buffer_t *b, ip4_header_t *ip0,
1431                                   u32 rx_fib_index0, u8 is_output)
1432 {
1433   nat44_ei_main_t *nm = &nat44_ei_main;
1434   udp_header_t *udp;
1435   u16 port;
1436   clib_bihash_kv_8_8_t kv, value;
1437   nat44_ei_static_mapping_t *m;
1438   u32 proto;
1439   u32 next_worker_index = 0;
1440
1441   /* first try static mappings without port */
1442   if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
1443     {
1444       init_nat_k (&kv, ip0->dst_address, 0, rx_fib_index0, 0);
1445       if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
1446                                    &value))
1447         {
1448           m = pool_elt_at_index (nm->static_mappings, value.value);
1449           return m->workers[0];
1450         }
1451     }
1452
1453   proto = ip_proto_to_nat_proto (ip0->protocol);
1454   udp = ip4_next_header (ip0);
1455   port = vnet_buffer (b)->ip.reass.l4_dst_port;
1456
1457   /* unknown protocol */
1458   if (PREDICT_FALSE (proto == NAT_PROTOCOL_OTHER))
1459     {
1460       /* use current thread */
1461       return vlib_get_thread_index ();
1462     }
1463
1464   if (PREDICT_FALSE (ip0->protocol == IP_PROTOCOL_ICMP))
1465     {
1466       icmp46_header_t *icmp = (icmp46_header_t *) udp;
1467       icmp_echo_header_t *echo = (icmp_echo_header_t *) (icmp + 1);
1468       if (!icmp_type_is_error_message (
1469             vnet_buffer (b)->ip.reass.icmp_type_or_tcp_flags))
1470         port = vnet_buffer (b)->ip.reass.l4_src_port;
1471       else
1472         {
1473           /* if error message, then it's not fragmented and we can access it */
1474           ip4_header_t *inner_ip = (ip4_header_t *) (echo + 1);
1475           proto = ip_proto_to_nat_proto (inner_ip->protocol);
1476           void *l4_header = ip4_next_header (inner_ip);
1477           switch (proto)
1478             {
1479             case NAT_PROTOCOL_ICMP:
1480               icmp = (icmp46_header_t *) l4_header;
1481               echo = (icmp_echo_header_t *) (icmp + 1);
1482               port = echo->identifier;
1483               break;
1484             case NAT_PROTOCOL_UDP:
1485             case NAT_PROTOCOL_TCP:
1486               port = ((tcp_udp_header_t *) l4_header)->src_port;
1487               break;
1488             default:
1489               return vlib_get_thread_index ();
1490             }
1491         }
1492     }
1493
1494   /* try static mappings with port */
1495   if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
1496     {
1497       init_nat_k (&kv, ip0->dst_address, port, rx_fib_index0, proto);
1498       if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
1499                                    &value))
1500         {
1501           m = pool_elt_at_index (nm->static_mappings, value.value);
1502           return m->workers[0];
1503         }
1504     }
1505
1506   /* worker by outside port */
1507   next_worker_index = nm->first_worker_index;
1508   next_worker_index +=
1509     nm->workers[(clib_net_to_host_u16 (port) - 1024) / nm->port_per_thread];
1510   return next_worker_index;
1511 }
1512
1513 static int
1514 nat44_ei_alloc_default_cb (nat44_ei_address_t *addresses, u32 fib_index,
1515                            u32 thread_index, nat_protocol_t proto,
1516                            ip4_address_t s_addr, ip4_address_t *addr,
1517                            u16 *port, u16 port_per_thread,
1518                            u32 snat_thread_index)
1519 {
1520   nat44_ei_main_t *nm = &nat44_ei_main;
1521   nat44_ei_address_t *a, *ga = 0;
1522   u32 portnum;
1523   int i;
1524
1525   if (vec_len (addresses) > 0)
1526     {
1527
1528       int s_addr_offset = s_addr.as_u32 % vec_len (addresses);
1529
1530       for (i = s_addr_offset; i < vec_len (addresses); ++i)
1531         {
1532           a = addresses + i;
1533           switch (proto)
1534             {
1535 #define _(N, j, n, s)                                                         \
1536   case NAT_PROTOCOL_##N:                                                      \
1537     if (a->busy_##n##_ports_per_thread[thread_index] < port_per_thread)       \
1538       {                                                                       \
1539         if (a->fib_index == fib_index)                                        \
1540           {                                                                   \
1541             while (1)                                                         \
1542               {                                                               \
1543                 portnum = (port_per_thread * snat_thread_index) +             \
1544                           nat_random_port (&nm->random_seed, 0,               \
1545                                            port_per_thread - 1) +             \
1546                           1024;                                               \
1547                 if (a->busy_##n##_port_refcounts[portnum])                    \
1548                   continue;                                                   \
1549                 --a->busy_##n##_port_refcounts[portnum];                      \
1550                 a->busy_##n##_ports_per_thread[thread_index]++;               \
1551                 a->busy_##n##_ports++;                                        \
1552                 *addr = a->addr;                                              \
1553                 *port = clib_host_to_net_u16 (portnum);                       \
1554                 return 0;                                                     \
1555               }                                                               \
1556           }                                                                   \
1557         else if (a->fib_index == ~0)                                          \
1558           {                                                                   \
1559             ga = a;                                                           \
1560           }                                                                   \
1561       }                                                                       \
1562     break;
1563               foreach_nat_protocol;
1564             default:
1565               nat_elog_info (nm, "unknown protocol");
1566               return 1;
1567             }
1568         }
1569
1570       for (i = 0; i < s_addr_offset; ++i)
1571         {
1572           a = addresses + i;
1573           switch (proto)
1574             {
1575               foreach_nat_protocol;
1576             default:
1577               nat_elog_info (nm, "unknown protocol");
1578               return 1;
1579             }
1580         }
1581   if (ga)
1582     {
1583       a = ga;
1584       // fake fib index to reuse macro
1585       fib_index = ~0;
1586       switch (proto)
1587         {
1588           foreach_nat_protocol;
1589             default : nat_elog_info (nm, "unknown protocol");
1590           return 1;
1591         }
1592     }
1593     }
1594
1595 #undef _
1596
1597   /* Totally out of translations to use... */
1598   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1599   return 1;
1600 }
1601
1602 static int
1603 nat44_ei_alloc_range_cb (nat44_ei_address_t *addresses, u32 fib_index,
1604                          u32 thread_index, nat_protocol_t proto,
1605                          ip4_address_t s_addr, ip4_address_t *addr, u16 *port,
1606                          u16 port_per_thread, u32 snat_thread_index)
1607 {
1608   nat44_ei_main_t *nm = &nat44_ei_main;
1609   nat44_ei_address_t *a = addresses;
1610   u16 portnum, ports;
1611
1612   ports = nm->end_port - nm->start_port + 1;
1613
1614   if (!vec_len (addresses))
1615     goto exhausted;
1616
1617   switch (proto)
1618     {
1619 #define _(N, i, n, s)                                                         \
1620   case NAT_PROTOCOL_##N:                                                      \
1621     if (a->busy_##n##_ports < ports)                                          \
1622       {                                                                       \
1623         while (1)                                                             \
1624           {                                                                   \
1625             portnum = nat_random_port (&nm->random_seed, nm->start_port,      \
1626                                        nm->end_port);                         \
1627             if (a->busy_##n##_port_refcounts[portnum])                        \
1628               continue;                                                       \
1629             ++a->busy_##n##_port_refcounts[portnum];                          \
1630             a->busy_##n##_ports++;                                            \
1631             *addr = a->addr;                                                  \
1632             *port = clib_host_to_net_u16 (portnum);                           \
1633             return 0;                                                         \
1634           }                                                                   \
1635       }                                                                       \
1636     break;
1637       foreach_nat_protocol
1638 #undef _
1639         default : nat_elog_info (nm, "unknown protocol");
1640       return 1;
1641     }
1642
1643 exhausted:
1644   /* Totally out of translations to use... */
1645   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1646   return 1;
1647 }
1648
1649 static int
1650 nat44_ei_alloc_mape_cb (nat44_ei_address_t *addresses, u32 fib_index,
1651                         u32 thread_index, nat_protocol_t proto,
1652                         ip4_address_t s_addr, ip4_address_t *addr, u16 *port,
1653                         u16 port_per_thread, u32 snat_thread_index)
1654 {
1655   nat44_ei_main_t *nm = &nat44_ei_main;
1656   nat44_ei_address_t *a = addresses;
1657   u16 m, ports, portnum, A, j;
1658   m = 16 - (nm->psid_offset + nm->psid_length);
1659   ports = (1 << (16 - nm->psid_length)) - (1 << m);
1660
1661   if (!vec_len (addresses))
1662     goto exhausted;
1663
1664   switch (proto)
1665     {
1666 #define _(N, i, n, s)                                                         \
1667   case NAT_PROTOCOL_##N:                                                      \
1668     if (a->busy_##n##_ports < ports)                                          \
1669       {                                                                       \
1670         while (1)                                                             \
1671           {                                                                   \
1672             A = nat_random_port (&nm->random_seed, 1,                         \
1673                                  pow2_mask (nm->psid_offset));                \
1674             j = nat_random_port (&nm->random_seed, 0, pow2_mask (m));         \
1675             portnum = A | (nm->psid << nm->psid_offset) | (j << (16 - m));    \
1676             if (a->busy_##n##_port_refcounts[portnum])                        \
1677               continue;                                                       \
1678             ++a->busy_##n##_port_refcounts[portnum];                          \
1679             a->busy_##n##_ports++;                                            \
1680             *addr = a->addr;                                                  \
1681             *port = clib_host_to_net_u16 (portnum);                           \
1682             return 0;                                                         \
1683           }                                                                   \
1684       }                                                                       \
1685     break;
1686       foreach_nat_protocol
1687 #undef _
1688         default : nat_elog_info (nm, "unknown protocol");
1689       return 1;
1690     }
1691
1692 exhausted:
1693   /* Totally out of translations to use... */
1694   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
1695   return 1;
1696 }
1697
1698 void
1699 nat44_ei_set_alloc_default ()
1700 {
1701   nat44_ei_main_t *nm = &nat44_ei_main;
1702
1703   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_DEFAULT;
1704   nm->alloc_addr_and_port = nat44_ei_alloc_default_cb;
1705 }
1706
1707 void
1708 nat44_ei_set_alloc_range (u16 start_port, u16 end_port)
1709 {
1710   nat44_ei_main_t *nm = &nat44_ei_main;
1711
1712   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_RANGE;
1713   nm->alloc_addr_and_port = nat44_ei_alloc_range_cb;
1714   nm->start_port = start_port;
1715   nm->end_port = end_port;
1716 }
1717
1718 void
1719 nat44_ei_set_alloc_mape (u16 psid, u16 psid_offset, u16 psid_length)
1720 {
1721   nat44_ei_main_t *nm = &nat44_ei_main;
1722
1723   nm->addr_and_port_alloc_alg = NAT44_EI_ADDR_AND_PORT_ALLOC_ALG_MAPE;
1724   nm->alloc_addr_and_port = nat44_ei_alloc_mape_cb;
1725   nm->psid = psid;
1726   nm->psid_offset = psid_offset;
1727   nm->psid_length = psid_length;
1728 }
1729
1730 static void
1731 nat44_ei_add_static_mapping_when_resolved (ip4_address_t l_addr, u16 l_port,
1732                                            u16 e_port, nat_protocol_t proto,
1733                                            u32 sw_if_index, u32 vrf_id,
1734                                            int addr_only, int identity_nat,
1735                                            u8 *tag)
1736 {
1737   nat44_ei_main_t *nm = &nat44_ei_main;
1738   nat44_ei_static_map_resolve_t *rp;
1739
1740   vec_add2 (nm->to_resolve, rp, 1);
1741   clib_memset (rp, 0, sizeof (*rp));
1742
1743   rp->l_addr.as_u32 = l_addr.as_u32;
1744   rp->l_port = l_port;
1745   rp->e_port = e_port;
1746   rp->sw_if_index = sw_if_index;
1747   rp->vrf_id = vrf_id;
1748   rp->proto = proto;
1749   rp->addr_only = addr_only;
1750   rp->identity_nat = identity_nat;
1751   rp->tag = vec_dup (tag);
1752 }
1753
1754 void
1755 nat44_ei_delete_session (nat44_ei_main_t *nm, nat44_ei_session_t *ses,
1756                          u32 thread_index)
1757 {
1758   nat44_ei_main_per_thread_data_t *tnm =
1759     vec_elt_at_index (nm->per_thread_data, thread_index);
1760   clib_bihash_kv_8_8_t kv, value;
1761   nat44_ei_user_t *u;
1762   const nat44_ei_user_key_t u_key = { .addr = ses->in2out.addr,
1763                                       .fib_index = ses->in2out.fib_index };
1764   const u8 u_static = nat44_ei_is_session_static (ses);
1765
1766   clib_dlist_remove (tnm->list_pool, ses->per_user_index);
1767   pool_put_index (tnm->list_pool, ses->per_user_index);
1768
1769   pool_put (tnm->sessions, ses);
1770   vlib_set_simple_counter (&nm->total_sessions, thread_index, 0,
1771                            pool_elts (tnm->sessions));
1772
1773   kv.key = u_key.as_u64;
1774   if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
1775     {
1776       u = pool_elt_at_index (tnm->users, value.value);
1777       if (u_static)
1778         u->nstaticsessions--;
1779       else
1780         u->nsessions--;
1781
1782       nat44_ei_delete_user_with_no_session (nm, u, thread_index);
1783     }
1784 }
1785
1786 int
1787 nat44_ei_del_session (nat44_ei_main_t *nm, ip4_address_t *addr, u16 port,
1788                       nat_protocol_t proto, u32 vrf_id, int is_in)
1789 {
1790   nat44_ei_main_per_thread_data_t *tnm;
1791   clib_bihash_kv_8_8_t kv, value;
1792   u32 fib_index = fib_table_find (FIB_PROTOCOL_IP4, vrf_id);
1793   nat44_ei_session_t *s;
1794   clib_bihash_8_8_t *t;
1795
1796   init_nat_k (&kv, *addr, port, fib_index, proto);
1797   t = is_in ? &nm->in2out : &nm->out2in;
1798   if (!clib_bihash_search_8_8 (t, &kv, &value))
1799     {
1800       // this is called from API/CLI, so the world is stopped here
1801       // it's safe to manipulate arbitrary per-thread data
1802       u32 thread_index = nat_value_get_thread_index (&value);
1803       tnm = vec_elt_at_index (nm->per_thread_data, thread_index);
1804       u32 session_index = nat_value_get_session_index (&value);
1805       if (pool_is_free_index (tnm->sessions, session_index))
1806         return VNET_API_ERROR_UNSPECIFIED;
1807
1808       s = pool_elt_at_index (tnm->sessions, session_index);
1809       nat44_ei_free_session_data_v2 (nm, s, tnm - nm->per_thread_data, 0);
1810       nat44_ei_delete_session (nm, s, tnm - nm->per_thread_data);
1811       return 0;
1812     }
1813
1814   return VNET_API_ERROR_NO_SUCH_ENTRY;
1815 }
1816
1817 u32
1818 nat44_ei_get_thread_idx_by_port (u16 e_port)
1819 {
1820   nat44_ei_main_t *nm = &nat44_ei_main;
1821   u32 thread_idx = nm->num_workers;
1822   if (nm->num_workers > 1)
1823     {
1824       thread_idx = nm->first_worker_index +
1825                    nm->workers[(e_port - 1024) / nm->port_per_thread];
1826     }
1827   return thread_idx;
1828 }
1829
1830 void
1831 nat44_ei_add_del_addr_to_fib (ip4_address_t *addr, u8 p_len, u32 sw_if_index,
1832                               int is_add)
1833 {
1834   nat44_ei_main_t *nm = &nat44_ei_main;
1835   fib_prefix_t prefix = {
1836     .fp_len = p_len,
1837     .fp_proto = FIB_PROTOCOL_IP4,
1838     .fp_addr = {
1839                 .ip4.as_u32 = addr->as_u32,
1840                 },
1841   };
1842   u32 fib_index = ip4_fib_table_get_index_for_sw_if_index (sw_if_index);
1843
1844   if (is_add)
1845     fib_table_entry_update_one_path (
1846       fib_index, &prefix, nm->fib_src_low,
1847       (FIB_ENTRY_FLAG_CONNECTED | FIB_ENTRY_FLAG_LOCAL |
1848        FIB_ENTRY_FLAG_EXCLUSIVE),
1849       DPO_PROTO_IP4, NULL, sw_if_index, ~0, 1, NULL, FIB_ROUTE_PATH_FLAG_NONE);
1850   else
1851     fib_table_entry_delete (fib_index, &prefix, nm->fib_src_low);
1852 }
1853
/*
 * Add (is_add != 0) or delete (is_add == 0) a NAT44-EI static mapping.
 *
 * l_addr/l_port describe the local side, e_addr/e_port the external side.
 * addr_only mappings ignore ports and protocol; identity_nat mappings keep
 * a pool of per-VRF "locals" instead of a single vrf/fib pair.
 *
 * When sw_if_index != ~0 the external address is taken from the first IPv4
 * address of that interface and a record is kept in nm->to_resolve; if the
 * interface has no address yet, only the to_resolve vector is updated and
 * 0 is returned.
 *
 * For addr_only mappings whose local and external addresses differ, the
 * external /32 is finally added to / removed from the FIB through
 * nat44_ei_add_del_addr_to_fib.
 *
 * Returns 0 on success, otherwise one of the VNET_API_ERROR_* codes
 * returned below (VALUE_EXIST, NO_SUCH_ENTRY, INVALID_VALUE,
 * INVALID_VALUE_2).
 */
1854 int
1855 nat44_ei_add_del_static_mapping (ip4_address_t l_addr, ip4_address_t e_addr,
1856                                  u16 l_port, u16 e_port, nat_protocol_t proto,
1857                                  u32 sw_if_index, u32 vrf_id, u8 addr_only,
1858                                  u8 identity_nat, u8 *tag, u8 is_add)
1859 {
1860   nat44_ei_main_t *nm = &nat44_ei_main;
1861   nat44_ei_static_mapping_t *m = 0;
1862   clib_bihash_kv_8_8_t kv, value;
1863   nat44_ei_address_t *a = 0;
1864   u32 fib_index = ~0;
1865   nat44_ei_interface_t *interface;
1866   nat44_ei_main_per_thread_data_t *tnm;
1867   nat44_ei_user_key_t u_key;
1868   nat44_ei_user_t *u;
1869   dlist_elt_t *head, *elt;
1870   u32 elt_index, head_index;
1871   u32 ses_index;
1872   u64 user_index;
1873   nat44_ei_session_t *s;
1874   nat44_ei_static_map_resolve_t *rp, *rp_match = 0;
1875   nat44_ei_lb_addr_port_t *local;
1876   u32 find = ~0;
1877   int i;
1878
/* Interface-bound mapping: consult / update the to_resolve records first */
1879   if (sw_if_index != ~0)
1880     {
1881       ip4_address_t *first_int_addr;
1882
/* Look for an existing resolve record describing the same mapping */
1883       for (i = 0; i < vec_len (nm->to_resolve); i++)
1884         {
1885           rp = nm->to_resolve + i;
1886           if (rp->sw_if_index != sw_if_index ||
1887               rp->l_addr.as_u32 != l_addr.as_u32 || rp->vrf_id != vrf_id ||
1888               rp->addr_only != addr_only)
1889             continue;
1890
1891           if (!addr_only)
1892             {
/* NOTE(review): with '&&' a record is skipped only when BOTH ports
   differ, so a record sharing just one port still matches - confirm
   whether '||' was intended */
1893               if ((rp->l_port != l_port && rp->e_port != e_port) ||
1894                   rp->proto != proto)
1895                 continue;
1896             }
1897
1898           rp_match = rp;
1899           break;
1900         }
1901
1902       /* Might be already set... */
1903       first_int_addr = ip4_interface_first_address (
1904         nm->ip4_main, sw_if_index, 0 /* just want the address */);
1905
1906       if (is_add)
1907         {
1908           if (rp_match)
1909             return VNET_API_ERROR_VALUE_EXIST;
1910
1911           nat44_ei_add_static_mapping_when_resolved (
1912             l_addr, l_port, e_port, proto, sw_if_index, vrf_id, addr_only,
1913             identity_nat, tag);
1914
1915           /* DHCP resolution required? */
1916           if (!first_int_addr)
1917             return 0;
1918
1919           e_addr.as_u32 = first_int_addr->as_u32;
1920           /* Identity mapping? */
1921           if (l_addr.as_u32 == 0)
1922             l_addr.as_u32 = e_addr.as_u32;
1923         }
1924       else
1925         {
1926           if (!rp_match)
1927             return VNET_API_ERROR_NO_SUCH_ENTRY;
1928
/* i still holds the index at which the matching record was found */
1929           vec_del1 (nm->to_resolve, i);
1930
1931           if (!first_int_addr)
1932             return 0;
1933
1934           e_addr.as_u32 = first_int_addr->as_u32;
1935           /* Identity mapping? */
1936           if (l_addr.as_u32 == 0)
1937             l_addr.as_u32 = e_addr.as_u32;
1938         }
1939     }
1940
/* Look up an existing mapping by its external key; addr_only mappings are
   keyed with port 0 and protocol 0, and the fib index in the key is 0 */
1941   init_nat_k (&kv, e_addr, addr_only ? 0 : e_port, 0, addr_only ? 0 : proto);
1942   if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv, &value))
1943     m = pool_elt_at_index (nm->static_mappings, value.value);
1944
1945   if (is_add)
1946     {
1947       if (m)
1948         {
1949           // identity mapping for second vrf
1950           if (nat44_ei_is_identity_static_mapping (m))
1951             {
1952               pool_foreach (local, m->locals)
1953                 {
1954                   if (local->vrf_id == vrf_id)
1955                     return VNET_API_ERROR_VALUE_EXIST;
1956                 }
1957               pool_get (m->locals, local);
1958               local->vrf_id = vrf_id;
1959               local->fib_index = fib_table_find_or_create_and_lock (
1960                 FIB_PROTOCOL_IP4, vrf_id, nm->fib_src_low);
1961               init_nat_kv (&kv, m->local_addr, m->local_port, local->fib_index,
1962                            m->proto, 0, m - nm->static_mappings);
1963               clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 1);
1964               return 0;
1965             }
1966           return VNET_API_ERROR_VALUE_EXIST;
1967         }
1968
1969       /* Convert VRF id to FIB index */
1970       if (vrf_id != ~0)
1971         {
1972           fib_index = fib_table_find_or_create_and_lock (
1973             FIB_PROTOCOL_IP4, vrf_id, nm->fib_src_low);
1974         }
1975       /* If not specified use inside VRF id from NAT44 plugin config */
1976       else
1977         {
1978           fib_index = nm->inside_fib_index;
1979           vrf_id = nm->inside_vrf_id;
1980           fib_table_lock (fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
1981         }
1982
/* A non-identity mapping must not reuse an already mapped local key.
   NOTE(review): the error returns from here up to the pool_get below
   happen after the FIB table lock (and, for interface-bound mappings, the
   resolve record) was taken above, and nothing visible in this function
   releases them on those paths - confirm whether that is intended */
1983       if (!identity_nat)
1984         {
1985           init_nat_k (&kv, l_addr, addr_only ? 0 : l_port, fib_index,
1986                       addr_only ? 0 : proto);
1987           if (!clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv,
1988                                        &value))
1989             return VNET_API_ERROR_VALUE_EXIST;
1990         }
1991
1992       /* Find external address in allocated addresses and reserve port for
1993          address and port pair mapping when dynamic translations enabled */
1994       if (!(addr_only || nm->static_mapping_only))
1995         {
1996           for (i = 0; i < vec_len (nm->addresses); i++)
1997             {
1998               if (nm->addresses[i].addr.as_u32 == e_addr.as_u32)
1999                 {
2000                   a = nm->addresses + i;
2001                   /* External port must be unused */
2002                   switch (proto)
2003                     {
2004 #define _(N, j, n, s)                                                         \
2005   case NAT_PROTOCOL_##N:                                                      \
2006     if (a->busy_##n##_port_refcounts[e_port])                                 \
2007       return VNET_API_ERROR_INVALID_VALUE;                                    \
2008     ++a->busy_##n##_port_refcounts[e_port];                                   \
2009     if (e_port > 1024)                                                        \
2010       {                                                                       \
2011         a->busy_##n##_ports++;                                                \
2012         a->busy_##n##_ports_per_thread[nat44_ei_get_thread_idx_by_port (      \
2013           e_port)]++;                                                         \
2014       }                                                                       \
2015     break;
2016                       foreach_nat_protocol
2017 #undef _
2018                         default : nat_elog_info (nm, "unknown protocol");
2019                       return VNET_API_ERROR_INVALID_VALUE_2;
2020                     }
2021                   break;
2022                 }
2023             }
2024           /* External address must be allocated */
2025           if (!a && (l_addr.as_u32 != e_addr.as_u32))
2026             {
2027               if (sw_if_index != ~0)
2028                 {
/* Drop a resolve record again before failing.
   NOTE(review): the '&&' chain skips a record only when ALL listed fields
   differ, so the first non-addr_only record sharing any one field is the
   one removed - confirm whether '||' was intended */
2029                   for (i = 0; i < vec_len (nm->to_resolve); i++)
2030                     {
2031                       rp = nm->to_resolve + i;
2032                       if (rp->addr_only)
2033                         continue;
2034                       if (rp->sw_if_index != sw_if_index &&
2035                           rp->l_addr.as_u32 != l_addr.as_u32 &&
2036                           rp->vrf_id != vrf_id && rp->l_port != l_port &&
2037                           rp->e_port != e_port && rp->proto != proto)
2038                         continue;
2039
2040                       vec_del1 (nm->to_resolve, i);
2041                       break;
2042                     }
2043                 }
2044               return VNET_API_ERROR_NO_SUCH_ENTRY;
2045             }
2046         }
2047
/* Create the mapping entry and fill it from the (possibly resolved)
   arguments */
2048       pool_get (nm->static_mappings, m);
2049       clib_memset (m, 0, sizeof (*m));
2050       m->tag = vec_dup (tag);
2051       m->local_addr = l_addr;
2052       m->external_addr = e_addr;
2053
2054       if (addr_only)
2055         m->flags |= NAT44_EI_STATIC_MAPPING_FLAG_ADDR_ONLY;
2056       else
2057         {
2058           m->local_port = l_port;
2059           m->external_port = e_port;
2060           m->proto = proto;
2061         }
2062
2063       if (identity_nat)
2064         {
2065           m->flags |= NAT44_EI_STATIC_MAPPING_FLAG_IDENTITY_NAT;
2066           pool_get (m->locals, local);
2067           local->vrf_id = vrf_id;
2068           local->fib_index = fib_index;
2069         }
2070       else
2071         {
2072           m->vrf_id = vrf_id;
2073           m->fib_index = fib_index;
2074         }
2075
/* Pick the per-thread data to work on: with several workers the in2out
   worker chosen for the local address is remembered in m->workers */
2076       if (nm->num_workers > 1)
2077         {
2078           ip4_header_t ip = {
2079             .src_address = m->local_addr,
2080           };
2081           vec_add1 (m->workers,
2082                     nat44_ei_get_in2out_worker_index (&ip, m->fib_index, 0));
2083           tnm = vec_elt_at_index (nm->per_thread_data, m->workers[0]);
2084         }
2085       else
2086         tnm = vec_elt_at_index (nm->per_thread_data, nm->num_workers);
2087
/* Publish the mapping in both lookup tables; the stored value is the
   mapping's index in nm->static_mappings */
2088       init_nat_kv (&kv, m->local_addr, m->local_port, fib_index, m->proto, 0,
2089                    m - nm->static_mappings);
2090       clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 1);
2091
2092       init_nat_kv (&kv, m->external_addr, m->external_port, 0, m->proto, 0,
2093                    m - nm->static_mappings);
2094       clib_bihash_add_del_8_8 (&nm->static_mapping_by_external, &kv, 1);
2095
2096       /* Delete dynamic sessions matching local address (+ local port) */
2097       // TODO: based on type of NAT EI/ED
2098       if (!(nm->static_mapping_only))
2099         {
2100           u_key.addr = m->local_addr;
2101           u_key.fib_index = m->fib_index;
2102           kv.key = u_key.as_u64;
2103           if (!clib_bihash_search_8_8 (&tnm->user_hash, &kv, &value))
2104             {
2105               user_index = value.value;
2106               u = pool_elt_at_index (tnm->users, user_index);
2107               if (u->nsessions)
2108                 {
/* Walk the user's session list; the walk stops at an element whose value
   is ~0 (presumably the list head - confirm) */
2109                   head_index = u->sessions_per_user_list_head_index;
2110                   head = pool_elt_at_index (tnm->list_pool, head_index);
2111                   elt_index = head->next;
2112                   elt = pool_elt_at_index (tnm->list_pool, elt_index);
2113                   ses_index = elt->value;
2114                   while (ses_index != ~0)
2115                     {
/* Advance to the next element before the current session may be
   deleted below */
2116                       s = pool_elt_at_index (tnm->sessions, ses_index);
2117                       elt = pool_elt_at_index (tnm->list_pool, elt->next);
2118                       ses_index = elt->value;
2119
2120                       if (nat44_ei_is_session_static (s))
2121                         continue;
2122
2123                       if (!addr_only && s->in2out.port != m->local_port)
2124                         continue;
2125
2126                       nat44_ei_free_session_data_v2 (
2127                         nm, s, tnm - nm->per_thread_data, 0);
2128                       nat44_ei_delete_session (nm, s,
2129                                                tnm - nm->per_thread_data);
2130
/* A port-specific mapping stops after the first deleted session */
2131                       if (!addr_only)
2132                         break;
2133                     }
2134                 }
2135             }
2136         }
2137     }
2138   else
2139     {
/* Delete path: without an existing mapping an interface-bound request
   still succeeds (its resolve record was already removed above) */
2140       if (!m)
2141         {
2142           if (sw_if_index != ~0)
2143             return 0;
2144           else
2145             return VNET_API_ERROR_NO_SUCH_ENTRY;
2146         }
2147
2148       if (identity_nat)
2149         {
2150           if (vrf_id == ~0)
2151             vrf_id = nm->inside_vrf_id;
2152
/* Find and release the per-VRF local entry of the identity mapping */
2153           pool_foreach (local, m->locals)
2154             {
2155               if (local->vrf_id == vrf_id)
2156                 find = local - m->locals;
2157             }
2158           if (find == ~0)
2159             return VNET_API_ERROR_NO_SUCH_ENTRY;
2160
2161           local = pool_elt_at_index (m->locals, find);
2162           fib_index = local->fib_index;
2163           pool_put (m->locals, local);
2164         }
2165       else
2166         fib_index = m->fib_index;
2167
2168       /* Free external address port */
2169       if (!(addr_only || nm->static_mapping_only))
2170         {
2171           for (i = 0; i < vec_len (nm->addresses); i++)
2172             {
2173               if (nm->addresses[i].addr.as_u32 == e_addr.as_u32)
2174                 {
2175                   a = nm->addresses + i;
2176                   switch (proto)
2177                     {
2178 #define _(N, j, n, s)                                                         \
2179   case NAT_PROTOCOL_##N:                                                      \
2180     --a->busy_##n##_port_refcounts[e_port];                                   \
2181     if (e_port > 1024)                                                        \
2182       {                                                                       \
2183         a->busy_##n##_ports--;                                                \
2184         a->busy_##n##_ports_per_thread[nat44_ei_get_thread_idx_by_port (      \
2185           e_port)]--;                                                         \
2186       }                                                                       \
2187     break;
2188                       foreach_nat_protocol
2189 #undef _
2190                         default : return VNET_API_ERROR_INVALID_VALUE_2;
2191                     }
2192                   break;
2193                 }
2194             }
2195         }
2196
2197       if (nm->num_workers > 1)
2198         tnm = vec_elt_at_index (nm->per_thread_data, m->workers[0]);
2199       else
2200         tnm = vec_elt_at_index (nm->per_thread_data, nm->num_workers);
2201
/* Remove the local-side key for this fib */
2202       init_nat_k (&kv, m->local_addr, m->local_port, fib_index, m->proto);
2203       clib_bihash_add_del_8_8 (&nm->static_mapping_by_local, &kv, 0);
2204
2205       /* Delete session(s) for static mapping if exist */
2206       if (!(nm->static_mapping_only) ||
2207           (nm->static_mapping_only && nm->static_mapping_connection_tracking))
2208         {
2209           u_key.addr = m->local_addr;
2210           u_key.fib_index = fib_index;
2211           kv.key = u_key.as_u64;
2212           nat44_ei_static_mapping_del_sessions (nm, tnm, u_key, addr_only,
2213                                                 e_addr, e_port);
2214         }
2215
/* Drop the FIB table lock; a mapping that still has entries in m->locals
   is kept and only this local is gone */
2216       fib_table_unlock (fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
2217       if (pool_elts (m->locals))
2218         return 0;
2219
2220       init_nat_k (&kv, m->external_addr, m->external_port, 0, m->proto);
2221       clib_bihash_add_del_8_8 (&nm->static_mapping_by_external, &kv, 0);
2222
2223       vec_free (m->tag);
2224       vec_free (m->workers);
2225       /* Delete static mapping from pool */
2226       pool_put (nm->static_mappings, m);
2227     }
2228
/* Only addr_only mappings whose local and external addresses differ touch
   the FIB */
2229   if (!addr_only || (l_addr.as_u32 == e_addr.as_u32))
2230     return 0;
2231
2232   /* Add/delete external address to FIB */
/* In each interface pool only the first interface not flagged as inside is
   used; nothing is done when nm->out2in_dpo is set */
2233   pool_foreach (interface, nm->interfaces)
2234     {
2235       if (nat44_ei_interface_is_inside (interface) || nm->out2in_dpo)
2236         continue;
2237
2238       nat44_ei_add_del_addr_to_fib (&e_addr, 32, interface->sw_if_index,
2239                                     is_add);
2240       break;
2241     }
2242   pool_foreach (interface, nm->output_feature_interfaces)
2243     {
2244       if (nat44_ei_interface_is_inside (interface) || nm->out2in_dpo)
2245         continue;
2246
2247       nat44_ei_add_del_addr_to_fib (&e_addr, 32, interface->sw_if_index,
2248                                     is_add);
2249       break;
2250     }
2251   return 0;
2252 }
2253
2254 int
2255 nat44_ei_static_mapping_match (ip4_address_t match_addr, u16 match_port,
2256                                u32 match_fib_index,
2257                                nat_protocol_t match_protocol,
2258                                ip4_address_t *mapping_addr, u16 *mapping_port,
2259                                u32 *mapping_fib_index, u8 by_external,
2260                                u8 *is_addr_only, u8 *is_identity_nat)
2261 {
2262   nat44_ei_main_t *nm = &nat44_ei_main;
2263   clib_bihash_kv_8_8_t kv, value;
2264   nat44_ei_static_mapping_t *m;
2265   u16 port;
2266
2267   if (by_external)
2268     {
2269       init_nat_k (&kv, match_addr, match_port, 0, match_protocol);
2270       if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
2271                                   &value))
2272         {
2273           /* Try address only mapping */
2274           init_nat_k (&kv, match_addr, 0, 0, 0);
2275           if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv,
2276                                       &value))
2277             return 1;
2278         }
2279       m = pool_elt_at_index (nm->static_mappings, value.value);
2280
2281       *mapping_fib_index = m->fib_index;
2282       *mapping_addr = m->local_addr;
2283       port = m->local_port;
2284     }
2285   else
2286     {
2287       init_nat_k (&kv, match_addr, match_port, match_fib_index,
2288                   match_protocol);
2289       if (clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv, &value))
2290         {
2291           /* Try address only mapping */
2292           init_nat_k (&kv, match_addr, 0, match_fib_index, 0);
2293           if (clib_bihash_search_8_8 (&nm->static_mapping_by_local, &kv,
2294                                       &value))
2295             return 1;
2296         }
2297       m = pool_elt_at_index (nm->static_mappings, value.value);
2298
2299       *mapping_fib_index = nm->outside_fib_index;
2300       *mapping_addr = m->external_addr;
2301       port = m->external_port;
2302     }
2303
2304   /* Address only mapping doesn't change port */
2305   if (nat44_ei_is_addr_only_static_mapping (m))
2306     *mapping_port = match_port;
2307   else
2308     *mapping_port = port;
2309
2310   if (PREDICT_FALSE (is_addr_only != 0))
2311     *is_addr_only = nat44_ei_is_addr_only_static_mapping (m);
2312
2313   if (PREDICT_FALSE (is_identity_nat != 0))
2314     *is_identity_nat = nat44_ei_is_identity_static_mapping (m);
2315
2316   return 0;
2317 }
2318
2319 static void
2320 nat44_ei_worker_db_free (nat44_ei_main_per_thread_data_t *tnm)
2321 {
2322   pool_free (tnm->list_pool);
2323   pool_free (tnm->lru_pool);
2324   pool_free (tnm->sessions);
2325   pool_free (tnm->users);
2326
2327   clib_bihash_free_8_8 (&tnm->user_hash);
2328 }
2329
2330 u8 *
2331 format_nat44_ei_key (u8 *s, va_list *args)
2332 {
2333   u64 key = va_arg (*args, u64);
2334
2335   ip4_address_t addr;
2336   u16 port;
2337   nat_protocol_t protocol;
2338   u32 fib_index;
2339
2340   split_nat_key (key, &addr, &port, &fib_index, &protocol);
2341
2342   s = format (s, "%U proto %U port %d fib %d", format_ip4_address, &addr,
2343               format_nat_protocol, protocol, clib_net_to_host_u16 (port),
2344               fib_index);
2345   return s;
2346 }
2347
2348 u8 *
2349 format_nat44_ei_user_kvp (u8 *s, va_list *args)
2350 {
2351   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2352   nat44_ei_user_key_t k;
2353
2354   k.as_u64 = v->key;
2355
2356   s = format (s, "%U fib %d user-index %llu", format_ip4_address, &k.addr,
2357               k.fib_index, v->value);
2358
2359   return s;
2360 }
2361
2362 u8 *
2363 format_nat44_ei_session_kvp (u8 *s, va_list *args)
2364 {
2365   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2366
2367   s = format (s, "%U thread-index %llu session-index %llu",
2368               format_nat44_ei_key, v->key, nat_value_get_thread_index (v),
2369               nat_value_get_session_index (v));
2370
2371   return s;
2372 }
2373
2374 u8 *
2375 format_nat44_ei_static_mapping_kvp (u8 *s, va_list *args)
2376 {
2377   clib_bihash_kv_8_8_t *v = va_arg (*args, clib_bihash_kv_8_8_t *);
2378
2379   s = format (s, "%U static-mapping-index %llu", format_nat44_ei_key, v->key,
2380               v->value);
2381
2382   return s;
2383 }
2384
2385 static void
2386 nat44_ei_worker_db_init (nat44_ei_main_per_thread_data_t *tnm,
2387                          u32 translations, u32 translation_buckets,
2388                          u32 user_buckets)
2389 {
2390   dlist_elt_t *head;
2391
2392   pool_alloc (tnm->list_pool, translations);
2393   pool_alloc (tnm->lru_pool, translations);
2394   pool_alloc (tnm->sessions, translations);
2395
2396   clib_bihash_init_8_8 (&tnm->user_hash, "users", user_buckets, 0);
2397
2398   clib_bihash_set_kvp_format_fn_8_8 (&tnm->user_hash,
2399                                      format_nat44_ei_user_kvp);
2400
2401   pool_get (tnm->lru_pool, head);
2402   tnm->tcp_trans_lru_head_index = head - tnm->lru_pool;
2403   clib_dlist_init (tnm->lru_pool, tnm->tcp_trans_lru_head_index);
2404
2405   pool_get (tnm->lru_pool, head);
2406   tnm->tcp_estab_lru_head_index = head - tnm->lru_pool;
2407   clib_dlist_init (tnm->lru_pool, tnm->tcp_estab_lru_head_index);
2408
2409   pool_get (tnm->lru_pool, head);
2410   tnm->udp_lru_head_index = head - tnm->lru_pool;
2411   clib_dlist_init (tnm->lru_pool, tnm->udp_lru_head_index);
2412
2413   pool_get (tnm->lru_pool, head);
2414   tnm->icmp_lru_head_index = head - tnm->lru_pool;
2415   clib_dlist_init (tnm->lru_pool, tnm->icmp_lru_head_index);
2416
2417   pool_get (tnm->lru_pool, head);
2418   tnm->unk_proto_lru_head_index = head - tnm->lru_pool;
2419   clib_dlist_init (tnm->lru_pool, tnm->unk_proto_lru_head_index);
2420 }
2421
2422 static void
2423 nat44_ei_db_free ()
2424 {
2425   nat44_ei_main_t *nm = &nat44_ei_main;
2426   nat44_ei_main_per_thread_data_t *tnm;
2427
2428   pool_free (nm->static_mappings);
2429   clib_bihash_free_8_8 (&nm->static_mapping_by_local);
2430   clib_bihash_free_8_8 (&nm->static_mapping_by_external);
2431
2432   if (nm->pat)
2433     {
2434       clib_bihash_free_8_8 (&nm->in2out);
2435       clib_bihash_free_8_8 (&nm->out2in);
2436       vec_foreach (tnm, nm->per_thread_data)
2437         {
2438           nat44_ei_worker_db_free (tnm);
2439         }
2440     }
2441 }
2442
2443 static void
2444 nat44_ei_db_init (u32 translations, u32 translation_buckets, u32 user_buckets)
2445 {
2446   nat44_ei_main_t *nm = &nat44_ei_main;
2447   nat44_ei_main_per_thread_data_t *tnm;
2448
2449   u32 static_mapping_buckets = 1024;
2450   u32 static_mapping_memory_size = 64 << 20;
2451
2452   clib_bihash_init_8_8 (&nm->static_mapping_by_local,
2453                         "static_mapping_by_local", static_mapping_buckets,
2454                         static_mapping_memory_size);
2455   clib_bihash_init_8_8 (&nm->static_mapping_by_external,
2456                         "static_mapping_by_external", static_mapping_buckets,
2457                         static_mapping_memory_size);
2458   clib_bihash_set_kvp_format_fn_8_8 (&nm->static_mapping_by_local,
2459                                      format_nat44_ei_static_mapping_kvp);
2460   clib_bihash_set_kvp_format_fn_8_8 (&nm->static_mapping_by_external,
2461                                      format_nat44_ei_static_mapping_kvp);
2462
2463   if (nm->pat)
2464     {
2465       clib_bihash_init_8_8 (&nm->in2out, "in2out", translation_buckets, 0);
2466       clib_bihash_init_8_8 (&nm->out2in, "out2in", translation_buckets, 0);
2467       clib_bihash_set_kvp_format_fn_8_8 (&nm->in2out,
2468                                          format_nat44_ei_session_kvp);
2469       clib_bihash_set_kvp_format_fn_8_8 (&nm->out2in,
2470                                          format_nat44_ei_session_kvp);
2471       vec_foreach (tnm, nm->per_thread_data)
2472         {
2473           nat44_ei_worker_db_init (tnm, translations, translation_buckets,
2474                                    user_buckets);
2475         }
2476     }
2477 }
2478
2479 void
2480 nat44_ei_sessions_clear ()
2481 {
2482   nat44_ei_main_t *nm = &nat44_ei_main;
2483   nat44_ei_main_per_thread_data_t *tnm;
2484
2485   if (nm->pat)
2486     {
2487       clib_bihash_free_8_8 (&nm->in2out);
2488       clib_bihash_free_8_8 (&nm->out2in);
2489       clib_bihash_init_8_8 (&nm->in2out, "in2out", nm->translation_buckets, 0);
2490       clib_bihash_init_8_8 (&nm->out2in, "out2in", nm->translation_buckets, 0);
2491       clib_bihash_set_kvp_format_fn_8_8 (&nm->in2out,
2492                                          format_nat44_ei_session_kvp);
2493       clib_bihash_set_kvp_format_fn_8_8 (&nm->out2in,
2494                                          format_nat44_ei_session_kvp);
2495       vec_foreach (tnm, nm->per_thread_data)
2496         {
2497           nat44_ei_worker_db_free (tnm);
2498           nat44_ei_worker_db_init (tnm, nm->translations,
2499                                    nm->translation_buckets, nm->user_buckets);
2500         }
2501     }
2502
2503   vlib_zero_simple_counter (&nm->total_users, 0);
2504   vlib_zero_simple_counter (&nm->total_sessions, 0);
2505   vlib_zero_simple_counter (&nm->user_limit_reached, 0);
2506 }
2507
2508 static void
2509 nat44_ei_update_outside_fib (ip4_main_t *im, uword opaque, u32 sw_if_index,
2510                              u32 new_fib_index, u32 old_fib_index)
2511 {
2512   nat44_ei_main_t *nm = &nat44_ei_main;
2513   nat44_ei_outside_fib_t *outside_fib;
2514   nat44_ei_interface_t *i;
2515   u8 is_add = 1;
2516   u8 match = 0;
2517
2518   if (!nm->enabled || (new_fib_index == old_fib_index) ||
2519       (!vec_len (nm->outside_fibs)))
2520     {
2521       return;
2522     }
2523
2524   pool_foreach (i, nm->interfaces)
2525     {
2526       if (i->sw_if_index == sw_if_index)
2527         {
2528           if (!(nat44_ei_interface_is_outside (i)))
2529             return;
2530           match = 1;
2531         }
2532     }
2533
2534   pool_foreach (i, nm->output_feature_interfaces)
2535     {
2536       if (i->sw_if_index == sw_if_index)
2537         {
2538           if (!(nat44_ei_interface_is_outside (i)))
2539             return;
2540           match = 1;
2541         }
2542     }
2543
2544   if (!match)
2545     return;
2546
2547   vec_foreach (outside_fib, nm->outside_fibs)
2548     {
2549       if (outside_fib->fib_index == old_fib_index)
2550         {
2551           outside_fib->refcount--;
2552           if (!outside_fib->refcount)
2553             vec_del1 (nm->outside_fibs, outside_fib - nm->outside_fibs);
2554           break;
2555         }
2556     }
2557
2558   vec_foreach (outside_fib, nm->outside_fibs)
2559     {
2560       if (outside_fib->fib_index == new_fib_index)
2561         {
2562           outside_fib->refcount++;
2563           is_add = 0;
2564           break;
2565         }
2566     }
2567
2568   if (is_add)
2569     {
2570       vec_add2 (nm->outside_fibs, outside_fib, 1);
2571       outside_fib->refcount = 1;
2572       outside_fib->fib_index = new_fib_index;
2573     }
2574 }
2575
2576 int
2577 nat44_ei_add_address (nat44_ei_main_t *nm, ip4_address_t *addr, u32 vrf_id)
2578 {
2579   nat44_ei_address_t *ap;
2580   nat44_ei_interface_t *i;
2581   vlib_thread_main_t *tm = vlib_get_thread_main ();
2582
2583   /* Check if address already exists */
2584   vec_foreach (ap, nm->addresses)
2585     {
2586       if (ap->addr.as_u32 == addr->as_u32)
2587         {
2588           nat44_ei_log_err ("address exist");
2589           return VNET_API_ERROR_VALUE_EXIST;
2590         }
2591     }
2592
2593   vec_add2 (nm->addresses, ap, 1);
2594
2595   ap->addr = *addr;
2596   if (vrf_id != ~0)
2597     ap->fib_index = fib_table_find_or_create_and_lock (
2598       FIB_PROTOCOL_IP4, vrf_id, nm->fib_src_low);
2599   else
2600     ap->fib_index = ~0;
2601
2602 #define _(N, i, n, s)                                                         \
2603   clib_memset (ap->busy_##n##_port_refcounts, 0,                              \
2604                sizeof (ap->busy_##n##_port_refcounts));                       \
2605   ap->busy_##n##_ports = 0;                                                   \
2606   ap->busy_##n##_ports_per_thread = 0;                                        \
2607   vec_validate_init_empty (ap->busy_##n##_ports_per_thread,                   \
2608                            tm->n_vlib_mains - 1, 0);
2609   foreach_nat_protocol
2610 #undef _
2611
2612     /* Add external address to FIB */
2613     pool_foreach (i, nm->interfaces)
2614   {
2615     if (nat44_ei_interface_is_inside (i) || nm->out2in_dpo)
2616       continue;
2617
2618     nat44_ei_add_del_addr_to_fib (addr, 32, i->sw_if_index, 1);
2619     break;
2620   }
2621   pool_foreach (i, nm->output_feature_interfaces)
2622     {
2623       if (nat44_ei_interface_is_inside (i) || nm->out2in_dpo)
2624         continue;
2625
2626       nat44_ei_add_del_addr_to_fib (addr, 32, i->sw_if_index, 1);
2627       break;
2628     }
2629
2630   return 0;
2631 }
2632
2633 int
2634 nat44_ei_add_interface_address (nat44_ei_main_t *nm, u32 sw_if_index,
2635                                 int is_del)
2636 {
2637   ip4_main_t *ip4_main = nm->ip4_main;
2638   ip4_address_t *first_int_addr;
2639   nat44_ei_static_map_resolve_t *rp;
2640   u32 *indices_to_delete = 0;
2641   int i, j;
2642   u32 *auto_add_sw_if_indices = nm->auto_add_sw_if_indices;
2643
2644   first_int_addr = ip4_interface_first_address (ip4_main, sw_if_index,
2645                                                 0 /* just want the address */);
2646
2647   for (i = 0; i < vec_len (auto_add_sw_if_indices); i++)
2648     {
2649       if (auto_add_sw_if_indices[i] == sw_if_index)
2650         {
2651           if (is_del)
2652             {
2653               /* if have address remove it */
2654               if (first_int_addr)
2655                 (void) nat44_ei_del_address (nm, first_int_addr[0], 1);
2656               else
2657                 {
2658                   for (j = 0; j < vec_len (nm->to_resolve); j++)
2659                     {
2660                       rp = nm->to_resolve + j;
2661                       if (rp->sw_if_index == sw_if_index)
2662                         vec_add1 (indices_to_delete, j);
2663                     }
2664                   if (vec_len (indices_to_delete))
2665                     {
2666                       for (j = vec_len (indices_to_delete) - 1; j >= 0; j--)
2667                         vec_del1 (nm->to_resolve, j);
2668                       vec_free (indices_to_delete);
2669                     }
2670                 }
2671               vec_del1 (nm->auto_add_sw_if_indices, i);
2672             }
2673           else
2674             return VNET_API_ERROR_VALUE_EXIST;
2675
2676           return 0;
2677         }
2678     }
2679
2680   if (is_del)
2681     return VNET_API_ERROR_NO_SUCH_ENTRY;
2682
2683   /* add to the auto-address list */
2684   vec_add1 (nm->auto_add_sw_if_indices, sw_if_index);
2685
2686   /* If the address is already bound - or static - add it now */
2687   if (first_int_addr)
2688     (void) nat44_ei_add_address (nm, first_int_addr, ~0);
2689
2690   return 0;
2691 }
2692
2693 static int
2694 nat44_ei_is_address_used_in_static_mapping (ip4_address_t addr)
2695 {
2696   nat44_ei_main_t *nm = &nat44_ei_main;
2697   nat44_ei_static_mapping_t *m;
2698   pool_foreach (m, nm->static_mappings)
2699     {
2700       if (nat44_ei_is_addr_only_static_mapping (m) ||
2701           nat44_ei_is_identity_static_mapping (m))
2702         continue;
2703       if (m->external_addr.as_u32 == addr.as_u32)
2704         return 1;
2705     }
2706   return 0;
2707 }
2708
2709 int
2710 nat44_ei_del_address (nat44_ei_main_t *nm, ip4_address_t addr, u8 delete_sm)
2711 {
2712   nat44_ei_address_t *a = 0;
2713   nat44_ei_session_t *ses;
2714   u32 *ses_to_be_removed = 0, *ses_index;
2715   nat44_ei_main_per_thread_data_t *tnm;
2716   nat44_ei_interface_t *interface;
2717   nat44_ei_static_mapping_t *m;
2718   int i;
2719
2720   /* Find SNAT address */
2721   for (i = 0; i < vec_len (nm->addresses); i++)
2722     {
2723       if (nm->addresses[i].addr.as_u32 == addr.as_u32)
2724         {
2725           a = nm->addresses + i;
2726           break;
2727         }
2728     }
2729   if (!a)
2730     {
2731       nat44_ei_log_err ("no such address");
2732       return VNET_API_ERROR_NO_SUCH_ENTRY;
2733     }
2734
2735   if (delete_sm)
2736     {
2737       pool_foreach (m, nm->static_mappings)
2738         {
2739           if (m->external_addr.as_u32 == addr.as_u32)
2740             (void) nat44_ei_add_del_static_mapping (
2741               m->local_addr, m->external_addr, m->local_port, m->external_port,
2742               m->proto, ~0 /* sw_if_index */, m->vrf_id,
2743               nat44_ei_is_addr_only_static_mapping (m),
2744               nat44_ei_is_identity_static_mapping (m), m->tag, 0);
2745         }
2746     }
2747   else
2748     {
2749       /* Check if address is used in some static mapping */
2750       if (nat44_ei_is_address_used_in_static_mapping (addr))
2751         {
2752           nat44_ei_log_err ("address used in static mapping");
2753           return VNET_API_ERROR_UNSPECIFIED;
2754         }
2755     }
2756
2757   if (a->fib_index != ~0)
2758     fib_table_unlock (a->fib_index, FIB_PROTOCOL_IP4, nm->fib_src_low);
2759
2760   /* Delete sessions using address */
2761   if (a->busy_tcp_ports || a->busy_udp_ports || a->busy_icmp_ports)
2762     {
2763       vec_foreach (tnm, nm->per_thread_data)
2764         {
2765           pool_foreach (ses, tnm->sessions)
2766             {
2767               if (ses->out2in.addr.as_u32 == addr.as_u32)
2768                 {
2769                   nat44_ei_free_session_data (nm, ses,
2770                                               tnm - nm->per_thread_data, 0);
2771                   vec_add1 (ses_to_be_removed, ses - tnm->sessions);
2772                 }
2773             }
2774           vec_foreach (ses_index, ses_to_be_removed)
2775             {
2776               ses = pool_elt_at_index (tnm->sessions, ses_index[0]);
2777               nat44_ei_delete_session (nm, ses, tnm - nm->per_thread_data);
2778             }
2779           vec_free (ses_to_be_removed);
2780         }
2781     }
2782
2783 #define _(N, i, n, s) vec_free (a->busy_##n##_ports_per_thread);
2784   foreach_nat_protocol
2785 #undef _
2786     vec_del1 (nm->addresses, i);
2787
2788   /* Delete external address from FIB */
2789   pool_foreach (interface, nm->interfaces)
2790     {
2791       if (nat44_ei_interface_is_inside (interface) || nm->out2in_dpo)
2792         continue;
2793       nat44_ei_add_del_addr_to_fib (&addr, 32, interface->sw_if_index, 0);
2794       break;
2795     }
2796
2797   pool_foreach (interface, nm->output_feature_interfaces)
2798     {
2799       if (nat44_ei_interface_is_inside (interface) || nm->out2in_dpo)
2800         continue;
2801       nat44_ei_add_del_addr_to_fib (&addr, 32, interface->sw_if_index, 0);
2802       break;
2803     }
2804
2805   return 0;
2806 }
2807
2808 static void
2809 nat44_ei_ip4_add_del_interface_address_cb (ip4_main_t *im, uword opaque,
2810                                            u32 sw_if_index,
2811                                            ip4_address_t *address,
2812                                            u32 address_length,
2813                                            u32 if_address_index, u32 is_delete)
2814 {
2815   nat44_ei_main_t *nm = &nat44_ei_main;
2816   nat44_ei_static_map_resolve_t *rp;
2817   ip4_address_t l_addr;
2818   int i, j;
2819   int rv;
2820   nat44_ei_address_t *addresses = nm->addresses;
2821
2822   if (!nm->enabled)
2823     return;
2824
2825   for (i = 0; i < vec_len (nm->auto_add_sw_if_indices); i++)
2826     {
2827       if (sw_if_index == nm->auto_add_sw_if_indices[i])
2828         goto match;
2829     }
2830
2831   return;
2832
2833 match:
2834   if (!is_delete)
2835     {
2836       /* Don't trip over lease renewal, static config */
2837       for (j = 0; j < vec_len (addresses); j++)
2838         if (addresses[j].addr.as_u32 == address->as_u32)
2839           return;
2840
2841       (void) nat44_ei_add_address (nm, address, ~0);
2842       /* Scan static map resolution vector */
2843       for (j = 0; j < vec_len (nm->to_resolve); j++)
2844         {
2845           rp = nm->to_resolve + j;
2846           if (rp->addr_only)
2847             continue;
2848           /* On this interface? */
2849           if (rp->sw_if_index == sw_if_index)
2850             {
2851               /* Indetity mapping? */
2852               if (rp->l_addr.as_u32 == 0)
2853                 l_addr.as_u32 = address[0].as_u32;
2854               else
2855                 l_addr.as_u32 = rp->l_addr.as_u32;
2856               /* Add the static mapping */
2857               rv = nat44_ei_add_del_static_mapping (
2858                 l_addr, address[0], rp->l_port, rp->e_port, rp->proto,
2859                 ~0 /* sw_if_index */, rp->vrf_id, rp->addr_only,
2860                 rp->identity_nat, rp->tag, 1);
2861               if (rv)
2862                 nat_elog_notice_X1 (
2863                   nm, "nat44_ei_add_del_static_mapping returned %d", "i4", rv);
2864             }
2865         }
2866       return;
2867     }
2868   else
2869     {
2870       (void) nat44_ei_del_address (nm, address[0], 1);
2871       return;
2872     }
2873 }
2874
2875 int
2876 nat44_ei_set_frame_queue_nelts (u32 frame_queue_nelts)
2877 {
2878   fail_if_enabled ();
2879   nat44_ei_main_t *nm = &nat44_ei_main;
2880   nm->frame_queue_nelts = frame_queue_nelts;
2881   return 0;
2882 }
2883
2884 static void
2885 nat44_ei_ip4_add_del_addr_only_sm_cb (ip4_main_t *im, uword opaque,
2886                                       u32 sw_if_index, ip4_address_t *address,
2887                                       u32 address_length, u32 if_address_index,
2888                                       u32 is_delete)
2889 {
2890   nat44_ei_main_t *nm = &nat44_ei_main;
2891   nat44_ei_static_map_resolve_t *rp;
2892   nat44_ei_static_mapping_t *m;
2893   clib_bihash_kv_8_8_t kv, value;
2894   int i, rv;
2895   ip4_address_t l_addr;
2896
2897   if (!nm->enabled)
2898     return;
2899
2900   for (i = 0; i < vec_len (nm->to_resolve); i++)
2901     {
2902       rp = nm->to_resolve + i;
2903       if (rp->addr_only == 0)
2904         continue;
2905       if (rp->sw_if_index == sw_if_index)
2906         goto match;
2907     }
2908
2909   return;
2910
2911 match:
2912   init_nat_k (&kv, *address, rp->addr_only ? 0 : rp->e_port,
2913               nm->outside_fib_index, rp->addr_only ? 0 : rp->proto);
2914   if (clib_bihash_search_8_8 (&nm->static_mapping_by_external, &kv, &value))
2915     m = 0;
2916   else
2917     m = pool_elt_at_index (nm->static_mappings, value.value);
2918
2919   if (!is_delete)
2920     {
2921       /* Don't trip over lease renewal, static config */
2922       if (m)
2923         return;
2924     }
2925   else
2926     {
2927       if (!m)
2928         return;
2929     }
2930
2931   /* Indetity mapping? */
2932   if (rp->l_addr.as_u32 == 0)
2933     l_addr.as_u32 = address[0].as_u32;
2934   else
2935     l_addr.as_u32 = rp->l_addr.as_u32;
2936   /* Add the static mapping */
2937
2938   rv = nat44_ei_add_del_static_mapping (
2939     l_addr, address[0], rp->l_port, rp->e_port, rp->proto,
2940     ~0 /* sw_if_index */, rp->vrf_id, rp->addr_only, rp->identity_nat, rp->tag,
2941     !is_delete);
2942   if (rv)
2943     nat_elog_notice_X1 (nm, "nat44_ei_add_del_static_mapping returned %d",
2944                         "i4", rv);
2945 }
2946
2947 static_always_inline uword
2948 nat44_ei_classify_inline_fn (vlib_main_t *vm, vlib_node_runtime_t *node,
2949                              vlib_frame_t *frame)
2950 {
2951   u32 n_left_from, *from, *to_next;
2952   nat44_ei_classify_next_t next_index;
2953   nat44_ei_main_t *nm = &nat44_ei_main;
2954   nat44_ei_static_mapping_t *m;
2955   u32 next_in2out = 0, next_out2in = 0;
2956
2957   from = vlib_frame_vector_args (frame);
2958   n_left_from = frame->n_vectors;
2959   next_index = node->cached_next_index;
2960
2961   while (n_left_from > 0)
2962     {
2963       u32 n_left_to_next;
2964
2965       vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
2966
2967       while (n_left_from > 0 && n_left_to_next > 0)
2968         {
2969           u32 bi0;
2970           vlib_buffer_t *b0;
2971           u32 next0 = NAT44_EI_CLASSIFY_NEXT_IN2OUT;
2972           ip4_header_t *ip0;
2973           nat44_ei_address_t *ap;
2974           clib_bihash_kv_8_8_t kv0, value0;
2975
2976           /* speculatively enqueue b0 to the current next frame */
2977           bi0 = from[0];
2978           to_next[0] = bi0;
2979           from += 1;
2980           to_next += 1;
2981           n_left_from -= 1;
2982           n_left_to_next -= 1;
2983
2984           b0 = vlib_get_buffer (vm, bi0);
2985           ip0 = vlib_buffer_get_current (b0);
2986
2987           vec_foreach (ap, nm->addresses)
2988             {
2989               if (ip0->dst_address.as_u32 == ap->addr.as_u32)
2990                 {
2991                   next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
2992                   goto enqueue0;
2993                 }
2994             }
2995
2996           if (PREDICT_FALSE (pool_elts (nm->static_mappings)))
2997             {
2998               init_nat_k (&kv0, ip0->dst_address, 0, 0, 0);
2999               /* try to classify the fragment based on IP header alone */
3000               if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external,
3001                                            &kv0, &value0))
3002                 {
3003                   m = pool_elt_at_index (nm->static_mappings, value0.value);
3004                   if (m->local_addr.as_u32 != m->external_addr.as_u32)
3005                     next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3006                   goto enqueue0;
3007                 }
3008               init_nat_k (&kv0, ip0->dst_address,
3009                           vnet_buffer (b0)->ip.reass.l4_dst_port, 0,
3010                           ip_proto_to_nat_proto (ip0->protocol));
3011               if (!clib_bihash_search_8_8 (&nm->static_mapping_by_external,
3012                                            &kv0, &value0))
3013                 {
3014                   m = pool_elt_at_index (nm->static_mappings, value0.value);
3015                   if (m->local_addr.as_u32 != m->external_addr.as_u32)
3016                     next0 = NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3017                 }
3018             }
3019
3020         enqueue0:
3021           if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE) &&
3022                              (b0->flags & VLIB_BUFFER_IS_TRACED)))
3023             {
3024               nat44_ei_classify_trace_t *t =
3025                 vlib_add_trace (vm, node, b0, sizeof (*t));
3026               t->cached = 0;
3027               t->next_in2out = next0 == NAT44_EI_CLASSIFY_NEXT_IN2OUT ? 1 : 0;
3028             }
3029
3030           next_in2out += next0 == NAT44_EI_CLASSIFY_NEXT_IN2OUT;
3031           next_out2in += next0 == NAT44_EI_CLASSIFY_NEXT_OUT2IN;
3032
3033           /* verify speculative enqueue, maybe switch current next frame */
3034           vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
3035                                            n_left_to_next, bi0, next0);
3036         }
3037
3038       vlib_put_next_frame (vm, node, next_index, n_left_to_next);
3039     }
3040
3041   vlib_node_increment_counter (
3042     vm, node->node_index, NAT44_EI_CLASSIFY_ERROR_NEXT_IN2OUT, next_in2out);
3043   vlib_node_increment_counter (
3044     vm, node->node_index, NAT44_EI_CLASSIFY_ERROR_NEXT_OUT2IN, next_out2in);
3045   return frame->n_vectors;
3046 }
3047
3048 VLIB_NODE_FN (nat44_ei_classify_node)
3049 (vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
3050 {
3051   return nat44_ei_classify_inline_fn (vm, node, frame);
3052 }
3053
3054 VLIB_REGISTER_NODE (nat44_ei_classify_node) = {
3055   .name = "nat44-ei-classify",
3056   .vector_size = sizeof (u32),
3057   .format_trace = format_nat44_ei_classify_trace,
3058   .type = VLIB_NODE_TYPE_INTERNAL,
3059   .n_errors = ARRAY_LEN(nat44_ei_classify_error_strings),
3060   .error_strings = nat44_ei_classify_error_strings,
3061   .n_next_nodes = NAT44_EI_CLASSIFY_N_NEXT,
3062   .next_nodes = {
3063     [NAT44_EI_CLASSIFY_NEXT_IN2OUT] = "nat44-ei-in2out",
3064     [NAT44_EI_CLASSIFY_NEXT_OUT2IN] = "nat44-ei-out2in",
3065     [NAT44_EI_CLASSIFY_NEXT_DROP] = "error-drop",
3066   },
3067 };
3068
3069 VLIB_NODE_FN (nat44_ei_handoff_classify_node)
3070 (vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
3071 {
3072   return nat44_ei_classify_inline_fn (vm, node, frame);
3073 }
3074
3075 VLIB_REGISTER_NODE (nat44_ei_handoff_classify_node) = {
3076   .name = "nat44-ei-handoff-classify",
3077   .vector_size = sizeof (u32),
3078   .format_trace = format_nat44_ei_classify_trace,
3079   .type = VLIB_NODE_TYPE_INTERNAL,
3080   .n_errors = ARRAY_LEN(nat44_ei_classify_error_strings),
3081   .error_strings = nat44_ei_classify_error_strings,
3082   .n_next_nodes = NAT44_EI_CLASSIFY_N_NEXT,
3083   .next_nodes = {
3084     [NAT44_EI_CLASSIFY_NEXT_IN2OUT] = "nat44-ei-in2out-worker-handoff",
3085     [NAT44_EI_CLASSIFY_NEXT_OUT2IN] = "nat44-ei-out2in-worker-handoff",
3086     [NAT44_EI_CLASSIFY_NEXT_DROP] = "error-drop",
3087   },
3088 };
3089
3090 /*
3091  * fd.io coding-style-patch-verification: ON
3092  *
3093  * Local Variables:
3094  * eval: (c-set-style "gnu")
3095  * End:
3096  */