virtio: enable the interrupt support for uio_pci_generic
[vpp.git] / src / plugins / nat / nat44-ed / nat44_ed_out2in.c
1 /*
2  * Copyright (c) 2018 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /**
16  * @file
17  * @brief NAT44 endpoint-dependent outside to inside network translation
18  */
19
20 #include <vlib/vlib.h>
21 #include <vnet/vnet.h>
22 #include <vnet/ip/ip.h>
23 #include <vnet/ethernet/ethernet.h>
24 #include <vnet/fib/ip4_fib.h>
25 #include <vnet/udp/udp_local.h>
26 #include <vppinfra/error.h>
27
28 #include <nat/lib/nat_syslog.h>
29 #include <nat/lib/ipfix_logging.h>
30
31 #include <nat/nat44-ed/nat44_ed.h>
32 #include <nat/nat44-ed/nat44_ed_inlines.h>
33
34 static char *nat_out2in_ed_error_strings[] = {
35 #define _(sym,string) string,
36   foreach_nat_out2in_ed_error
37 #undef _
38 };
39
40 typedef struct
41 {
42   u32 sw_if_index;
43   u32 next_index;
44   u32 session_index;
45   nat_translation_error_e translation_error;
46   nat_6t_flow_t i2of;
47   nat_6t_flow_t o2if;
48   clib_bihash_kv_16_8_t search_key;
49   u8 is_slow_path;
50   u8 translation_via_i2of;
51   u8 lookup_skipped;
52 } nat44_ed_out2in_trace_t;
53
54 static u8 *
55 format_nat44_ed_out2in_trace (u8 * s, va_list * args)
56 {
57   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
58   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
59   nat44_ed_out2in_trace_t *t = va_arg (*args, nat44_ed_out2in_trace_t *);
60   char *tag;
61
62   tag =
63     t->is_slow_path ? "NAT44_OUT2IN_ED_SLOW_PATH" :
64     "NAT44_OUT2IN_ED_FAST_PATH";
65
66   s = format (s, "%s: sw_if_index %d, next index %d, session %d", tag,
67               t->sw_if_index, t->next_index, t->session_index);
68   if (~0 != t->session_index)
69     {
70       s = format (s, ", translation result '%U' via %s",
71                   format_nat_ed_translation_error, t->translation_error,
72                   t->translation_via_i2of ? "i2of" : "o2if");
73       s = format (s, "\n  i2of %U", format_nat_6t_flow, &t->i2of);
74       s = format (s, "\n  o2if %U", format_nat_6t_flow, &t->o2if);
75     }
76   if (!t->is_slow_path)
77     {
78       if (t->lookup_skipped)
79         {
80           s = format (s, "\n lookup skipped - cached session index used");
81         }
82       else
83         {
84           s = format (s, "\n  search key %U", format_ed_session_kvp,
85                       &t->search_key);
86         }
87     }
88
89   return s;
90 }
91
92 static int
93 next_src_nat (snat_main_t *sm, ip4_header_t *ip, u16 src_port, u16 dst_port,
94               u32 thread_index, u32 rx_fib_index)
95 {
96   clib_bihash_kv_16_8_t kv, value;
97
98   init_ed_k (&kv, ip->src_address, src_port, ip->dst_address, dst_port,
99              rx_fib_index, ip->protocol);
100   if (!clib_bihash_search_16_8 (&sm->flow_hash, &kv, &value))
101     return 1;
102
103   return 0;
104 }
105
106 static void create_bypass_for_fwd (snat_main_t *sm, vlib_buffer_t *b,
107                                    snat_session_t *s, ip4_header_t *ip,
108                                    u32 rx_fib_index, u32 thread_index);
109
110 static snat_session_t *create_session_for_static_mapping_ed (
111   snat_main_t *sm, vlib_buffer_t *b, ip4_address_t i2o_addr, u16 i2o_port,
112   u32 i2o_fib_index, ip4_address_t o2i_addr, u16 o2i_port, u32 o2i_fib_index,
113   nat_protocol_t nat_proto, vlib_node_runtime_t *node, u32 rx_fib_index,
114   u32 thread_index, twice_nat_type_t twice_nat, lb_nat_type_t lb_nat, f64 now,
115   snat_static_mapping_t *mapping);
116
117 static inline u32
118 icmp_out2in_ed_slow_path (snat_main_t *sm, vlib_buffer_t *b, ip4_header_t *ip,
119                           icmp46_header_t *icmp, u32 sw_if_index,
120                           u32 rx_fib_index, vlib_node_runtime_t *node,
121                           u32 next, f64 now, u32 thread_index,
122                           snat_session_t **s_p)
123 {
124   vlib_main_t *vm = vlib_get_main ();
125
126   ip_csum_t sum;
127   u16 checksum;
128
129   snat_session_t *s = 0;
130   u8 is_addr_only, identity_nat;
131   ip4_address_t sm_addr;
132   u16 sm_port;
133   u32 sm_fib_index;
134   snat_static_mapping_t *m;
135   u8 lookup_protocol;
136   ip4_address_t lookup_saddr, lookup_daddr;
137   u16 lookup_sport, lookup_dport;
138
139   sw_if_index = vnet_buffer (b)->sw_if_index[VLIB_RX];
140   rx_fib_index = ip4_fib_table_get_index_for_sw_if_index (sw_if_index);
141
142   if (nat_get_icmp_session_lookup_values (b, ip, &lookup_saddr, &lookup_sport,
143                                           &lookup_daddr, &lookup_dport,
144                                           &lookup_protocol))
145     {
146       b->error = node->errors[NAT_OUT2IN_ED_ERROR_UNSUPPORTED_PROTOCOL];
147       next = NAT_NEXT_DROP;
148       goto out;
149     }
150
151   if (snat_static_mapping_match (
152         sm, ip->dst_address, lookup_sport, rx_fib_index,
153         ip_proto_to_nat_proto (ip->protocol), &sm_addr, &sm_port,
154         &sm_fib_index, 1, &is_addr_only, 0, 0, 0, &identity_nat, &m))
155     {
156       // static mapping not matched
157       if (!sm->forwarding_enabled)
158         {
159           /* Don't NAT packet aimed at the intfc address */
160           if (!is_interface_addr (sm, node, sw_if_index,
161                                   ip->dst_address.as_u32))
162             {
163               b->error = node->errors[NAT_OUT2IN_ED_ERROR_NO_TRANSLATION];
164               next = NAT_NEXT_DROP;
165             }
166         }
167       else
168         {
169           if (next_src_nat (sm, ip, lookup_sport, lookup_dport, thread_index,
170                             rx_fib_index))
171             {
172               next = NAT_NEXT_IN2OUT_ED_FAST_PATH;
173             }
174           else
175             {
176               create_bypass_for_fwd (sm, b, s, ip, rx_fib_index, thread_index);
177             }
178         }
179       goto out;
180     }
181
182   if (PREDICT_FALSE (vnet_buffer (b)->ip.reass.icmp_type_or_tcp_flags !=
183                        ICMP4_echo_reply &&
184                      (vnet_buffer (b)->ip.reass.icmp_type_or_tcp_flags !=
185                         ICMP4_echo_request ||
186                       !is_addr_only)))
187     {
188       b->error = node->errors[NAT_OUT2IN_ED_ERROR_BAD_ICMP_TYPE];
189       next = NAT_NEXT_DROP;
190       goto out;
191     }
192
193   if (PREDICT_FALSE (identity_nat))
194     {
195       goto out;
196     }
197
198   /* Create session initiated by host from external network */
199   s = create_session_for_static_mapping_ed (
200     sm, b, sm_addr, sm_port, sm_fib_index, ip->dst_address, lookup_sport,
201     rx_fib_index, ip_proto_to_nat_proto (lookup_protocol), node, rx_fib_index,
202     thread_index, 0, 0, vlib_time_now (vm), m);
203   if (!s)
204     next = NAT_NEXT_DROP;
205
206   if (PREDICT_TRUE (!ip4_is_fragment (ip)))
207     {
208       sum = ip_incremental_checksum_buffer (
209         vm, b, (u8 *) icmp - (u8 *) vlib_buffer_get_current (b),
210         ntohs (ip->length) - ip4_header_bytes (ip), 0);
211       checksum = ~ip_csum_fold (sum);
212       if (checksum != 0 && checksum != 0xffff)
213         {
214           next = NAT_NEXT_DROP;
215           goto out;
216         }
217     }
218
219   if (PREDICT_TRUE (next != NAT_NEXT_DROP && s))
220     {
221       /* Accounting */
222       nat44_session_update_counters (
223         s, now, vlib_buffer_length_in_chain (vm, b), thread_index);
224       /* Per-user LRU list maintenance */
225       nat44_session_update_lru (sm, s, thread_index);
226     }
227 out:
228   if (NAT_NEXT_DROP == next && s)
229     {
230       nat_ed_session_delete (sm, s, thread_index, 1);
231       s = 0;
232     }
233   *s_p = s;
234   return next;
235 }
236
237 // allocate exact address based on preference
238 static_always_inline int
239 nat_alloc_addr_and_port_exact (snat_address_t * a,
240                                u32 thread_index,
241                                nat_protocol_t proto,
242                                ip4_address_t * addr,
243                                u16 * port,
244                                u16 port_per_thread, u32 snat_thread_index)
245 {
246   snat_main_t *sm = &snat_main;
247   u32 portnum;
248
249   switch (proto)
250     {
251 #define _(N, j, n, s) \
252     case NAT_PROTOCOL_##N: \
253       if (a->busy_##n##_ports_per_thread[thread_index] < port_per_thread) \
254         { \
255           while (1) \
256             { \
257               portnum = (port_per_thread * \
258                 snat_thread_index) + \
259                 snat_random_port(0, port_per_thread - 1) + 1024; \
260               if (a->busy_##n##_port_refcounts[portnum]) \
261                 continue; \
262               --a->busy_##n##_port_refcounts[portnum]; \
263               a->busy_##n##_ports_per_thread[thread_index]++; \
264               a->busy_##n##_ports++; \
265               *addr = a->addr; \
266               *port = clib_host_to_net_u16(portnum); \
267               return 0; \
268             } \
269         } \
270       break;
271       foreach_nat_protocol
272 #undef _
273         default : nat_elog_info (sm, "unknown protocol");
274       return 1;
275     }
276
277   /* Totally out of translations to use... */
278   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
279   return 1;
280 }
281
282 static_always_inline int
283 nat44_ed_alloc_outside_addr_and_port (snat_address_t *addresses, u32 fib_index,
284                                       u32 thread_index, nat_protocol_t proto,
285                                       ip4_address_t *addr, u16 *port,
286                                       u16 port_per_thread,
287                                       u32 snat_thread_index)
288 {
289   snat_main_t *sm = &snat_main;
290   snat_address_t *a, *ga = 0;
291   u32 portnum;
292   int i;
293
294   for (i = 0; i < vec_len (addresses); i++)
295     {
296       a = addresses + i;
297       switch (proto)
298         {
299 #define _(N, j, n, s)                                                         \
300   case NAT_PROTOCOL_##N:                                                      \
301     if (a->busy_##n##_ports_per_thread[thread_index] < port_per_thread)       \
302       {                                                                       \
303         if (a->fib_index == fib_index)                                        \
304           {                                                                   \
305             while (1)                                                         \
306               {                                                               \
307                 portnum = (port_per_thread * snat_thread_index) +             \
308                           snat_random_port (0, port_per_thread - 1) + 1024;   \
309                 if (a->busy_##n##_port_refcounts[portnum])                    \
310                   continue;                                                   \
311                 --a->busy_##n##_port_refcounts[portnum];                      \
312                 a->busy_##n##_ports_per_thread[thread_index]++;               \
313                 a->busy_##n##_ports++;                                        \
314                 *addr = a->addr;                                              \
315                 *port = clib_host_to_net_u16 (portnum);                       \
316                 return 0;                                                     \
317               }                                                               \
318           }                                                                   \
319         else if (a->fib_index == ~0)                                          \
320           {                                                                   \
321             ga = a;                                                           \
322           }                                                                   \
323       }                                                                       \
324     break;
325           foreach_nat_protocol
326 #undef _
327             default : nat_elog_info (sm, "unknown protocol");
328           return 1;
329         }
330     }
331
332   if (ga)
333     {
334       a = ga;
335       switch (proto)
336         {
337 #define _(N, j, n, s)                                                         \
338   case NAT_PROTOCOL_##N:                                                      \
339     while (1)                                                                 \
340       {                                                                       \
341         portnum = (port_per_thread * snat_thread_index) +                     \
342                   snat_random_port (0, port_per_thread - 1) + 1024;           \
343         if (a->busy_##n##_port_refcounts[portnum])                            \
344           continue;                                                           \
345         ++a->busy_##n##_port_refcounts[portnum];                              \
346         a->busy_##n##_ports_per_thread[thread_index]++;                       \
347         a->busy_##n##_ports++;                                                \
348         *addr = a->addr;                                                      \
349         *port = clib_host_to_net_u16 (portnum);                               \
350         return 0;                                                             \
351       }
352           break;
353           foreach_nat_protocol
354 #undef _
355             default : nat_elog_info (sm, "unknown protocol");
356           return 1;
357         }
358     }
359
360   /* Totally out of translations to use... */
361   nat_ipfix_logging_addresses_exhausted (thread_index, 0);
362   return 1;
363 }
364
365 static snat_session_t *
366 create_session_for_static_mapping_ed (
367   snat_main_t *sm, vlib_buffer_t *b, ip4_address_t i2o_addr, u16 i2o_port,
368   u32 i2o_fib_index, ip4_address_t o2i_addr, u16 o2i_port, u32 o2i_fib_index,
369   nat_protocol_t nat_proto, vlib_node_runtime_t *node, u32 rx_fib_index,
370   u32 thread_index, twice_nat_type_t twice_nat, lb_nat_type_t lb_nat, f64 now,
371   snat_static_mapping_t *mapping)
372 {
373   snat_session_t *s;
374   ip4_header_t *ip;
375   udp_header_t *udp;
376   snat_main_per_thread_data_t *tsm = &sm->per_thread_data[thread_index];
377
378   if (PREDICT_FALSE
379       (nat44_ed_maximum_sessions_exceeded (sm, rx_fib_index, thread_index)))
380     {
381       b->error = node->errors[NAT_OUT2IN_ED_ERROR_MAX_SESSIONS_EXCEEDED];
382       nat_elog_notice (sm, "maximum sessions exceeded");
383       return 0;
384     }
385
386   s = nat_ed_session_alloc (sm, thread_index, now, nat_proto);
387   if (!s)
388     {
389       b->error = node->errors[NAT_OUT2IN_ED_ERROR_MAX_SESSIONS_EXCEEDED];
390       nat_elog_warn (sm, "create NAT session failed");
391       return 0;
392     }
393
394   ip = vlib_buffer_get_current (b);
395   udp = ip4_next_header (ip);
396
397   s->ext_host_addr.as_u32 = ip->src_address.as_u32;
398   s->ext_host_port = nat_proto == NAT_PROTOCOL_ICMP ? 0 : udp->src_port;
399   s->flags |= SNAT_SESSION_FLAG_STATIC_MAPPING;
400   if (lb_nat)
401     s->flags |= SNAT_SESSION_FLAG_LOAD_BALANCING;
402   if (lb_nat == AFFINITY_LB_NAT)
403     s->flags |= SNAT_SESSION_FLAG_AFFINITY;
404   s->flags |= SNAT_SESSION_FLAG_ENDPOINT_DEPENDENT;
405   s->out2in.addr = o2i_addr;
406   s->out2in.port = o2i_port;
407   s->out2in.fib_index = o2i_fib_index;
408   s->in2out.addr = i2o_addr;
409   s->in2out.port = i2o_port;
410   s->in2out.fib_index = i2o_fib_index;
411   s->nat_proto = nat_proto;
412
413   if (NAT_PROTOCOL_ICMP == nat_proto)
414     {
415       nat_6t_o2i_flow_init (sm, thread_index, s, s->ext_host_addr, o2i_port,
416                             o2i_addr, o2i_port, o2i_fib_index, ip->protocol);
417       nat_6t_flow_icmp_id_rewrite_set (&s->o2i, i2o_port);
418     }
419   else
420     {
421       nat_6t_o2i_flow_init (sm, thread_index, s, s->ext_host_addr,
422                             s->ext_host_port, o2i_addr, o2i_port,
423                             o2i_fib_index, ip->protocol);
424       nat_6t_flow_dport_rewrite_set (&s->o2i, i2o_port);
425     }
426   nat_6t_flow_daddr_rewrite_set (&s->o2i, i2o_addr.as_u32);
427   nat_6t_flow_txfib_rewrite_set (&s->o2i, i2o_fib_index);
428
429   if (nat_ed_ses_o2i_flow_hash_add_del (sm, thread_index, s, 1))
430     {
431       b->error = node->errors[NAT_OUT2IN_ED_ERROR_HASH_ADD_FAILED];
432       nat_ed_session_delete (sm, s, thread_index, 1);
433       nat_elog_warn (sm, "out2in flow hash add failed");
434       return 0;
435     }
436
437   if (twice_nat == TWICE_NAT || (twice_nat == TWICE_NAT_SELF &&
438                                  ip->src_address.as_u32 == i2o_addr.as_u32))
439     {
440       int rc = 0;
441       snat_address_t *filter = 0;
442
443       // if exact address is specified use this address
444       if (is_exact_address (mapping))
445         {
446           snat_address_t *ap;
447           vec_foreach (ap, sm->twice_nat_addresses)
448           {
449             if (mapping->pool_addr.as_u32 == ap->addr.as_u32)
450               {
451                 filter = ap;
452                 break;
453               }
454           }
455         }
456
457       if (filter)
458         {
459           rc = nat_alloc_addr_and_port_exact (filter,
460                                               thread_index,
461                                               nat_proto,
462                                               &s->ext_host_nat_addr,
463                                               &s->ext_host_nat_port,
464                                               sm->port_per_thread,
465                                               tsm->snat_thread_index);
466           s->flags |= SNAT_SESSION_FLAG_EXACT_ADDRESS;
467         }
468       else
469         {
470           rc = nat44_ed_alloc_outside_addr_and_port (
471             sm->twice_nat_addresses, 0, thread_index, nat_proto,
472             &s->ext_host_nat_addr, &s->ext_host_nat_port, sm->port_per_thread,
473             tsm->snat_thread_index);
474         }
475
476       if (rc)
477         {
478           b->error = node->errors[NAT_OUT2IN_ED_ERROR_OUT_OF_PORTS];
479           if (nat_ed_ses_o2i_flow_hash_add_del (sm, thread_index, s, 0))
480             {
481               nat_elog_warn (sm, "out2in flow hash del failed");
482             }
483           snat_free_outside_address_and_port (
484             sm->twice_nat_addresses, thread_index, &s->ext_host_nat_addr,
485             s->ext_host_nat_port, s->nat_proto);
486           nat_ed_session_delete (sm, s, thread_index, 1);
487           return 0;
488         }
489
490       s->flags |= SNAT_SESSION_FLAG_TWICE_NAT;
491
492       nat_6t_flow_saddr_rewrite_set (&s->o2i, s->ext_host_nat_addr.as_u32);
493       if (NAT_PROTOCOL_ICMP == nat_proto)
494         {
495           nat_6t_flow_icmp_id_rewrite_set (&s->o2i, s->ext_host_nat_port);
496         }
497       else
498         {
499           nat_6t_flow_sport_rewrite_set (&s->o2i, s->ext_host_nat_port);
500         }
501
502       nat_6t_l3_l4_csum_calc (&s->o2i);
503
504       nat_6t_i2o_flow_init (sm, thread_index, s, i2o_addr, i2o_port,
505                             s->ext_host_nat_addr, s->ext_host_nat_port,
506                             i2o_fib_index, ip->protocol);
507       nat_6t_flow_daddr_rewrite_set (&s->i2o, s->ext_host_addr.as_u32);
508       if (NAT_PROTOCOL_ICMP == nat_proto)
509         {
510           nat_6t_flow_icmp_id_rewrite_set (&s->i2o, s->ext_host_port);
511         }
512       else
513         {
514           nat_6t_flow_dport_rewrite_set (&s->i2o, s->ext_host_port);
515         }
516     }
517   else
518     {
519       if (NAT_PROTOCOL_ICMP == nat_proto)
520         {
521           nat_6t_i2o_flow_init (sm, thread_index, s, i2o_addr, i2o_port,
522                                 s->ext_host_addr, i2o_port, i2o_fib_index,
523                                 ip->protocol);
524         }
525       else
526         {
527           nat_6t_i2o_flow_init (sm, thread_index, s, i2o_addr, i2o_port,
528                                 s->ext_host_addr, s->ext_host_port,
529                                 i2o_fib_index, ip->protocol);
530         }
531     }
532
533   nat_6t_flow_saddr_rewrite_set (&s->i2o, o2i_addr.as_u32);
534   if (NAT_PROTOCOL_ICMP == nat_proto)
535     {
536       nat_6t_flow_icmp_id_rewrite_set (&s->i2o, o2i_port);
537     }
538   else
539     {
540       nat_6t_flow_sport_rewrite_set (&s->i2o, o2i_port);
541     }
542
543   if (nat_ed_ses_i2o_flow_hash_add_del (sm, thread_index, s, 1))
544     {
545       nat_elog_notice (sm, "in2out flow hash add failed");
546       if (nat_ed_ses_o2i_flow_hash_add_del (sm, thread_index, s, 0))
547         {
548           nat_elog_warn (sm, "out2in flow hash del failed");
549         }
550       nat_ed_session_delete (sm, s, thread_index, 1);
551       return 0;
552     }
553
554   nat_ipfix_logging_nat44_ses_create (thread_index,
555                                       s->in2out.addr.as_u32,
556                                       s->out2in.addr.as_u32,
557                                       s->nat_proto,
558                                       s->in2out.port,
559                                       s->out2in.port, s->in2out.fib_index);
560
561   nat_syslog_nat44_sadd (0, s->in2out.fib_index, &s->in2out.addr,
562                          s->in2out.port, &s->ext_host_nat_addr,
563                          s->ext_host_nat_port, &s->out2in.addr, s->out2in.port,
564                          &s->ext_host_addr, s->ext_host_port, s->nat_proto,
565                          is_twice_nat_session (s));
566
567   per_vrf_sessions_register_session (s, thread_index);
568
569   return s;
570 }
571
572 static void
573 create_bypass_for_fwd (snat_main_t *sm, vlib_buffer_t *b, snat_session_t *s,
574                        ip4_header_t *ip, u32 rx_fib_index, u32 thread_index)
575 {
576   clib_bihash_kv_16_8_t kv, value;
577   udp_header_t *udp;
578   snat_main_per_thread_data_t *tsm = &sm->per_thread_data[thread_index];
579   vlib_main_t *vm = vlib_get_main ();
580   f64 now = vlib_time_now (vm);
581   u16 lookup_sport, lookup_dport;
582   u8 lookup_protocol;
583   ip4_address_t lookup_saddr, lookup_daddr;
584
585   if (ip->protocol == IP_PROTOCOL_ICMP)
586     {
587       if (nat_get_icmp_session_lookup_values (b, ip, &lookup_saddr,
588                                               &lookup_sport, &lookup_daddr,
589                                               &lookup_dport, &lookup_protocol))
590         return;
591     }
592   else
593     {
594       if (ip->protocol == IP_PROTOCOL_UDP || ip->protocol == IP_PROTOCOL_TCP)
595         {
596           udp = ip4_next_header (ip);
597           lookup_sport = udp->dst_port;
598           lookup_dport = udp->src_port;
599         }
600       else
601         {
602           lookup_sport = 0;
603           lookup_dport = 0;
604         }
605       lookup_saddr.as_u32 = ip->dst_address.as_u32;
606       lookup_daddr.as_u32 = ip->src_address.as_u32;
607       lookup_protocol = ip->protocol;
608     }
609
610   init_ed_k (&kv, lookup_saddr, lookup_sport, lookup_daddr, lookup_dport,
611              rx_fib_index, lookup_protocol);
612
613   if (!clib_bihash_search_16_8 (&sm->flow_hash, &kv, &value))
614     {
615       ASSERT (thread_index == ed_value_get_thread_index (&value));
616       s =
617         pool_elt_at_index (tsm->sessions,
618                            ed_value_get_session_index (&value));
619     }
620   else if (ip->protocol == IP_PROTOCOL_ICMP &&
621            icmp_type_is_error_message
622            (vnet_buffer (b)->ip.reass.icmp_type_or_tcp_flags))
623     {
624       return;
625     }
626   else
627     {
628       u32 proto;
629
630       if (PREDICT_FALSE
631           (nat44_ed_maximum_sessions_exceeded
632            (sm, rx_fib_index, thread_index)))
633         return;
634
635       s = nat_ed_session_alloc (sm, thread_index, now, ip->protocol);
636       if (!s)
637         {
638           nat_elog_warn (sm, "create NAT session failed");
639           return;
640         }
641
642       proto = ip_proto_to_nat_proto (ip->protocol);
643
644       s->ext_host_addr = ip->src_address;
645       s->ext_host_port = lookup_dport;
646       s->flags |= SNAT_SESSION_FLAG_FWD_BYPASS;
647       s->out2in.addr = ip->dst_address;
648       s->out2in.port = lookup_sport;
649       s->nat_proto = proto;
650       if (proto == NAT_PROTOCOL_OTHER)
651         {
652           s->flags |= SNAT_SESSION_FLAG_UNKNOWN_PROTO;
653           s->out2in.port = ip->protocol;
654         }
655       s->out2in.fib_index = rx_fib_index;
656       s->in2out.addr = s->out2in.addr;
657       s->in2out.port = s->out2in.port;
658       s->in2out.fib_index = s->out2in.fib_index;
659
660       nat_6t_i2o_flow_init (sm, thread_index, s, ip->dst_address, lookup_sport,
661                             ip->src_address, lookup_dport, rx_fib_index,
662                             ip->protocol);
663       nat_6t_flow_txfib_rewrite_set (&s->i2o, rx_fib_index);
664       if (nat_ed_ses_i2o_flow_hash_add_del (sm, thread_index, s, 1))
665         {
666           nat_elog_notice (sm, "in2out flow add failed");
667           nat_ed_session_delete (sm, s, thread_index, 1);
668           return;
669         }
670
671       per_vrf_sessions_register_session (s, thread_index);
672     }
673
674   if (ip->protocol == IP_PROTOCOL_TCP)
675     {
676       tcp_header_t *tcp = ip4_next_header (ip);
677       nat44_set_tcp_session_state_o2i (sm, now, s, tcp->flags,
678                                        tcp->ack_number, tcp->seq_number,
679                                        thread_index);
680     }
681
682   /* Accounting */
683   nat44_session_update_counters (s, now, 0, thread_index);
684   /* Per-user LRU list maintenance */
685   nat44_session_update_lru (sm, s, thread_index);
686 }
687
688 static snat_session_t *
689 nat44_ed_out2in_slowpath_unknown_proto (snat_main_t *sm, vlib_buffer_t *b,
690                                         ip4_header_t *ip, u32 rx_fib_index,
691                                         u32 thread_index, f64 now,
692                                         vlib_main_t *vm,
693                                         vlib_node_runtime_t *node)
694 {
695   clib_bihash_kv_8_8_t kv, value;
696   snat_static_mapping_t *m;
697   snat_session_t *s;
698
699   if (PREDICT_FALSE (
700         nat44_ed_maximum_sessions_exceeded (sm, rx_fib_index, thread_index)))
701     {
702       b->error = node->errors[NAT_OUT2IN_ED_ERROR_MAX_SESSIONS_EXCEEDED];
703       nat_elog_notice (sm, "maximum sessions exceeded");
704       return 0;
705     }
706
707   init_nat_k (&kv, ip->dst_address, 0, 0, 0);
708   if (clib_bihash_search_8_8 (&sm->static_mapping_by_external, &kv, &value))
709     {
710       b->error = node->errors[NAT_OUT2IN_ED_ERROR_NO_TRANSLATION];
711       return 0;
712     }
713
714   m = pool_elt_at_index (sm->static_mappings, value.value);
715
716   /* Create a new session */
717   s = nat_ed_session_alloc (sm, thread_index, now, ip->protocol);
718   if (!s)
719     {
720       b->error = node->errors[NAT_OUT2IN_ED_ERROR_MAX_SESSIONS_EXCEEDED];
721       nat_elog_warn (sm, "create NAT session failed");
722       return 0;
723     }
724
725   s->ext_host_addr.as_u32 = ip->src_address.as_u32;
726   s->flags |= SNAT_SESSION_FLAG_UNKNOWN_PROTO;
727   s->flags |= SNAT_SESSION_FLAG_STATIC_MAPPING;
728   s->flags |= SNAT_SESSION_FLAG_ENDPOINT_DEPENDENT;
729   s->out2in.addr.as_u32 = ip->dst_address.as_u32;
730   s->out2in.fib_index = rx_fib_index;
731   s->in2out.addr.as_u32 = m->local_addr.as_u32;
732   s->in2out.fib_index = m->fib_index;
733   s->in2out.port = s->out2in.port = ip->protocol;
734
735   nat_6t_o2i_flow_init (sm, thread_index, s, ip->dst_address, 0,
736                         ip->src_address, 0, m->fib_index, ip->protocol);
737   nat_6t_flow_saddr_rewrite_set (&s->i2o, ip->dst_address.as_u32);
738   if (nat_ed_ses_i2o_flow_hash_add_del (sm, thread_index, s, 1))
739     {
740       nat_elog_notice (sm, "in2out key add failed");
741       nat_ed_session_delete (sm, s, thread_index, 1);
742       return NULL;
743     }
744
745   nat_6t_o2i_flow_init (sm, thread_index, s, ip->src_address, 0,
746                         ip->dst_address, 0, rx_fib_index, ip->protocol);
747   nat_6t_flow_daddr_rewrite_set (&s->o2i, m->local_addr.as_u32);
748   nat_6t_flow_txfib_rewrite_set (&s->o2i, m->fib_index);
749   if (nat_ed_ses_o2i_flow_hash_add_del (sm, thread_index, s, 1))
750     {
751       nat_elog_notice (sm, "out2in flow hash add failed");
752       nat_ed_session_delete (sm, s, thread_index, 1);
753       return NULL;
754     }
755
756   per_vrf_sessions_register_session (s, thread_index);
757
758   /* Accounting */
759   nat44_session_update_counters (s, now, vlib_buffer_length_in_chain (vm, b),
760                                  thread_index);
761   /* Per-user LRU list maintenance */
762   nat44_session_update_lru (sm, s, thread_index);
763
764   return s;
765 }
766
767 static inline uword
768 nat44_ed_out2in_fast_path_node_fn_inline (vlib_main_t * vm,
769                                           vlib_node_runtime_t * node,
770                                           vlib_frame_t * frame,
771                                           int is_multi_worker)
772 {
773   u32 n_left_from, *from;
774   snat_main_t *sm = &snat_main;
775   f64 now = vlib_time_now (vm);
776   u32 thread_index = vm->thread_index;
777   snat_main_per_thread_data_t *tsm = &sm->per_thread_data[thread_index];
778
779   from = vlib_frame_vector_args (frame);
780   n_left_from = frame->n_vectors;
781
782   vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
783   u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
784   vlib_get_buffers (vm, from, b, n_left_from);
785
786   while (n_left_from > 0)
787     {
788       vlib_buffer_t *b0;
789       u32 sw_if_index0, rx_fib_index0;
790       nat_protocol_t proto0;
791       ip4_header_t *ip0;
792       snat_session_t *s0 = 0;
793       clib_bihash_kv_16_8_t kv0, value0;
794       nat_translation_error_e translation_error = NAT_ED_TRNSL_ERR_SUCCESS;
795       nat_6t_flow_t *f = 0;
796       ip4_address_t lookup_saddr, lookup_daddr;
797       u16 lookup_sport, lookup_dport;
798       u8 lookup_protocol;
799       int lookup_skipped = 0;
800
801       b0 = *b;
802       b++;
803
804       lookup_sport = vnet_buffer (b0)->ip.reass.l4_src_port;
805       lookup_dport = vnet_buffer (b0)->ip.reass.l4_dst_port;
806
807       /* Prefetch next iteration. */
808       if (PREDICT_TRUE (n_left_from >= 2))
809         {
810           vlib_buffer_t *p2;
811
812           p2 = *b;
813
814           vlib_prefetch_buffer_header (p2, LOAD);
815
816           CLIB_PREFETCH (p2->data, CLIB_CACHE_LINE_BYTES, LOAD);
817         }
818
819       next[0] = vnet_buffer2 (b0)->nat.arc_next;
820
821       vnet_buffer (b0)->snat.flags = 0;
822       ip0 = vlib_buffer_get_current (b0);
823
824       sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX];
825       rx_fib_index0 =
826         fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index0);
827
828       if (PREDICT_FALSE (ip0->ttl == 1))
829         {
830           vnet_buffer (b0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
831           icmp4_error_set_vnet_buffer (b0, ICMP4_time_exceeded,
832                                        ICMP4_time_exceeded_ttl_exceeded_in_transit,
833                                        0);
834           next[0] = NAT_NEXT_ICMP_ERROR;
835           goto trace0;
836         }
837
838       proto0 = ip_proto_to_nat_proto (ip0->protocol);
839
840       if (PREDICT_FALSE (proto0 == NAT_PROTOCOL_ICMP))
841         {
842           if (vnet_buffer (b0)->ip.reass.icmp_type_or_tcp_flags !=
843                 ICMP4_echo_request &&
844               vnet_buffer (b0)->ip.reass.icmp_type_or_tcp_flags !=
845                 ICMP4_echo_reply &&
846               !icmp_type_is_error_message (
847                 vnet_buffer (b0)->ip.reass.icmp_type_or_tcp_flags))
848             {
849               b0->error = node->errors[NAT_OUT2IN_ED_ERROR_BAD_ICMP_TYPE];
850               next[0] = NAT_NEXT_DROP;
851               goto trace0;
852             }
853           int err = nat_get_icmp_session_lookup_values (
854             b0, ip0, &lookup_saddr, &lookup_sport, &lookup_daddr,
855             &lookup_dport, &lookup_protocol);
856           if (err != 0)
857             {
858               b0->error = node->errors[err];
859               next[0] = NAT_NEXT_DROP;
860               goto trace0;
861             }
862         }
863       else
864         {
865           lookup_saddr.as_u32 = ip0->src_address.as_u32;
866           lookup_daddr.as_u32 = ip0->dst_address.as_u32;
867           lookup_protocol = ip0->protocol;
868         }
869
870       /* there might be a stashed index in vnet_buffer2 from handoff or
871        * classify node, see if it can be used */
872       if (!pool_is_free_index (tsm->sessions,
873                                vnet_buffer2 (b0)->nat.cached_session_index))
874         {
875           s0 = pool_elt_at_index (tsm->sessions,
876                                   vnet_buffer2 (b0)->nat.cached_session_index);
877           if (PREDICT_TRUE (
878                 nat_6t_flow_match (&s0->o2i, b0, lookup_saddr, lookup_sport,
879                                    lookup_daddr, lookup_dport, lookup_protocol,
880                                    rx_fib_index0) ||
881                 (s0->flags & SNAT_SESSION_FLAG_TWICE_NAT &&
882                  nat_6t_flow_match (&s0->i2o, b0, lookup_saddr, lookup_sport,
883                                     lookup_daddr, lookup_dport,
884                                     lookup_protocol, rx_fib_index0))))
885             {
886               /* yes, this is the droid we're looking for */
887               lookup_skipped = 1;
888               goto skip_lookup;
889             }
890           s0 = NULL;
891         }
892
893       init_ed_k (&kv0, lookup_saddr, lookup_sport, lookup_daddr, lookup_dport,
894                  rx_fib_index0, lookup_protocol);
895
896       // lookup flow
897       if (clib_bihash_search_16_8 (&sm->flow_hash, &kv0, &value0))
898         {
899           // flow does not exist go slow path
900           next[0] = NAT_NEXT_OUT2IN_ED_SLOW_PATH;
901           goto trace0;
902         }
903       ASSERT (thread_index == ed_value_get_thread_index (&value0));
904       s0 =
905         pool_elt_at_index (tsm->sessions,
906                            ed_value_get_session_index (&value0));
907     skip_lookup:
908
909       if (PREDICT_FALSE (per_vrf_sessions_is_expired (s0, thread_index)))
910         {
911           // session is closed, go slow path
912           nat_free_session_data (sm, s0, thread_index, 0);
913           nat_ed_session_delete (sm, s0, thread_index, 1);
914           next[0] = NAT_NEXT_OUT2IN_ED_SLOW_PATH;
915           goto trace0;
916         }
917
918       if (s0->tcp_closed_timestamp)
919         {
920           if (now >= s0->tcp_closed_timestamp)
921             {
922               // session is closed, go slow path, freed in slow path
923               next[0] = NAT_NEXT_OUT2IN_ED_SLOW_PATH;
924             }
925           else
926             {
927               // session in transitory timeout, drop
928               b0->error = node->errors[NAT_OUT2IN_ED_ERROR_TCP_CLOSED];
929               next[0] = NAT_NEXT_DROP;
930             }
931           goto trace0;
932         }
933
934       // drop if session expired
935       u64 sess_timeout_time;
936       sess_timeout_time =
937         s0->last_heard + (f64) nat44_session_get_timeout (sm, s0);
938       if (now >= sess_timeout_time)
939         {
940           // session is closed, go slow path
941           nat_free_session_data (sm, s0, thread_index, 0);
942           nat_ed_session_delete (sm, s0, thread_index, 1);
943           next[0] = NAT_NEXT_OUT2IN_ED_SLOW_PATH;
944           goto trace0;
945         }
946
947       if (nat_6t_flow_match (&s0->o2i, b0, lookup_saddr, lookup_sport,
948                              lookup_daddr, lookup_dport, lookup_protocol,
949                              rx_fib_index0))
950         {
951           f = &s0->o2i;
952         }
953       else if (s0->flags & SNAT_SESSION_FLAG_TWICE_NAT &&
954                nat_6t_flow_match (&s0->i2o, b0, lookup_saddr, lookup_sport,
955                                   lookup_daddr, lookup_dport, lookup_protocol,
956                                   rx_fib_index0))
957         {
958           f = &s0->i2o;
959         }
960       else
961         {
962           /*
963            * Send DHCP packets to the ipv4 stack, or we won't
964            * be able to use dhcp client on the outside interface
965            */
966           if (PREDICT_FALSE (
967                 proto0 == NAT_PROTOCOL_UDP &&
968                 (vnet_buffer (b0)->ip.reass.l4_dst_port ==
969                  clib_host_to_net_u16 (UDP_DST_PORT_dhcp_to_client))))
970             {
971               goto trace0;
972             }
973
974           if (!sm->forwarding_enabled)
975             {
976               b0->error = node->errors[NAT_OUT2IN_ED_ERROR_NO_TRANSLATION];
977               next[0] = NAT_NEXT_DROP;
978               goto trace0;
979             }
980           else
981             {
982               if (nat_6t_flow_match (&s0->i2o, b0, lookup_saddr, lookup_sport,
983                                      lookup_daddr, lookup_dport,
984                                      lookup_protocol, rx_fib_index0))
985                 {
986                   f = &s0->i2o;
987                 }
988               else
989                 {
990                   // FIXME TODO bypass ???
991                   //  create_bypass_for_fwd (sm, b0, s0, ip0, rx_fib_index0,
992                   //                       thread_index);
993                   translation_error = NAT_ED_TRNSL_ERR_FLOW_MISMATCH;
994                   nat_free_session_data (sm, s0, thread_index, 0);
995                   nat_ed_session_delete (sm, s0, thread_index, 1);
996                   next[0] = NAT_NEXT_DROP;
997                   goto trace0;
998                 }
999             }
1000         }
1001
1002       if (NAT_ED_TRNSL_ERR_SUCCESS !=
1003           (translation_error = nat_6t_flow_buf_translate (
1004              sm, b0, ip0, f, proto0, 0 /* is_output_feature */)))
1005         {
1006           next[0] = NAT_NEXT_DROP;
1007           goto trace0;
1008         }
1009
1010       switch (proto0)
1011         {
1012         case NAT_PROTOCOL_TCP:
1013           vlib_increment_simple_counter (&sm->counters.fastpath.out2in.tcp,
1014                                          thread_index, sw_if_index0, 1);
1015           nat44_set_tcp_session_state_o2i (sm, now, s0,
1016                                            vnet_buffer (b0)->ip.
1017                                            reass.icmp_type_or_tcp_flags,
1018                                            vnet_buffer (b0)->ip.
1019                                            reass.tcp_ack_number,
1020                                            vnet_buffer (b0)->ip.
1021                                            reass.tcp_seq_number,
1022                                            thread_index);
1023           break;
1024         case NAT_PROTOCOL_UDP:
1025           vlib_increment_simple_counter (&sm->counters.fastpath.out2in.udp,
1026                                          thread_index, sw_if_index0, 1);
1027           break;
1028         case NAT_PROTOCOL_ICMP:
1029           vlib_increment_simple_counter (&sm->counters.fastpath.out2in.icmp,
1030                                          thread_index, sw_if_index0, 1);
1031           break;
1032         case NAT_PROTOCOL_OTHER:
1033           vlib_increment_simple_counter (&sm->counters.fastpath.out2in.other,
1034                                          thread_index, sw_if_index0, 1);
1035           break;
1036         }
1037
1038       /* Accounting */
1039       nat44_session_update_counters (s0, now,
1040                                      vlib_buffer_length_in_chain (vm, b0),
1041                                      thread_index);
1042       /* Per-user LRU list maintenance */
1043       nat44_session_update_lru (sm, s0, thread_index);
1044
1045     trace0:
1046       if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE)
1047                          && (b0->flags & VLIB_BUFFER_IS_TRACED)))
1048         {
1049           nat44_ed_out2in_trace_t *t =
1050             vlib_add_trace (vm, node, b0, sizeof (*t));
1051           t->sw_if_index = sw_if_index0;
1052           t->next_index = next[0];
1053           t->is_slow_path = 0;
1054           t->translation_error = translation_error;
1055           clib_memcpy (&t->search_key, &kv0, sizeof (t->search_key));
1056           t->lookup_skipped = lookup_skipped;
1057
1058           if (s0)
1059             {
1060               t->session_index = s0 - tsm->sessions;
1061               clib_memcpy (&t->i2of, &s0->i2o, sizeof (t->i2of));
1062               clib_memcpy (&t->o2if, &s0->o2i, sizeof (t->o2if));
1063               t->translation_via_i2of = (&s0->i2o == f);
1064             }
1065           else
1066             {
1067               t->session_index = ~0;
1068             }
1069         }
1070
1071       if (next[0] == NAT_NEXT_DROP)
1072         {
1073           vlib_increment_simple_counter (&sm->counters.fastpath.out2in.drops,
1074                                          thread_index, sw_if_index0, 1);
1075         }
1076
1077       n_left_from--;
1078       next++;
1079     }
1080
1081   vlib_buffer_enqueue_to_next (vm, node, from, (u16 *) nexts,
1082                                frame->n_vectors);
1083   return frame->n_vectors;
1084 }
1085
1086 static inline uword
1087 nat44_ed_out2in_slow_path_node_fn_inline (vlib_main_t * vm,
1088                                           vlib_node_runtime_t * node,
1089                                           vlib_frame_t * frame)
1090 {
1091   u32 n_left_from, *from;
1092   snat_main_t *sm = &snat_main;
1093   f64 now = vlib_time_now (vm);
1094   u32 thread_index = vm->thread_index;
1095   snat_main_per_thread_data_t *tsm = &sm->per_thread_data[thread_index];
1096   snat_static_mapping_t *m;
1097
1098   from = vlib_frame_vector_args (frame);
1099   n_left_from = frame->n_vectors;
1100
1101   vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
1102   u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
1103   vlib_get_buffers (vm, from, b, n_left_from);
1104
1105   while (n_left_from > 0)
1106     {
1107       vlib_buffer_t *b0;
1108       u32 sw_if_index0, rx_fib_index0;
1109       nat_protocol_t proto0;
1110       ip4_header_t *ip0;
1111       udp_header_t *udp0;
1112       icmp46_header_t *icmp0;
1113       snat_session_t *s0 = 0;
1114       clib_bihash_kv_16_8_t kv0, value0;
1115       lb_nat_type_t lb_nat0;
1116       twice_nat_type_t twice_nat0;
1117       u8 identity_nat0;
1118       ip4_address_t sm_addr;
1119       u16 sm_port;
1120       u32 sm_fib_index;
1121       nat_translation_error_e translation_error = NAT_ED_TRNSL_ERR_SUCCESS;
1122
1123       b0 = *b;
1124       next[0] = vnet_buffer2 (b0)->nat.arc_next;
1125
1126       vnet_buffer (b0)->snat.flags = 0;
1127       ip0 = vlib_buffer_get_current (b0);
1128
1129       sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX];
1130       rx_fib_index0 =
1131         fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4, sw_if_index0);
1132
1133       if (PREDICT_FALSE (ip0->ttl == 1))
1134         {
1135           vnet_buffer (b0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
1136           icmp4_error_set_vnet_buffer (b0, ICMP4_time_exceeded,
1137                                        ICMP4_time_exceeded_ttl_exceeded_in_transit,
1138                                        0);
1139           next[0] = NAT_NEXT_ICMP_ERROR;
1140           goto trace0;
1141         }
1142
1143       udp0 = ip4_next_header (ip0);
1144       icmp0 = (icmp46_header_t *) udp0;
1145       proto0 = ip_proto_to_nat_proto (ip0->protocol);
1146
1147       if (PREDICT_FALSE (proto0 == NAT_PROTOCOL_OTHER))
1148         {
1149           s0 = nat44_ed_out2in_slowpath_unknown_proto (
1150             sm, b0, ip0, rx_fib_index0, thread_index, now, vm, node);
1151           if (!sm->forwarding_enabled)
1152             {
1153               if (!s0)
1154                 next[0] = NAT_NEXT_DROP;
1155             }
1156           if (NAT_NEXT_DROP != next[0] &&
1157               NAT_ED_TRNSL_ERR_SUCCESS !=
1158                 (translation_error = nat_6t_flow_buf_translate (
1159                    sm, b0, ip0, &s0->o2i, proto0, 0 /* is_output_feature */)))
1160             {
1161               goto trace0;
1162             }
1163
1164           vlib_increment_simple_counter (&sm->counters.slowpath.out2in.other,
1165                                          thread_index, sw_if_index0, 1);
1166           goto trace0;
1167         }
1168
1169       if (PREDICT_FALSE (proto0 == NAT_PROTOCOL_ICMP))
1170         {
1171           next[0] = icmp_out2in_ed_slow_path
1172             (sm, b0, ip0, icmp0, sw_if_index0, rx_fib_index0, node,
1173              next[0], now, thread_index, &s0);
1174
1175           if (NAT_NEXT_DROP != next[0] && s0 &&
1176               NAT_ED_TRNSL_ERR_SUCCESS !=
1177                 (translation_error = nat_6t_flow_buf_translate (
1178                    sm, b0, ip0, &s0->o2i, proto0, 0 /* is_output_feature */)))
1179             {
1180               goto trace0;
1181             }
1182
1183           vlib_increment_simple_counter (&sm->counters.slowpath.out2in.icmp,
1184                                          thread_index, sw_if_index0, 1);
1185           goto trace0;
1186         }
1187
1188       init_ed_k (&kv0, ip0->src_address,
1189                  vnet_buffer (b0)->ip.reass.l4_src_port, ip0->dst_address,
1190                  vnet_buffer (b0)->ip.reass.l4_dst_port, rx_fib_index0,
1191                  ip0->protocol);
1192
1193       s0 = NULL;
1194       if (!clib_bihash_search_16_8 (&sm->flow_hash, &kv0, &value0))
1195         {
1196           ASSERT (thread_index == ed_value_get_thread_index (&value0));
1197           s0 =
1198             pool_elt_at_index (tsm->sessions,
1199                                ed_value_get_session_index (&value0));
1200
1201           if (s0->tcp_closed_timestamp && now >= s0->tcp_closed_timestamp)
1202             {
1203               nat_free_session_data (sm, s0, thread_index, 0);
1204               nat_ed_session_delete (sm, s0, thread_index, 1);
1205               s0 = NULL;
1206             }
1207         }
1208
1209       if (!s0)
1210         {
1211           /* Try to match static mapping by external address and port,
1212              destination address and port in packet */
1213
1214           if (snat_static_mapping_match
1215               (sm, ip0->dst_address,
1216                vnet_buffer (b0)->ip.reass.l4_dst_port, rx_fib_index0,
1217                proto0, &sm_addr, &sm_port, &sm_fib_index, 1, 0,
1218                &twice_nat0, &lb_nat0, &ip0->src_address, &identity_nat0, &m))
1219             {
1220               /*
1221                * Send DHCP packets to the ipv4 stack, or we won't
1222                * be able to use dhcp client on the outside interface
1223                */
1224               if (PREDICT_FALSE (proto0 == NAT_PROTOCOL_UDP
1225                                  && (vnet_buffer (b0)->ip.reass.l4_dst_port ==
1226                                      clib_host_to_net_u16
1227                                      (UDP_DST_PORT_dhcp_to_client))))
1228                 {
1229                   goto trace0;
1230                 }
1231
1232               if (!sm->forwarding_enabled)
1233                 {
1234                   b0->error =
1235                     node->errors[NAT_OUT2IN_ED_ERROR_NO_TRANSLATION];
1236                   next[0] = NAT_NEXT_DROP;
1237                 }
1238               else
1239                 {
1240                   if (next_src_nat
1241                       (sm, ip0, vnet_buffer (b0)->ip.reass.l4_src_port,
1242                        vnet_buffer (b0)->ip.reass.l4_dst_port,
1243                        thread_index, rx_fib_index0))
1244                     {
1245                       next[0] = NAT_NEXT_IN2OUT_ED_FAST_PATH;
1246                     }
1247                   else
1248                     {
1249                       create_bypass_for_fwd (sm, b0, s0, ip0, rx_fib_index0,
1250                                              thread_index);
1251                     }
1252                 }
1253               goto trace0;
1254             }
1255
1256           if (PREDICT_FALSE (identity_nat0))
1257             goto trace0;
1258
1259           if ((proto0 == NAT_PROTOCOL_TCP)
1260               && !tcp_flags_is_init (vnet_buffer (b0)->ip.
1261                                      reass.icmp_type_or_tcp_flags))
1262             {
1263               b0->error = node->errors[NAT_OUT2IN_ED_ERROR_NON_SYN];
1264               next[0] = NAT_NEXT_DROP;
1265               goto trace0;
1266             }
1267
1268           /* Create session initiated by host from external network */
1269           s0 = create_session_for_static_mapping_ed (sm, b0,
1270                                                      sm_addr, sm_port,
1271                                                      sm_fib_index,
1272                                                      ip0->dst_address,
1273                                                      vnet_buffer (b0)->
1274                                                      ip.reass.l4_dst_port,
1275                                                      rx_fib_index0, proto0,
1276                                                      node, rx_fib_index0,
1277                                                      thread_index, twice_nat0,
1278                                                      lb_nat0, now, m);
1279           if (!s0)
1280             {
1281               next[0] = NAT_NEXT_DROP;
1282               goto trace0;
1283             }
1284         }
1285
1286       if (NAT_ED_TRNSL_ERR_SUCCESS !=
1287           (translation_error = nat_6t_flow_buf_translate (
1288              sm, b0, ip0, &s0->o2i, proto0, 0 /* is_output_feature */)))
1289         {
1290           next[0] = NAT_NEXT_DROP;
1291           goto trace0;
1292         }
1293
1294       if (PREDICT_TRUE (proto0 == NAT_PROTOCOL_TCP))
1295         {
1296           vlib_increment_simple_counter (&sm->counters.slowpath.out2in.tcp,
1297                                          thread_index, sw_if_index0, 1);
1298           nat44_set_tcp_session_state_o2i (sm, now, s0,
1299                                            vnet_buffer (b0)->ip.
1300                                            reass.icmp_type_or_tcp_flags,
1301                                            vnet_buffer (b0)->ip.
1302                                            reass.tcp_ack_number,
1303                                            vnet_buffer (b0)->ip.
1304                                            reass.tcp_seq_number,
1305                                            thread_index);
1306         }
1307       else
1308         {
1309           vlib_increment_simple_counter (&sm->counters.slowpath.out2in.udp,
1310                                          thread_index, sw_if_index0, 1);
1311         }
1312
1313       /* Accounting */
1314       nat44_session_update_counters (s0, now,
1315                                      vlib_buffer_length_in_chain (vm, b0),
1316                                      thread_index);
1317       /* Per-user LRU list maintenance */
1318       nat44_session_update_lru (sm, s0, thread_index);
1319
1320     trace0:
1321       if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE)
1322                          && (b0->flags & VLIB_BUFFER_IS_TRACED)))
1323         {
1324           nat44_ed_out2in_trace_t *t =
1325             vlib_add_trace (vm, node, b0, sizeof (*t));
1326           t->sw_if_index = sw_if_index0;
1327           t->next_index = next[0];
1328           t->is_slow_path = 1;
1329           t->translation_error = translation_error;
1330           clib_memcpy (&t->search_key, &kv0, sizeof (t->search_key));
1331
1332           if (s0)
1333             {
1334               t->session_index = s0 - tsm->sessions;
1335               clib_memcpy (&t->i2of, &s0->i2o, sizeof (t->i2of));
1336               clib_memcpy (&t->o2if, &s0->o2i, sizeof (t->o2if));
1337             }
1338           else
1339             {
1340               t->session_index = ~0;
1341             }
1342         }
1343
1344       if (next[0] == NAT_NEXT_DROP)
1345         {
1346           vlib_increment_simple_counter (&sm->counters.slowpath.out2in.drops,
1347                                          thread_index, sw_if_index0, 1);
1348         }
1349
1350       n_left_from--;
1351       next++;
1352       b++;
1353     }
1354
1355   vlib_buffer_enqueue_to_next (vm, node, from, (u16 *) nexts,
1356                                frame->n_vectors);
1357
1358   return frame->n_vectors;
1359 }
1360
1361 VLIB_NODE_FN (nat44_ed_out2in_node) (vlib_main_t * vm,
1362                                      vlib_node_runtime_t * node,
1363                                      vlib_frame_t * frame)
1364 {
1365   if (snat_main.num_workers > 1)
1366     {
1367       return nat44_ed_out2in_fast_path_node_fn_inline (vm, node, frame, 1);
1368     }
1369   else
1370     {
1371       return nat44_ed_out2in_fast_path_node_fn_inline (vm, node, frame, 0);
1372     }
1373 }
1374
1375 /* *INDENT-OFF* */
1376 VLIB_REGISTER_NODE (nat44_ed_out2in_node) = {
1377   .name = "nat44-ed-out2in",
1378   .vector_size = sizeof (u32),
1379   .sibling_of = "nat-default",
1380   .format_trace = format_nat44_ed_out2in_trace,
1381   .type = VLIB_NODE_TYPE_INTERNAL,
1382   .n_errors = ARRAY_LEN(nat_out2in_ed_error_strings),
1383   .error_strings = nat_out2in_ed_error_strings,
1384   .runtime_data_bytes = sizeof (snat_runtime_t),
1385 };
1386 /* *INDENT-ON* */
1387
1388 VLIB_NODE_FN (nat44_ed_out2in_slowpath_node) (vlib_main_t * vm,
1389                                               vlib_node_runtime_t * node,
1390                                               vlib_frame_t * frame)
1391 {
1392   return nat44_ed_out2in_slow_path_node_fn_inline (vm, node, frame);
1393 }
1394
1395 /* *INDENT-OFF* */
1396 VLIB_REGISTER_NODE (nat44_ed_out2in_slowpath_node) = {
1397   .name = "nat44-ed-out2in-slowpath",
1398   .vector_size = sizeof (u32),
1399   .sibling_of = "nat-default",
1400   .format_trace = format_nat44_ed_out2in_trace,
1401   .type = VLIB_NODE_TYPE_INTERNAL,
1402   .n_errors = ARRAY_LEN(nat_out2in_ed_error_strings),
1403   .error_strings = nat_out2in_ed_error_strings,
1404   .runtime_data_bytes = sizeof (snat_runtime_t),
1405 };
1406 /* *INDENT-ON* */
1407
1408 static u8 *
1409 format_nat_pre_trace (u8 * s, va_list * args)
1410 {
1411   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
1412   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
1413   nat_pre_trace_t *t = va_arg (*args, nat_pre_trace_t *);
1414   return format (s, "out2in next_index %d arc_next_index %d", t->next_index,
1415                  t->arc_next_index);
1416 }
1417
1418 VLIB_NODE_FN (nat_pre_out2in_node) (vlib_main_t * vm,
1419                                     vlib_node_runtime_t * node,
1420                                     vlib_frame_t * frame)
1421 {
1422   return nat_pre_node_fn_inline (vm, node, frame,
1423                                  NAT_NEXT_OUT2IN_ED_FAST_PATH);
1424 }
1425
1426 /* *INDENT-OFF* */
1427 VLIB_REGISTER_NODE (nat_pre_out2in_node) = {
1428   .name = "nat-pre-out2in",
1429   .vector_size = sizeof (u32),
1430   .sibling_of = "nat-default",
1431   .format_trace = format_nat_pre_trace,
1432   .type = VLIB_NODE_TYPE_INTERNAL,
1433   .n_errors = 0,
1434  };
1435 /* *INDENT-ON* */
1436
1437 /*
1438  * fd.io coding-style-patch-verification: ON
1439  *
1440  * Local Variables:
1441  * eval: (c-set-style "gnu")
1442  * End:
1443  */