2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
18 * @brief Local TCP/IP stack punt infrastructure.
20 * Provides a set of VPP nodes together with the relevant APIs and CLI
21 * commands in order to adjust and dispatch packets from the VPP data plane
22 * to the local TCP/IP stack
25 #include <vnet/ip/ip.h>
26 #include <vnet/ethernet/ethernet.h>
27 #include <vlib/vlib.h>
28 #include <vnet/ip/punt.h>
29 #include <vlib/unix/unix.h>
33 #include <sys/socket.h>
/* Error enumerators for the punt nodes: while the .def file is included,
   each punt_error (n, s) entry expands to the enumerator PUNT_ERROR_<n>.
   The same .def file is included again further down to build the matching
   string table. */
39 #define punt_error(n,s) PUNT_ERROR_##n,
40 #include <vnet/ip/punt_error.def>
/* X-macro table of the next nodes used by the UDP punt nodes.  Each entry
   is _ (symbol, "graph node name").  The _ definition that follows turns an
   entry into the enumerator PUNT_NEXT_<symbol>. */
45 #define foreach_punt_next \
46 _ (PUNT4, "ip4-punt") \
51 #define _(s,n) PUNT_NEXT_##s,
/* Next-node indices of the "punt-socket-rx" input node.  Its registration
   maps them to "interface-output", "ip4-lookup" and "ip6-lookup". */
57 enum punt_socket_rx_next_e
59 PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT,
60 PUNT_SOCKET_RX_NEXT_IP4_LOOKUP,
61 PUNT_SOCKET_RX_NEXT_IP6_LOOKUP,
/* Select the punt next index for an address family: PUNT_NEXT_PUNT4 when
   is_ip4 is non-zero, PUNT_NEXT_PUNT6 otherwise.  The argument is
   parenthesized so that an arbitrary expression (for example an assignment)
   is evaluated as a whole before the selection is made. */
#define punt_next_punt(is_ip4) ((is_ip4) ? PUNT_NEXT_PUNT4 : PUNT_NEXT_PUNT6)
67 /** @brief IPv4/IPv6 UDP punt node main loop.
69 This is the main loop inline function for IPv4/IPv6 UDP punt
72 @param vm vlib_main_t corresponding to the current thread
73 @param node vlib_node_runtime_t
74 @param frame vlib_frame_t whose contents should be dispatched
   (this parameter is spelled from_frame in the signature)
75 @param is_ipv4 indicates if called for IPv4 or IPv6 node
   (this parameter is spelled is_ip4 in the signature)
   @return the number of vectors in from_frame
78 udp46_punt_inline (vlib_main_t * vm,
79 vlib_node_runtime_t * node,
80 vlib_frame_t * from_frame, int is_ip4)
82 u32 n_left_from, *from, *to_next;
85 from = vlib_frame_vector_args (from_frame);
86 n_left_from = from_frame->n_vectors;
88 /* udp[46]_lookup hands us the data payload, not the IP header */
/* Negative advance covering the IPv4 header plus the UDP header. */
90 advance = -(sizeof (ip4_header_t) + sizeof (udp_header_t));
/* Negative advance covering the IPv6 header plus the UDP header. */
92 advance = -(sizeof (ip6_header_t) + sizeof (udp_header_t));
94 while (n_left_from > 0)
/* Open a frame towards the punt next node of this address family. */
98 vlib_get_next_frame (vm, node, punt_next_punt (is_ip4), to_next,
101 while (n_left_from > 0 && n_left_to_next > 0)
113 b0 = vlib_get_buffer (vm, bi0);
/* Move current data back so that it points at the IP header again. */
114 vlib_buffer_advance (b0, advance);
/* Mark the buffer with this node's PUNT_ERROR_UDP_PORT error. */
115 b0->error = node->errors[PUNT_ERROR_UDP_PORT];
118 vlib_put_next_frame (vm, node, punt_next_punt (is_ip4), n_left_to_next);
/* Report the size of the input frame. */
121 return from_frame->n_vectors;
/* Error strings for the punt nodes: while the .def file is included, each
   punt_error (n, s) entry expands to its string s.  The node registrations
   in this file use this table as .error_strings.
   NOTE(review): the enumerators are generated from <vnet/ip/punt_error.def>
   while this table includes "punt_error.def" - confirm both resolve to the
   same file. */
124 static char *punt_error_strings[] = {
125 #define punt_error(n,s) s,
126 #include "punt_error.def"
130 /** @brief IPv4 UDP punt node.
133 This is the IPv4 UDP punt transition node. It is registered as a next
134 node for the "ip4-udp-lookup" handling UDP port(s) requested for punt.
135 The buffer's current data pointer is adjusted to the original packet
136 IPv4 header. All buffers are dispatched to "error-punt".
    NOTE(review): the next-node table in this file lists "ip4-punt" for
    PUNT_NEXT_PUNT4, which is the next index the shared inline function
    selects for IPv4; "error-punt" here looks stale - confirm.
138 @param vm vlib_main_t corresponding to the current thread
139 @param node vlib_node_runtime_t
140 @param frame vlib_frame_t whose contents should be dispatched
    (this parameter is spelled from_frame in the signature)
    @return the value returned by udp46_punt_inline() called with is_ip4 = 1
142 @par Graph mechanics: next index usage
145 - <code>vnet_buffer(b)->current_data</code>
146 - <code>vnet_buffer(b)->current_len</code>
    NOTE(review): other code in this file reads these fields directly from
    the buffer, as b->current_data and b->current_length - confirm the
    spelling of the two entries above.
149 - Dispatches the packet to the "error-punt" node
151 VLIB_NODE_FN (udp4_punt_node) (vlib_main_t * vm,
152 vlib_node_runtime_t * node,
153 vlib_frame_t * from_frame)
155 return udp46_punt_inline (vm, node, from_frame, 1 /* is_ip4 */ );
158 /** @brief IPv6 UDP punt node.
161 This is the IPv6 UDP punt transition node. It is registered as a next
162 node for the "ip6-udp-lookup" handling UDP port(s) requested for punt.
163 The buffer's current data pointer is adjusted to the original packet
164 IPv6 header. All buffers are dispatched to "error-punt".
    NOTE(review): the shared inline function selects next index
    PUNT_NEXT_PUNT6 for IPv6; its node name is not visible in this part of
    the file, but the IPv4 entry is "ip4-punt", so "error-punt" here may be
    stale - confirm.
166 @param vm vlib_main_t corresponding to the current thread
167 @param node vlib_node_runtime_t
168 @param frame vlib_frame_t whose contents should be dispatched
    (this parameter is spelled from_frame in the signature)
    @return the value returned by udp46_punt_inline() called with is_ip4 = 0
170 @par Graph mechanics: next index usage
173 - <code>vnet_buffer(b)->current_data</code>
174 - <code>vnet_buffer(b)->current_len</code>
    NOTE(review): other code in this file reads these fields directly from
    the buffer, as b->current_data and b->current_length - confirm the
    spelling of the two entries above.
177 - Dispatches the packet to the "error-punt" node
179 VLIB_NODE_FN (udp6_punt_node) (vlib_main_t * vm,
180 vlib_node_runtime_t * node,
181 vlib_frame_t * from_frame)
183 return udp46_punt_inline (vm, node, from_frame, 0 /* is_ip4 */ );
/* Graph node registration for "ip4-udp-punt": punt error counters and
   PUNT_N_NEXT next nodes. */
186 VLIB_REGISTER_NODE (udp4_punt_node) = {
187 .name = "ip4-udp-punt",
188 /* Takes a vector of packets. */
189 .vector_size = sizeof (u32),
191 .n_errors = PUNT_N_ERROR,
192 .error_strings = punt_error_strings,
194 .n_next_nodes = PUNT_N_NEXT,
/* Turns a table entry _ (s, n) into the designated initializer
   [PUNT_NEXT_<s>] = n for the next-node name array. */
196 #define _(s,n) [PUNT_NEXT_##s] = n,
/* Graph node registration for "ip6-udp-punt": punt error counters and
   PUNT_N_NEXT next nodes. */
202 VLIB_REGISTER_NODE (udp6_punt_node) = {
203 .name = "ip6-udp-punt",
204 /* Takes a vector of packets. */
205 .vector_size = sizeof (u32),
207 .n_errors = PUNT_N_ERROR,
208 .error_strings = punt_error_strings,
210 .n_next_nodes = PUNT_N_NEXT,
/* Turns a table entry _ (s, n) into the designated initializer
   [PUNT_NEXT_<s>] = n for the next-node name array. */
212 #define _(s,n) [PUNT_NEXT_##s] = n,
/* Trace record field: copy of the punt client the packet was sent to.  It
   is filled in by the punt socket nodes and its caddr.sun_path is printed by
   format_udp_punt_trace. */
220 punt_client_t client;
/* Trace formatter for the punt socket nodes.
   Consumes, in order, a vlib_main_t pointer and a vlib_node_t pointer (both
   unused) and the udp_punt_trace_t record, and appends to s:
   - "to: " followed by the client's unix socket path,
   - a "(buffer is part of chain)" line (the condition guarding it is not
     visible in this part of the file),
   - a hex dump of sizeof (t->packet_data) captured bytes. */
226 format_udp_punt_trace (u8 * s, va_list * args)
228 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
229 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
230 udp_punt_trace_t *t = va_arg (*args, udp_punt_trace_t *);
/* Indentation of the text already in s, reused for the continuation lines. */
231 u32 indent = format_get_indent (s);
232 s = format (s, "to: %s", t->client.caddr.sun_path);
235 s = format (s, "\n%U(buffer is part of chain)", format_white_space,
238 s = format (s, "\n%U%U", format_white_space, indent,
239 format_hex_bytes, t->packet_data, sizeof (t->packet_data));
/* Common worker of the punt socket nodes.
   For every buffer of the frame it looks up the registered punt client and
   sends the packet to it with sendmsg () on pm->socket_fd, preceded by a
   punt_packetdesc_t descriptor.  All buffers of the frame are freed at the
   end.
   pt       selects the client lookup: L4 port, IP protocol or exception
            reason.
   af       selects IPv4 or IPv6 header handling.
   protocol selects UDP or ICMP6 handling when pt is PUNT_TYPE_L4. */
245 punt_socket_inline2 (vlib_main_t *vm, vlib_node_runtime_t *node,
246 vlib_frame_t *frame, punt_type_t pt,
247 ip_address_family_t af, ip_protocol_t protocol)
249 u32 *buffers = vlib_frame_vector_args (frame);
250 u32 thread_index = vm->thread_index;
251 uword n_packets = frame->n_vectors;
252 punt_main_t *pm = &punt_main;
/* Per-thread scratch data; its iovecs vector is reused for every packet. */
255 punt_thread_data_t *ptd = &pm->thread_data[thread_index];
/* Node whose counters are incremented below, chosen from af only.
   NOTE(review): this worker is also called by the ip-proto, icmp6 and
   exception nodes, so their counts appear to be charged to the UDP punt
   socket nodes - confirm this is intended. */
256 u32 node_index = (AF_IP4 == af ?
257 udp4_punt_socket_node.index :
258 udp6_punt_socket_node.index);
260 for (i = 0; i < n_packets; i++)
265 punt_packetdesc_t packetdesc;
268 b = vlib_get_buffer (vm, buffers[i]);
270 if (PUNT_TYPE_L4 == pt)
272 if (protocol == IP_PROTOCOL_UDP)
274 /* Reverse UDP Punt advance */
/* IPv4: step back over the UDP and IPv4 headers; the UDP header is taken to
   start right after the IPv4 header structure. */
278 vlib_buffer_advance (
279 b, -(sizeof (ip4_header_t) + sizeof (udp_header_t)));
280 ip4_header_t *ip = vlib_buffer_get_current (b);
281 udp = (udp_header_t *) (ip + 1);
/* IPv6: same, with the IPv6 header size. */
285 vlib_buffer_advance (
286 b, -(sizeof (ip6_header_t) + sizeof (udp_header_t)));
287 ip6_header_t *ip = vlib_buffer_get_current (b);
288 udp = (udp_header_t *) (ip + 1);
/* The lookup key is the UDP destination port in host byte order. */
290 port = clib_net_to_host_u16 (udp->dst_port);
292 else if (protocol == IP_PROTOCOL_ICMP6)
/* ICMP6: the current data is read as the IPv6 header, no advance is made. */
294 ip6_header_t *ip = vlib_buffer_get_current (b);
295 icmp46_header_t *icmp = ip6_next_header (ip);
299 * Find registerered client
300 * If no registered client, drop packet and count
302 c = punt_client_l4_get (af, port);
304 else if (PUNT_TYPE_IP_PROTO == pt)
306 /* The lookup key is the protocol field of the IP header */
311 ip4_header_t *ip = vlib_buffer_get_current (b);
312 proto = ip->protocol;
316 ip6_header_t *ip = vlib_buffer_get_current (b);
317 proto = ip->protocol;
320 c = punt_client_ip_proto_get (af, proto);
322 else if (PUNT_TYPE_EXCEPTION == pt)
/* Exceptions are looked up by the punt reason stored in the buffer. */
324 c = punt_client_exception_get (b->punt_reason);
/* No client registered for this packet: count a socket TX error. */
329 if (PREDICT_FALSE (NULL == c))
331 vlib_node_increment_counter (vm, node_index,
332 PUNT_ERROR_SOCKET_TX_ERROR, 1);
336 struct sockaddr_un *caddr = &c->caddr;
/* Start an empty iovec list for this packet. */
339 vec_reset_length (ptd->iovecs);
341 /* Add packet descriptor */
342 packetdesc.sw_if_index = vnet_buffer (b)->sw_if_index[VLIB_RX];
343 packetdesc.action = 0;
344 vec_add2 (ptd->iovecs, iov, 1);
/* packetdesc is a local of this loop iteration; the iovec only refers to it
   until the sendmsg () call below. */
345 iov->iov_base = &packetdesc;
346 iov->iov_len = sizeof (packetdesc);
348 /** VLIB buffer chain -> Unix iovec(s). */
/* Move current data back by the ethernet header size so that the ethernet
   header is part of what is sent. */
349 vlib_buffer_advance (b, -ethernet_buffer_header_size (b));
350 vec_add2 (ptd->iovecs, iov, 1);
351 iov->iov_base = b->data + b->current_data;
/* l accumulates the packet length over the whole buffer chain. */
352 iov->iov_len = l = b->current_length;
/* Traced buffer: record the client and the leading packet bytes. */
354 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_IS_TRACED))
357 t = vlib_add_trace (vm, node, b, sizeof (t[0]));
358 clib_memcpy_fast (&t->client, c, sizeof (t->client));
359 clib_memcpy_fast (t->packet_data,
360 vlib_buffer_get_current (b),
361 sizeof (t->packet_data));
/* Chained buffer: add one iovec for each following segment. */
364 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_NEXT_PRESENT))
368 b = vlib_get_buffer (vm, b->next_buffer);
369 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_IS_TRACED))
372 t = vlib_add_trace (vm, node, b, sizeof (t[0]));
373 clib_memcpy_fast (&t->client, c, sizeof (t->client));
377 vec_add2 (ptd->iovecs, iov, 1);
379 iov->iov_base = b->data + b->current_data;
380 iov->iov_len = b->current_length;
381 l += b->current_length;
383 while (b->flags & VLIB_BUFFER_NEXT_PRESENT);
/* Message made of the iovec list built above; msg_namelen is the size of
   the client's sockaddr_un. */
386 struct msghdr msg = {
388 .msg_namelen = sizeof (*caddr),
389 .msg_iov = ptd->iovecs,
390 .msg_iovlen = vec_len (ptd->iovecs),
/* A result below the packet length (including -1) counts as a TX error.
   NOTE(review): l does not include sizeof (packetdesc), which is also part
   of the message - confirm the intended threshold. */
393 if (sendmsg (pm->socket_fd, &msg, 0) < (ssize_t) l)
394 vlib_node_increment_counter (vm, node_index,
395 PUNT_ERROR_SOCKET_TX_ERROR, 1);
397 vlib_node_increment_counter (vm, node_index, PUNT_ERROR_SOCKET_TX, 1);
/* The packets end here: free every buffer of the frame. */
401 vlib_buffer_free (vm, buffers, n_packets);
/* Convenience wrapper around punt_socket_inline2 () that always passes
   IP_PROTOCOL_UDP as the protocol. */
407 punt_socket_inline (vlib_main_t *vm, vlib_node_runtime_t *node,
408 vlib_frame_t *frame, punt_type_t pt,
409 ip_address_family_t af)
411 return punt_socket_inline2 (vm, node, frame, pt, af, IP_PROTOCOL_UDP);
/* Node function of "ip4-udp-punt-socket": L4 punt over IPv4. */
415 udp4_punt_socket (vlib_main_t * vm,
416 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
418 return punt_socket_inline (vm, node, from_frame, PUNT_TYPE_L4, AF_IP4);
/* Node function of "ip6-udp-punt-socket": L4 punt over IPv6. */
422 udp6_punt_socket (vlib_main_t * vm,
423 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
425 return punt_socket_inline (vm, node, from_frame, PUNT_TYPE_L4, AF_IP6);
/* Node function of "ip4-proto-punt-socket": punt by IP protocol, IPv4. */
429 ip4_proto_punt_socket (vlib_main_t * vm,
430 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
432 return punt_socket_inline (vm, node, from_frame,
433 PUNT_TYPE_IP_PROTO, AF_IP4);
/* Node function of "ip6-proto-punt-socket": punt by IP protocol, IPv6. */
437 ip6_proto_punt_socket (vlib_main_t * vm,
438 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
440 return punt_socket_inline (vm, node, from_frame,
441 PUNT_TYPE_IP_PROTO, AF_IP6);
/* Node function of "ip6-icmp-punt-socket": calls punt_socket_inline2 ()
   directly with PUNT_TYPE_L4 and AF_IP6.  The protocol argument is on a line
   not visible in this part of the file - presumably IP_PROTOCOL_ICMP6,
   TODO confirm. */
445 icmp6_punt_socket (vlib_main_t *vm, vlib_node_runtime_t *node,
446 vlib_frame_t *from_frame)
448 return punt_socket_inline2 (vm, node, from_frame, PUNT_TYPE_L4, AF_IP6,
/* Node function of "exception-punt-socket": punt by exception reason.
   AF_IP4 is passed as the address family; in the exception path of
   punt_socket_inline2 () the client is looked up from b->punt_reason alone,
   and af only selects which node's counters are incremented. */
453 exception_punt_socket (vlib_main_t * vm,
454 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
456 return punt_socket_inline (vm, node, from_frame,
457 PUNT_TYPE_EXCEPTION, AF_IP4);
/* Registers the "ip4-udp-punt-socket" graph node: function
   udp4_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
461 VLIB_REGISTER_NODE (udp4_punt_socket_node) = {
462 .function = udp4_punt_socket,
463 .name = "ip4-udp-punt-socket",
464 .format_trace = format_udp_punt_trace,
465 .flags = VLIB_NODE_FLAG_IS_DROP,
466 /* Takes a vector of packets. */
467 .vector_size = sizeof (u32),
468 .n_errors = PUNT_N_ERROR,
469 .error_strings = punt_error_strings,
/* Registers the "ip6-udp-punt-socket" graph node: function
   udp6_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
471 VLIB_REGISTER_NODE (udp6_punt_socket_node) = {
472 .function = udp6_punt_socket,
473 .name = "ip6-udp-punt-socket",
474 .format_trace = format_udp_punt_trace,
475 .flags = VLIB_NODE_FLAG_IS_DROP,
476 .vector_size = sizeof (u32),
477 .n_errors = PUNT_N_ERROR,
478 .error_strings = punt_error_strings,
/* Registers the "ip4-proto-punt-socket" graph node: function
   ip4_proto_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
480 VLIB_REGISTER_NODE (ip4_proto_punt_socket_node) = {
481 .function = ip4_proto_punt_socket,
482 .name = "ip4-proto-punt-socket",
483 .format_trace = format_udp_punt_trace,
484 .flags = VLIB_NODE_FLAG_IS_DROP,
485 /* Takes a vector of packets. */
486 .vector_size = sizeof (u32),
487 .n_errors = PUNT_N_ERROR,
488 .error_strings = punt_error_strings,
/* Registers the "ip6-proto-punt-socket" graph node: function
   ip6_proto_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
490 VLIB_REGISTER_NODE (ip6_proto_punt_socket_node) = {
491 .function = ip6_proto_punt_socket,
492 .name = "ip6-proto-punt-socket",
493 .format_trace = format_udp_punt_trace,
494 .flags = VLIB_NODE_FLAG_IS_DROP,
495 .vector_size = sizeof (u32),
496 .n_errors = PUNT_N_ERROR,
497 .error_strings = punt_error_strings,
/* Registers the "exception-punt-socket" graph node: function
   exception_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
499 VLIB_REGISTER_NODE (exception_punt_socket_node) = {
500 .function = exception_punt_socket,
501 .name = "exception-punt-socket",
502 .format_trace = format_udp_punt_trace,
503 .flags = VLIB_NODE_FLAG_IS_DROP,
504 .vector_size = sizeof (u32),
505 .n_errors = PUNT_N_ERROR,
506 .error_strings = punt_error_strings,
/* Registers the "ip6-icmp-punt-socket" graph node: function
   icmp6_punt_socket, traces printed by format_udp_punt_trace, flagged
   VLIB_NODE_FLAG_IS_DROP, punt error counters. */
508 VLIB_REGISTER_NODE (icmp6_punt_socket_node) = {
509 .function = icmp6_punt_socket,
510 .name = "ip6-icmp-punt-socket",
511 .format_trace = format_udp_punt_trace,
512 .flags = VLIB_NODE_FLAG_IS_DROP,
513 .vector_size = sizeof (u32),
514 .n_errors = PUNT_N_ERROR,
515 .error_strings = punt_error_strings,
/* Trace record field: action taken from the received packet descriptor.
   It is set by punt_socket_rx_fd and printed by format_punt_trace. */
521 enum punt_action_e action;
/* Trace formatter of the "punt-socket-rx" node.
   Consumes, in order, a vlib_main_t pointer and a vlib_node_t pointer (both
   unused) and the punt_trace_t record, and appends the interface name for
   t->sw_if_index followed by " Action: " and the numeric action. */
526 format_punt_trace (u8 * s, va_list * va)
528 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*va, vlib_main_t *);
529 CLIB_UNUSED (vlib_node_t * node) = va_arg (*va, vlib_node_t *);
530 vnet_main_t *vnm = vnet_get_main ();
531 punt_trace_t *t = va_arg (*va, punt_trace_t *);
532 s = format (s, "%U Action: %d", format_vnet_sw_if_index_name,
533 vnm, t->sw_if_index, t->action);
/* Read one packet from fd into a newly allocated buffer and enqueue it to
   the next node selected by the action of the packet descriptor that
   precedes the packet data.
   Failures (no buffer available, short read, unknown action) are recorded
   in error and counted against the "punt-socket-rx" node. */
538 punt_socket_rx_fd (vlib_main_t * vm, vlib_node_runtime_t * node, u32 fd)
/* Default buffer data size, used below as the capacity of the read. */
540 const uword buffer_size = vlib_buffer_get_default_data_size (vm);
541 u32 n_trace = vlib_get_trace_count (vm, node);
542 u32 next = node->cached_next_index;
543 u32 n_left_to_next, next_index;
545 u32 error = PUNT_ERROR_NONE;
546 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
548 /* $$$$ Only dealing with one buffer at the time for now */
552 punt_packetdesc_t packetdesc;
/* Allocate the single buffer that will hold the packet. */
556 if (vlib_buffer_alloc (vm, &bi, 1) != 1)
558 error = PUNT_ERROR_NOBUFFER;
562 b = vlib_get_buffer (vm, bi);
/* Scatter read: the descriptor goes into packetdesc, the packet bytes go
   into the buffer data area. */
563 io[0].iov_base = &packetdesc;
564 io[0].iov_len = sizeof (packetdesc);
565 io[1].iov_base = b->data;
566 io[1].iov_len = buffer_size;
568 size = readv (fd, io, 2);
569 /* We need at least the packet descriptor plus a header */
570 if (size <= (int) (sizeof (packetdesc) + sizeof (ip4_header_t)))
572 vlib_buffer_free (vm, &bi, 1);
573 error = PUNT_ERROR_READV;
577 b->flags = VNET_BUFFER_F_LOCALLY_ORIGINATED;
/* The packet length is what was read minus the descriptor. */
578 b->current_length = size - sizeof (packetdesc);
/* Choose the next node from the action requested in the descriptor. */
580 switch (packetdesc.action)
/* Here the descriptor's sw_if_index is used as the TX interface. */
583 vnet_buffer (b)->sw_if_index[VLIB_TX] = packetdesc.sw_if_index;
584 next_index = PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT;
/* Routed IPv4: the descriptor's sw_if_index is the RX interface and the TX
   interface is left unset (~0). */
587 case PUNT_IP4_ROUTED:
588 vnet_buffer (b)->sw_if_index[VLIB_RX] = packetdesc.sw_if_index;
589 vnet_buffer (b)->sw_if_index[VLIB_TX] = ~0;
590 next_index = PUNT_SOCKET_RX_NEXT_IP4_LOOKUP;
/* Routed IPv6: same as above, towards the IPv6 lookup. */
593 case PUNT_IP6_ROUTED:
594 vnet_buffer (b)->sw_if_index[VLIB_RX] = packetdesc.sw_if_index;
595 vnet_buffer (b)->sw_if_index[VLIB_TX] = ~0;
596 next_index = PUNT_SOCKET_RX_NEXT_IP6_LOOKUP;
/* Any other action: record the error and give the buffer back. */
600 error = PUNT_ERROR_ACTION;
601 vlib_buffer_free (vm, &bi, 1);
607 && vlib_trace_buffer (vm, node, next_index, b, 1 /* follow_chain */ )))
/* Use up one trace slot and record the descriptor fields. */
610 vlib_set_trace_count (vm, node, --n_trace);
611 t = vlib_add_trace (vm, node, b, sizeof (*t));
612 t->sw_if_index = packetdesc.sw_if_index;
613 t->action = packetdesc.action;
/* Hand the buffer to the chosen next node and close the frame. */
620 vlib_validate_buffer_enqueue_x1 (vm, node, next, to_next, n_left_to_next,
622 vlib_put_next_frame (vm, node, next, n_left_to_next);
627 vlib_put_next_frame (vm, node, next, n_left_to_next);
/* Count the recorded error against the "punt-socket-rx" node. */
628 vlib_node_increment_counter (vm, punt_socket_rx_node.index, error, 1);
633 punt_socket_rx (vlib_main_t * vm,
634 vlib_node_runtime_t * node, vlib_frame_t * frame)
636 punt_main_t *pm = &punt_main;
640 for (i = 0; i < vec_len (pm->ready_fds); i++)
642 total_count += punt_socket_rx_fd (vm, node, pm->ready_fds[i]);
643 vec_del1 (pm->ready_fds, i);
/* Registers the "punt-socket-rx" graph node: an input node in interrupt
   state with trace support, run by punt_socket_rx, with the punt error
   counters and three next nodes. */
648 VLIB_REGISTER_NODE (punt_socket_rx_node) =
650 .function = punt_socket_rx,
651 .name = "punt-socket-rx",
652 .flags = VLIB_NODE_FLAG_TRACE_SUPPORTED,
653 .type = VLIB_NODE_TYPE_INPUT,
654 .state = VLIB_NODE_STATE_INTERRUPT,
656 .n_errors = PUNT_N_ERROR,
657 .error_strings = punt_error_strings,
658 .n_next_nodes = PUNT_SOCKET_RX_N_NEXT,
/* Next-node names, indexed by enum punt_socket_rx_next_e. */
660 [PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT] = "interface-output",
661 [PUNT_SOCKET_RX_NEXT_IP4_LOOKUP] = "ip4-lookup",
662 [PUNT_SOCKET_RX_NEXT_IP6_LOOKUP] = "ip6-lookup",
664 .format_trace = format_punt_trace,
668 * fd.io coding-style-patch-verification: ON
671 * eval: (c-set-style "gnu")