2 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vlibmemory/api.h>
17 #include <vlib/vlib.h>
19 #include <vppinfra/hash.h>
20 #include <vppinfra/error.h>
21 #include <vppinfra/elog.h>
23 #include <vnet/vnet.h>
24 #include <vnet/pg/pg.h>
25 #include <vnet/ip/ip.h>
26 #include <vnet/udp/udp.h>
27 #include <vnet/udp/udp_packet.h>
28 #include <vnet/session/session.h>
/* Table of UDP error strings, indexed by error code.
 * While udp_error.def is included, udp_error(n,s) expands to just its
 * string argument s, so each entry of that file (presumably a list of
 * udp_error (name, string) lines -- TODO confirm) contributes one string.
 * Both node registrations in this file use this table for .error_strings
 * and derive .n_errors from its length. */
30 static char *udp_error_strings[] = {
31 #define udp_error(n,s) s,
32 #include "udp_error.def"
/* Formats one udp_input_trace_t record for packet-trace output.
 * Three arguments are pulled from args, in this order: a vlib_main_t * and
 * a vlib_node_t * (both marked unused) and the udp_input_trace_t * to print.
 * The connection, disposition and thread_index fields of the record are
 * appended to s as decimal numbers.
 * Registered as .format_trace of both udp4-input and udp6-input. */
43 /* packet trace format function */
45 format_udp_input_trace (u8 * s, va_list * args)
47 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
48 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
49 udp_input_trace_t *t = va_arg (*args, udp_input_trace_t *);
51 s = format (s, "UDP_INPUT: connection %d, disposition %d, thread %d",
52 t->connection, t->disposition, t->thread_index);
/* X-macro listing the next nodes of the UDP input nodes as
 * _ (symbol, node name) pairs.  The only entry is DROP, mapped to the
 * error-drop node.  The list is expanded twice in this file with different
 * definitions of _ : once for the next-index enumerators below and once in
 * each node registration. */
56 #define foreach_udp_input_next \
57 _ (DROP, "error-drop")
/* With this definition of _ every list entry becomes one
 * UDP_INPUT_NEXT_<symbol> enumerator (UDP_INPUT_NEXT_DROP here). */
61 #define _(s, n) UDP_INPUT_NEXT_##s,
62 foreach_udp_input_next
/* Adds val to error counter evt of a UDP input node.
 *
 * vm      vlib main passed through to vlib_node_increment_counter
 * is_ip4  address family selector; presumably picks udp4_input_node when
 *         set and udp6_input_node otherwise (the branch itself is not
 *         visible in this view -- TODO confirm)
 * evt     counter index (a UDP_ERROR_* value at the visible call site)
 * val     amount to add; the common case is expected to be zero, see the
 *         PREDICT_TRUE test
 *
 * NOTE(review): val is declared u8, but the caller in udp46_input_inline
 * passes a u32 count.  The implicit conversion keeps only the low 8 bits,
 * so a count of 256 arrives here as 0 and larger counts are under-reported.
 * Confirm whether val (and evt) should be widened. */
68 udp_input_inc_counter (vlib_main_t * vm, u8 is_ip4, u8 evt, u8 val)
70 if (PREDICT_TRUE (!val))
74 vlib_node_increment_counter (vm, udp4_input_node.index, evt, val);
76 vlib_node_increment_counter (vm, udp6_input_node.index, evt, val);
/* Shared worker of the udp4-input and udp6-input nodes: hands the payload
 * of every UDP packet in frame to the session layer as a datagram.
 *
 * vm      vlib main of the calling thread (vm->thread_index is cached)
 * node    node runtime; supplies the error table and the trace flag
 * frame   frame whose vector holds the buffer indices to process
 * is_ip4  1 when called from udp4_input, 0 when called from udp6_input
 *
 * Returns frame->n_vectors.
 *
 * NOTE(review): several lines of this function are not visible in this view
 * (braces, branch keywords and the declarations of b0, data0, udp0, ip40,
 * ip60, s0, wrote0 and queue_event).  The outline below is read off the
 * visible statements only; confirm the exact control flow against the
 * complete file.
 *
 * Per buffer:
 *  - The UDP header is taken to sit sizeof (udp_header_t) before the current
 *    data pointer and the IP header immediately before the UDP header.
 *  - A session is looked up with session_lookup_safe4 / session_lookup_safe6
 *    using the fib index, both addresses and both ports.  A missing session
 *    is reported as UDP_ERROR_NO_LISTENER.
 *  - SESSION_STATE_OPENED: the transport is fetched; for connections flagged
 *    UDP_CONN_F_CONNECTED whose session belongs to another thread the
 *    connection is cloned, the peeker is removed and the session layer is
 *    notified via session_dgram_connect_notify.  The session state is set to
 *    SESSION_STATE_READY.
 *  - SESSION_STATE_READY: the transport and UDP connection are fetched.
 *  - SESSION_STATE_LISTENING: for listeners flagged UDP_CONN_F_CONNECTED a
 *    child connection is allocated on this thread, filled in from the packet
 *    addresses and ports and the listener fib index and mss, and offered to
 *    session_stream_accept.  Failure is reported as UDP_ERROR_CREATE_SESSION;
 *    otherwise the new session is marked READY, udp_connection_share_port is
 *    called for the local port and error0 becomes UDP_ERROR_LISTENER.
 *  - UDP_ERROR_NOT_READY is also assigned on one path (presumably any other
 *    session state -- TODO confirm).
 *  - If the rx fifo cannot take data_len plus a session_dgram_hdr_t the
 *    packet is reported as UDP_ERROR_FIFO_FULL.
 *  - Otherwise a session_dgram_hdr_t is filled in and the datagram is
 *    enqueued with session_enqueue_dgram_connection while uc0->rx_lock is
 *    held.
 *  - b0->error is set from node->errors[error0] and a trace record is added
 *    for traced buffers.
 *
 * After the loop every buffer of the frame is freed, pending enqueue events
 * are flushed and the value returned by the flush is added to the
 * UDP_ERROR_EVENT_FIFO_FULL counter. */
80 udp46_input_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
81 vlib_frame_t * frame, u8 is_ip4)
83 u32 n_left_from, *from;
84 u32 errors, *first_buffer;
85 u32 my_thread_index = vm->thread_index;
/* first_buffer remembers the start of the buffer-index vector so that the
 * whole frame can be freed in one call after the loop */
87 from = first_buffer = vlib_frame_vector_args (frame);
88 n_left_from = frame->n_vectors;
90 while (n_left_from > 0)
92 u32 bi0, fib_index0, data_len;
/* error0 starts out as the success disposition and is overwritten on every
 * failure path below */
94 u32 error0 = UDP_ERROR_ENQUEUED;
100 udp_connection_t *uc0, *child0, *new_uc0;
101 transport_connection_t *tc0;
103 void *rmt_addr, *lcl_addr;
104 session_dgram_hdr_t hdr0;
/* NOTE(review): no enqueue to a next frame is visible in this function and
 * all buffers are freed after the loop, so the following comment looks
 * stale -- confirm */
107 /* speculatively enqueue b0 to the current next frame */
112 b0 = vlib_get_buffer (vm, bi0);
114 /* udp_local hands us a pointer to the udp data */
115 data0 = vlib_buffer_get_current (b0);
116 udp0 = (udp_header_t *) (data0 - sizeof (*udp0));
117 fib_index0 = vnet_buffer (b0)->ip.fib_index;
/* IPv4 case: the IP header is assumed to be exactly sizeof (ip4_header_t)
 * bytes, i.e. without options, as the TODO below points out */
121 /* TODO: must fix once udp_local does ip options correctly */
122 ip40 = (ip4_header_t *) (((u8 *) udp0) - sizeof (*ip40));
123 s0 = session_lookup_safe4 (fib_index0, &ip40->dst_address,
124 &ip40->src_address, udp0->dst_port,
125 udp0->src_port, TRANSPORT_PROTO_UDP);
126 lcl_addr = &ip40->dst_address;
127 rmt_addr = &ip40->src_address;
/* payload size = IPv4 total length minus the IP and UDP header sizes.
 * NOTE(review): no check is visible that the length field covers both
 * headers; data_len is a u32 and would wrap around -- confirm that this
 * is validated upstream */
128 data_len = clib_net_to_host_u16 (ip40->length);
129 data_len -= sizeof (ip4_header_t) + sizeof (udp_header_t);
/* IPv6 case: same steps with the IPv6 header located directly before the
 * UDP header */
133 ip60 = (ip6_header_t *) (((u8 *) udp0) - sizeof (*ip60));
134 s0 = session_lookup_safe6 (fib_index0, &ip60->dst_address,
135 &ip60->src_address, udp0->dst_port,
136 udp0->src_port, TRANSPORT_PROTO_UDP);
137 lcl_addr = &ip60->dst_address;
138 rmt_addr = &ip60->src_address;
/* payload size = IPv6 payload_length minus the UDP header size; the same
 * wrap-around remark as for IPv4 applies */
139 data_len = clib_net_to_host_u16 (ip60->payload_length);
140 data_len -= sizeof (udp_header_t);
/* the lookup found no session for these addresses and ports */
143 if (PREDICT_FALSE (!s0))
145 error0 = UDP_ERROR_NO_LISTENER;
149 if (s0->session_state == SESSION_STATE_OPENED)
151 /* TODO optimization: move cl session to right thread
152 * However, since such a move would affect the session handle,
153 * which we pass 'raw' to the app, we'd also have to notify the
154 * app of the change or change the way we pass handles to apps.
156 tc0 = session_get_transport (s0);
157 uc0 = udp_get_connection_from_transport (tc0);
158 if (uc0->flags & UDP_CONN_F_CONNECTED)
160 if (s0->thread_index != vlib_get_thread_index ())
163 * Clone the transport. It will be cleaned up with the
164 * session once we notify the session layer.
167 udp_connection_clone_safe (s0->connection_index,
169 ASSERT (s0->session_index == new_uc0->c_s_index);
172 * Drop the 'lock' on pool resize
174 session_pool_remove_peeker (s0->thread_index);
175 session_dgram_connect_notify (&new_uc0->connection,
176 s0->thread_index, &s0);
177 tc0 = &new_uc0->connection;
182 s0->session_state = SESSION_STATE_READY;
185 else if (s0->session_state == SESSION_STATE_READY)
187 tc0 = session_get_transport (s0);
188 uc0 = udp_get_connection_from_transport (tc0);
190 else if (s0->session_state == SESSION_STATE_LISTENING)
192 tc0 = listen_session_get_transport (s0);
193 uc0 = udp_get_connection_from_transport (tc0);
194 if (uc0->flags & UDP_CONN_F_CONNECTED)
196 child0 = udp_connection_alloc (my_thread_index);
199 ip_set (&child0->c_lcl_ip, &ip40->dst_address, 1);
200 ip_set (&child0->c_rmt_ip, &ip40->src_address, 1);
204 ip_set (&child0->c_lcl_ip, &ip60->dst_address, 0);
205 ip_set (&child0->c_rmt_ip, &ip60->src_address, 0);
207 child0->c_lcl_port = udp0->dst_port;
208 child0->c_rmt_port = udp0->src_port;
209 child0->c_is_ip4 = is_ip4;
210 child0->c_fib_index = tc0->fib_index;
211 child0->mss = uc0->mss;
212 child0->flags |= UDP_CONN_F_CONNECTED;
214 if (session_stream_accept (&child0->connection,
215 tc0->s_index, tc0->thread_index, 1))
217 error0 = UDP_ERROR_CREATE_SESSION;
220 s0 = session_get (child0->c_s_index, child0->c_thread_index);
221 s0->session_state = SESSION_STATE_READY;
222 tc0 = &child0->connection;
223 uc0 = udp_get_connection_from_transport (tc0);
224 udp_connection_share_port (clib_net_to_host_u16
225 (uc0->c_lcl_port), uc0->c_is_ip4);
226 error0 = UDP_ERROR_LISTENER;
231 error0 = UDP_ERROR_NOT_READY;
236 if (svm_fifo_max_enqueue_prod (s0->rx_fifo)
237 < data_len + sizeof (session_dgram_hdr_t))
239 error0 = UDP_ERROR_FIFO_FULL;
243 hdr0.data_length = data_len;
244 if (PREDICT_TRUE (!(b0->flags & VLIB_BUFFER_NEXT_PRESENT)))
245 b0->current_length = data_len;
247 b0->total_length_not_including_first_buffer = data_len
248 - b0->current_length;
250 hdr0.data_offset = 0;
251 ip_set (&hdr0.lcl_ip, lcl_addr, is_ip4);
252 ip_set (&hdr0.rmt_ip, rmt_addr, is_ip4);
253 hdr0.lcl_port = udp0->dst_port;
254 hdr0.rmt_port = udp0->src_port;
255 hdr0.is_ip4 = is_ip4;
257 clib_spinlock_lock (&uc0->rx_lock);
258 /* If session is owned by another thread and rx event needed,
259 * enqueue event now while we still have the peeker lock */
260 if (s0->thread_index != my_thread_index)
/* cross-thread case: the enqueue itself is asked not to queue an event;
 * the notification is sent explicitly right after, and only when
 * queue_event is set and the fifo has no event pending.
 * NOTE(review): the assignment of queue_event is not visible here */
262 wrote0 = session_enqueue_dgram_connection (s0, &hdr0, b0,
264 /* queue event */ 0);
265 if (queue_event && !svm_fifo_has_event (s0->rx_fifo))
266 session_enqueue_notify (s0);
270 wrote0 = session_enqueue_dgram_connection (s0, &hdr0, b0,
274 clib_spinlock_unlock (&uc0->rx_lock);
/* NOTE(review): presumably releases the peeker reference taken by the
 * safe session lookup; listening sessions are excluded -- confirm */
277 if (s0->session_state != SESSION_STATE_LISTENING)
278 session_pool_remove_peeker (s0->thread_index);
/* record the disposition of this packet on the buffer */
282 b0->error = node->errors[error0];
284 if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE)
285 && (b0->flags & VLIB_BUFFER_IS_TRACED)))
287 udp_input_trace_t *t = vlib_add_trace (vm, node, b0,
/* ~0 marks a packet for which no session was found */
290 t->connection = s0 ? s0->connection_index : ~0;
291 t->disposition = error0;
292 t->thread_index = my_thread_index;
/* every buffer of the frame is released here, whatever its disposition */
296 vlib_buffer_free (vm, first_buffer, frame->n_vectors);
/* the value returned by the flush is accounted as event-fifo-full errors.
 * NOTE(review): errors is a u32 but udp_input_inc_counter takes a u8, so
 * the count is truncated to its low 8 bits -- confirm */
297 errors = session_main_flush_enqueue_events (TRANSPORT_PROTO_UDP,
299 udp_input_inc_counter (vm, is_ip4, UDP_ERROR_EVENT_FIFO_FULL, errors);
300 return frame->n_vectors;
/* Node function of udp4-input: forwards vm, node and frame to
 * udp46_input_inline with is_ip4 set to 1 and returns its result. */
304 udp4_input (vlib_main_t * vm, vlib_node_runtime_t * node,
305 vlib_frame_t * frame)
307 return udp46_input_inline (vm, node, frame, 1);
/* Registration of the udp4-input graph node.
 * The node runs udp4_input, is of type VLIB_NODE_TYPE_INTERNAL, uses
 * sizeof (u32) as its vector element size, formats traces with
 * format_udp_input_trace and reports errors through udp_error_strings.
 * The trailing expansion of foreach_udp_input_next produces one
 * [UDP_INPUT_NEXT_<symbol>] = node-name designated initializer per entry
 * (only DROP, naming error-drop); presumably these fill the next-node
 * table, whose opening line is not visible here -- TODO confirm. */
311 VLIB_REGISTER_NODE (udp4_input_node) =
313 .function = udp4_input,
314 .name = "udp4-input",
315 .vector_size = sizeof (u32),
316 .format_trace = format_udp_input_trace,
317 .type = VLIB_NODE_TYPE_INTERNAL,
318 .n_errors = ARRAY_LEN (udp_error_strings),
319 .error_strings = udp_error_strings,
320 .n_next_nodes = UDP_INPUT_N_NEXT,
322 #define _(s, n) [UDP_INPUT_NEXT_##s] = n,
323 foreach_udp_input_next
/* Node function of udp6-input: forwards vm, node and frame to
 * udp46_input_inline with is_ip4 set to 0 and returns its result. */
330 udp6_input (vlib_main_t * vm, vlib_node_runtime_t * node,
331 vlib_frame_t * frame)
333 return udp46_input_inline (vm, node, frame, 0);
/* Registration of the udp6-input graph node.
 * Identical to the udp4-input registration except for the node function
 * (udp6_input) and the node name: internal node type, sizeof (u32) vector
 * element size, traces formatted by format_udp_input_trace and errors
 * reported through udp_error_strings.
 * The trailing expansion of foreach_udp_input_next produces one
 * [UDP_INPUT_NEXT_<symbol>] = node-name designated initializer per entry
 * (only DROP, naming error-drop); presumably these fill the next-node
 * table, whose opening line is not visible here -- TODO confirm. */
337 VLIB_REGISTER_NODE (udp6_input_node) =
339 .function = udp6_input,
340 .name = "udp6-input",
341 .vector_size = sizeof (u32),
342 .format_trace = format_udp_input_trace,
343 .type = VLIB_NODE_TYPE_INTERNAL,
344 .n_errors = ARRAY_LEN (udp_error_strings),
345 .error_strings = udp_error_strings,
346 .n_next_nodes = UDP_INPUT_N_NEXT,
348 #define _(s, n) [UDP_INPUT_NEXT_##s] = n,
349 foreach_udp_input_next
356 * fd.io coding-style-patch-verification: ON
359 * eval: (c-set-style "gnu")