/*
 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16 #include <vlibmemory/api.h>
17 #include <vlib/vlib.h>
19 #include <vppinfra/hash.h>
20 #include <vppinfra/error.h>
21 #include <vppinfra/elog.h>
23 #include <vnet/vnet.h>
24 #include <vnet/ip/ip.h>
25 #include <vnet/udp/udp.h>
26 #include <vnet/udp/udp_packet.h>
27 #include <vnet/session/session.h>
29 static vlib_error_desc_t udp_error_counters[] = {
30 #define udp_error(f, n, s, d) { #n, d, VL_COUNTER_SEVERITY_##s },
31 #include "udp_error.def"
42 /* packet trace format function */
44 format_udp_input_trace (u8 * s, va_list * args)
46 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
47 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
48 udp_input_trace_t *t = va_arg (*args, udp_input_trace_t *);
50 s = format (s, "UDP_INPUT: connection %d, disposition %d, thread %d",
51 t->connection, t->disposition, t->thread_index);
/* Next nodes of the udp input nodes, as (enum suffix, node name) pairs. */
#define foreach_udp_input_next                  \
  _ (DROP, "error-drop")

/*
 * Next-node indices generated from foreach_udp_input_next;
 * UDP_INPUT_N_NEXT is the number of entries and sizes .next_nodes in the
 * node registrations.
 * NOTE(review): the typedef name is not visible in this listing -- confirm.
 */
typedef enum
{
#define _(s, n) UDP_INPUT_NEXT_##s,
  foreach_udp_input_next
#undef _
    UDP_INPUT_N_NEXT,
} udp_input_next_t;
67 udp_input_inc_counter (vlib_main_t * vm, u8 is_ip4, u8 evt, u8 val)
70 vlib_node_increment_counter (vm, udp4_input_node.index, evt, val);
72 vlib_node_increment_counter (vm, udp6_input_node.index, evt, val);
/*
 * Push a per-frame tally array (UDP_N_ERROR entries, indexed by error code)
 * into the node counters through udp_input_inc_counter(). Zero entries are
 * skipped. Wrapped in do/while (0) so the macro behaves as one statement.
 * NOTE(review): the zero-entry skip is restored from a line missing in this
 * listing -- confirm.
 */
#define udp_store_err_counters(vm, is_ip4, cnts)                        \
  do                                                                    \
    {                                                                   \
      int _ci;                                                          \
      for (_ci = 0; _ci < UDP_N_ERROR; _ci++)                           \
        if ((cnts)[_ci])                                                \
          udp_input_inc_counter ((vm), (is_ip4), _ci, (cnts)[_ci]);     \
    }                                                                   \
  while (0)

/*
 * Add val to entry err of a per-frame tally array.
 * NOTE(review): the macro body is missing from this listing; restored from
 * its name and its single call site -- confirm.
 */
#define udp_inc_err_counter(cnts, err, val)                             \
  do                                                                    \
    {                                                                   \
      (cnts)[(err)] += (val);                                           \
    }                                                                   \
  while (0)
89 udp_trace_buffer (vlib_main_t * vm, vlib_node_runtime_t * node,
90 vlib_buffer_t * b, session_t * s, u16 error0)
94 if (PREDICT_TRUE (!(b->flags & VLIB_BUFFER_IS_TRACED)))
97 t = vlib_add_trace (vm, node, b, sizeof (*t));
98 t->connection = s ? s->connection_index : ~0;
99 t->disposition = error0;
100 t->thread_index = s ? s->thread_index : vm->thread_index;
103 static udp_connection_t *
104 udp_connection_accept (udp_connection_t * listener, session_dgram_hdr_t * hdr,
107 udp_connection_t *uc;
109 uc = udp_connection_alloc (thread_index);
110 ip_copy (&uc->c_lcl_ip, &hdr->lcl_ip, hdr->is_ip4);
111 ip_copy (&uc->c_rmt_ip, &hdr->rmt_ip, hdr->is_ip4);
112 uc->c_lcl_port = hdr->lcl_port;
113 uc->c_rmt_port = hdr->rmt_port;
114 uc->c_is_ip4 = hdr->is_ip4;
115 uc->c_fib_index = listener->c_fib_index;
116 uc->mss = listener->mss;
117 uc->flags |= UDP_CONN_F_CONNECTED;
118 uc->cfg_flags = listener->cfg_flags;
120 if (session_dgram_accept (&uc->connection, listener->c_s_index,
121 listener->c_thread_index))
123 udp_connection_free (uc);
127 udp_connection_share_port (uc->c_lcl_port, uc->c_is_ip4);
132 udp_connection_enqueue (udp_connection_t * uc0, session_t * s0,
133 session_dgram_hdr_t * hdr0, u32 thread_index,
134 vlib_buffer_t * b, u8 queue_event, u32 * error0)
138 if (!(uc0->flags & UDP_CONN_F_CONNECTED))
140 clib_spinlock_lock (&uc0->rx_lock);
142 wrote0 = session_enqueue_dgram_connection_cl (
143 s0, hdr0, b, TRANSPORT_PROTO_UDP, queue_event);
145 clib_spinlock_unlock (&uc0->rx_lock);
147 /* Expect cl udp enqueue to fail because fifo enqueue */
148 if (PREDICT_FALSE (wrote0 == 0))
149 *error0 = UDP_ERROR_FIFO_FULL;
154 if (svm_fifo_max_enqueue_prod (s0->rx_fifo)
155 < hdr0->data_length + sizeof (session_dgram_hdr_t))
157 *error0 = UDP_ERROR_FIFO_FULL;
161 /* If session is owned by another thread and rx event needed,
162 * enqueue event now while we still have the peeker lock */
163 if (s0->thread_index != thread_index)
165 wrote0 = session_enqueue_dgram_connection2 (
166 s0, hdr0, b, TRANSPORT_PROTO_UDP,
167 queue_event && !svm_fifo_has_event (s0->rx_fifo));
171 wrote0 = session_enqueue_dgram_connection (
172 s0, hdr0, b, TRANSPORT_PROTO_UDP, queue_event);
175 /* In some rare cases, session_enqueue_dgram_connection can fail because a
176 * chunk cannot be allocated in the RX FIFO */
177 if (PREDICT_FALSE (wrote0 == 0))
178 *error0 = UDP_ERROR_FIFO_NOMEM;
181 always_inline session_t *
182 udp_parse_and_lookup_buffer (vlib_buffer_t * b, session_dgram_hdr_t * hdr,
189 /* udp_local hands us a pointer to the udp data */
190 udp = (udp_header_t *) (vlib_buffer_get_current (b) - sizeof (*udp));
191 fib_index = vnet_buffer (b)->ip.fib_index;
193 hdr->data_offset = 0;
194 hdr->lcl_port = udp->dst_port;
195 hdr->rmt_port = udp->src_port;
196 hdr->is_ip4 = is_ip4;
203 /* TODO: must fix once udp_local does ip options correctly */
204 ip4 = (ip4_header_t *) (((u8 *) udp) - sizeof (*ip4));
205 ip_set (&hdr->lcl_ip, &ip4->dst_address, 1);
206 ip_set (&hdr->rmt_ip, &ip4->src_address, 1);
207 hdr->data_length = clib_net_to_host_u16 (ip4->length);
208 hdr->data_length -= sizeof (ip4_header_t) + sizeof (udp_header_t);
209 s = session_lookup_safe4 (fib_index, &ip4->dst_address,
210 &ip4->src_address, udp->dst_port,
211 udp->src_port, TRANSPORT_PROTO_UDP);
217 ip60 = (ip6_header_t *) (((u8 *) udp) - sizeof (*ip60));
218 ip_set (&hdr->lcl_ip, &ip60->dst_address, 0);
219 ip_set (&hdr->rmt_ip, &ip60->src_address, 0);
220 hdr->data_length = clib_net_to_host_u16 (ip60->payload_length);
221 hdr->data_length -= sizeof (udp_header_t);
222 s = session_lookup_safe6 (fib_index, &ip60->dst_address,
223 &ip60->src_address, udp->dst_port,
224 udp->src_port, TRANSPORT_PROTO_UDP);
227 /* Set the sw_if_index[VLIB_RX] to the interface we received
228 * the connection on (the local interface) */
229 vnet_buffer (b)->sw_if_index[VLIB_RX] = vnet_buffer (b)->ip.rx_sw_if_index;
231 if (PREDICT_TRUE (!(b->flags & VLIB_BUFFER_NEXT_PRESENT)))
232 b->current_length = hdr->data_length;
234 b->total_length_not_including_first_buffer = hdr->data_length
241 udp46_input_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
242 vlib_frame_t * frame, u8 is_ip4)
244 u32 thread_index = vm->thread_index, n_left_from, *from, *first_buffer;
245 vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b;
246 u16 err_counters[UDP_N_ERROR] = { 0 };
248 from = first_buffer = vlib_frame_vector_args (frame);
249 n_left_from = frame->n_vectors;
250 vlib_get_buffers (vm, from, bufs, n_left_from);
254 while (n_left_from > 0)
256 u32 error0 = UDP_ERROR_ENQUEUED;
257 session_dgram_hdr_t hdr0;
258 udp_connection_t *uc0;
261 s0 = udp_parse_and_lookup_buffer (b[0], &hdr0, is_ip4);
262 if (PREDICT_FALSE (!s0))
264 error0 = UDP_ERROR_NO_LISTENER;
268 if (s0->session_state == SESSION_STATE_OPENED)
271 uc0 = udp_connection_from_transport (session_get_transport (s0));
272 uc0->sw_if_index = vnet_buffer (b[0])->sw_if_index[VLIB_RX];
273 if (uc0->flags & UDP_CONN_F_CONNECTED)
275 if (s0->thread_index != thread_index)
278 * Clone the transport. It will be cleaned up with the
279 * session once we notify the session layer.
281 uc0 = udp_connection_clone_safe (s0->connection_index,
283 ASSERT (s0->session_index == uc0->c_s_index);
286 * Ask session layer for a new session.
288 session_dgram_connect_notify (&uc0->connection,
289 s0->thread_index, &s0);
293 s0->session_state = SESSION_STATE_READY;
295 udp_connection_enqueue (uc0, s0, &hdr0, thread_index, b[0],
296 queue_event, &error0);
298 else if (s0->session_state == SESSION_STATE_READY ||
299 s0->session_state == SESSION_STATE_ACCEPTING)
301 uc0 = udp_connection_from_transport (session_get_transport (s0));
302 udp_connection_enqueue (uc0, s0, &hdr0, thread_index, b[0], 1,
305 else if (s0->session_state == SESSION_STATE_LISTENING)
307 uc0 = udp_connection_from_transport (session_get_transport (s0));
308 if (uc0->flags & UDP_CONN_F_CONNECTED)
310 uc0 = udp_connection_accept (uc0, &hdr0, thread_index);
313 error0 = UDP_ERROR_CREATE_SESSION;
316 s0 = session_get (uc0->c_s_index, uc0->c_thread_index);
317 uc0->sw_if_index = vnet_buffer (b[0])->sw_if_index[VLIB_RX];
318 error0 = UDP_ERROR_ACCEPT;
320 udp_connection_enqueue (uc0, s0, &hdr0, thread_index, b[0], 1,
325 error0 = UDP_ERROR_NOT_READY;
329 if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
330 udp_trace_buffer (vm, node, b[0], s0, error0);
335 udp_inc_err_counter (err_counters, error0, 1);
338 vlib_buffer_free (vm, first_buffer, frame->n_vectors);
339 session_main_flush_enqueue_events (TRANSPORT_PROTO_UDP, thread_index);
340 udp_store_err_counters (vm, is_ip4, err_counters);
341 return frame->n_vectors;
345 udp4_input (vlib_main_t * vm, vlib_node_runtime_t * node,
346 vlib_frame_t * frame)
348 return udp46_input_inline (vm, node, frame, 1);
351 VLIB_REGISTER_NODE (udp4_input_node) =
353 .function = udp4_input,
354 .name = "udp4-input",
355 .vector_size = sizeof (u32),
356 .format_trace = format_udp_input_trace,
357 .type = VLIB_NODE_TYPE_INTERNAL,
358 .n_errors = UDP_N_ERROR,
359 .error_counters = udp_error_counters,
360 .n_next_nodes = UDP_INPUT_N_NEXT,
362 #define _(s, n) [UDP_INPUT_NEXT_##s] = n,
363 foreach_udp_input_next
369 udp6_input (vlib_main_t * vm, vlib_node_runtime_t * node,
370 vlib_frame_t * frame)
372 return udp46_input_inline (vm, node, frame, 0);
375 VLIB_REGISTER_NODE (udp6_input_node) =
377 .function = udp6_input,
378 .name = "udp6-input",
379 .vector_size = sizeof (u32),
380 .format_trace = format_udp_input_trace,
381 .type = VLIB_NODE_TYPE_INTERNAL,
382 .n_errors = UDP_N_ERROR,
383 .error_counters = udp_error_counters,
384 .n_next_nodes = UDP_INPUT_N_NEXT,
386 #define _(s, n) [UDP_INPUT_NEXT_##s] = n,
387 foreach_udp_input_next
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */