2 *------------------------------------------------------------------
3 * Copyright (c) 2018 Cisco and/or its affiliates.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 *------------------------------------------------------------------
18 #include <vlib/vlib.h>
19 #include <vlib/unix/unix.h>
20 #include <vlib/pci/pci.h>
21 #include <vnet/ethernet/ethernet.h>
22 #include <vnet/devices/devices.h>
/*
 * Command flags of a TX descriptor, OR-ed into qword[1] by the TX path.
 * Flag number x lands on bit (x + 4); the low four bits of qword[1] are
 * the field read back by avf_tx_desc_get_dtyp ().
 * The argument is parenthesized so that an expression (e.g. "a & b" or
 * "c ? 0 : 1") can be passed without changing the shift amount.
 */
#define AVF_TXQ_DESC_CMD(x) (1 << ((x) + 4))
#define AVF_TXQ_DESC_CMD_EOP AVF_TXQ_DESC_CMD(0)
#define AVF_TXQ_DESC_CMD_RS AVF_TXQ_DESC_CMD(1)
30 static_always_inline u8
31 avf_tx_desc_get_dtyp (avf_tx_desc_t * d)
33 return d->qword[1] & 0x0f;
/*
 * Transmit function for an AVF interface: frees ring entries whose
 * descriptors are marked done, writes one TX descriptor per buffer of the
 * frame onto the ring of the queue chosen for the calling thread, and then
 * publishes the new ring position through the queue tail pointer.
 *
 * vm    - vlib main, handed to the buffer helpers.
 * node  - node runtime; its runtime_data is read as a
 *         vnet_interface_output_runtime_t to obtain dev_instance.
 * frame - used below (vlib_frame_args, n_vectors).
 *         NOTE(review): its declaration is not among the lines visible here.
 *
 * Returns frame->n_vectors - n_left. n_left starts at frame->n_vectors;
 * the statements that decrement it are not visible in this listing.
 *
 * NOTE(review): a number of lines of this function (braces, loop headers,
 * some assignments) are absent from this listing. The comments below only
 * describe statements that are visible.
 */
37 CLIB_MULTIARCH_FN (avf_interface_tx) (vlib_main_t * vm,
38 vlib_node_runtime_t * node,
41 avf_main_t *am = &avf_main;
42 vnet_interface_output_runtime_t *rd = (void *) node->runtime_data;
43 avf_device_t *ad = pool_elt_at_index (am->devices, rd->dev_instance);
/* Queue selection: the thread index is narrowed to u8 and then wrapped
   modulo the number of queue pairs, so several threads may share a queue. */
44 u32 thread_index = vlib_get_thread_index ();
45 u8 qid = thread_index;
46 avf_txq_t *txq = vec_elt_at_index (ad->txqs, qid % ad->num_queue_pairs);
47 avf_tx_desc_t *d0, *d1, *d2, *d3;
48 u32 *buffers = vlib_frame_args (frame);
49 u32 bi0, bi1, bi2, bi3;
50 u16 n_left = frame->n_vectors;
51 vlib_buffer_t *b0, *b1, *b2, *b3;
/* Ring indices are wrapped with "& mask"; this assumes txq->size is a
   power of two - TODO confirm where the queue is set up. */
52 u16 mask = txq->size - 1;
/* Paired with clib_spinlock_unlock_if_init () at the end of the function. */
54 clib_spinlock_lock_if_init (&txq->lock);
56 /* release consumed bufs */
/* Start at the oldest outstanding slot (next - n_bufs) and count
   consecutive descriptors whose type field reads 0x0F.
   NOTE(review): 0x0F presumably is the value written back once a
   descriptor has been processed - confirm against the hardware spec.
   The increment of n_free is not visible in this listing. */
59 u16 first, slot, n_free = 0;
60 first = slot = (txq->next - txq->n_bufs) & mask;
61 d0 = txq->descs + slot;
62 while (n_free < txq->n_bufs && avf_tx_desc_get_dtyp (d0) == 0x0F)
65 slot = (slot + 1) & mask;
66 d0 = txq->descs + slot;
/* Drop the counted entries from the outstanding total and free their
   buffers from the ring, starting at "first".
   NOTE(review): the doubled ';' below is a harmless empty statement. */
71 txq->n_bufs -= n_free;;
72 vlib_buffer_free_from_ring (vm, txq->bufs, first, txq->size,
/* Four-buffers-at-a-time path. buffers[4..7] are prefetched, so at least
   eight entries must be readable here; the loop condition that controls
   this is not visible in this listing. */
79 u16 slot0, slot1, slot2, slot3;
81 vlib_prefetch_buffer_with_index (vm, buffers[4], LOAD);
82 vlib_prefetch_buffer_with_index (vm, buffers[5], LOAD);
83 vlib_prefetch_buffer_with_index (vm, buffers[6], LOAD);
84 vlib_prefetch_buffer_with_index (vm, buffers[7], LOAD);
/* Ring slots following txq->next, wrapped with mask (the slot0 assignment
   is not visible in this listing). */
87 slot1 = (txq->next + 1) & mask;
88 slot2 = (txq->next + 2) & mask;
89 slot3 = (txq->next + 3) & mask;
91 d0 = txq->descs + slot0;
92 d1 = txq->descs + slot1;
93 d2 = txq->descs + slot2;
94 d3 = txq->descs + slot3;
/* Remember which buffer index occupies each slot; txq->bufs is what the
   release step above frees from. */
101 txq->bufs[slot0] = bi0;
102 txq->bufs[slot1] = bi1;
103 txq->bufs[slot2] = bi2;
104 txq->bufs[slot3] = bi3;
105 b0 = vlib_get_buffer (vm, bi0);
106 b1 = vlib_get_buffer (vm, bi1);
107 b2 = vlib_get_buffer (vm, bi2);
108 b3 = vlib_get_buffer (vm, bi3);
/* NOTE(review): "d" is not among the visible locals and this statement is
   incomplete here; presumably it sits in a disabled preprocessor branch -
   confirm against the full file. */
111 d->qword[0] = vlib_get_buffer_data_physical_address (vm, bi0) +
/* qword[0] of each descriptor receives the address of the buffer's data
   area as an integer.
   NOTE(review): only b->data is used; if the buffer header carries a start
   offset for the packet it is not applied here - verify. */
114 d0->qword[0] = pointer_to_uword (b0->data);
115 d1->qword[0] = pointer_to_uword (b1->data);
116 d2->qword[0] = pointer_to_uword (b2->data);
117 d3->qword[0] = pointer_to_uword (b3->data);
/* qword[1]: buffer length shifted to bit 34, OR-ed with the EOP and RS
   command flags (every buffer is sent as its own descriptor). */
120 u64 bits = AVF_TXQ_DESC_CMD_EOP | AVF_TXQ_DESC_CMD_RS;
121 d0->qword[1] = ((u64) b0->current_length) << 34 | bits;
122 d1->qword[1] = ((u64) b1->current_length) << 34 | bits;
123 d2->qword[1] = ((u64) b2->current_length) << 34 | bits;
124 d3->qword[1] = ((u64) b3->current_length) << 34 | bits;
126 txq->next = (txq->next + 4) & mask;
/* Single-buffer path: same steps as above for one descriptor at
   txq->next. */
134 d0 = txq->descs + txq->next;
136 txq->bufs[txq->next] = bi0;
137 b0 = vlib_get_buffer (vm, bi0);
/* NOTE(review): same undeclared "d" / incomplete statement as in the
   four-buffer path above. */
140 d->qword[0] = vlib_get_buffer_data_physical_address (vm, bi0) +
143 d0->qword[0] = pointer_to_uword (b0->data);
146 d0->qword[1] = ((u64) b0->current_length) << 34;
147 d0->qword[1] |= AVF_TXQ_DESC_CMD_EOP | AVF_TXQ_DESC_CMD_RS;
149 txq->next = (txq->next + 1) & mask;
/* The barrier is issued before the tail write so that the descriptor
   stores above precede the publication of the new ring position. */
154 CLIB_MEMORY_BARRIER ();
155 *(txq->qtx_tail) = txq->next;
157 clib_spinlock_unlock_if_init (&txq->lock);
/* Number of buffers accepted from the frame. */
159 return frame->n_vectors - n_left;
/*
 * Multiarch dispatch, compiled only when CLIB_MULTIARCH_VARIANT is not
 * defined (the matching #endif is not visible in this listing).
 */
162 #ifndef CLIB_MULTIARCH_VARIANT
/* Declared __clib_weak: the checks below test each symbol for being
   non-null before using it, so a variant that was not built is skipped. */
164 vlib_node_function_t __clib_weak avf_interface_tx_avx512;
165 vlib_node_function_t __clib_weak avf_interface_tx_avx2;
/*
 * Pick the TX function variant for avf_device_class: the AVX-512 variant
 * if it is present and the CPU reports avx512f, otherwise the AVX2 variant
 * if it is present and the CPU reports avx2. When neither applies, the
 * visible code leaves avf_device_class.tx_function untouched.
 * Marked __clib_constructor - presumably run automatically at load time;
 * confirm against the macro definition.
 */
166 static void __clib_constructor
167 avf_interface_tx_multiarch_select (void)
169 if (avf_interface_tx_avx512 && clib_cpu_supports_avx512f ())
170 avf_device_class.tx_function = avf_interface_tx_avx512;
171 else if (avf_interface_tx_avx2 && clib_cpu_supports_avx2 ())
172 avf_device_class.tx_function = avf_interface_tx_avx2;
178 * fd.io coding-style-patch-verification: ON
181 * eval: (c-set-style "gnu")