Fix bugs and do some optimization in IPFIX code
[vpp.git] / vnet / vnet / flow / flow_report_sample.c
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  *     http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 #include <vnet/flow/flow_report.h>
16 #include <vnet/flow/flow_report_sample.h>
17 #include <vnet/api_errno.h>
18
19 typedef struct {
20   u32 classify_table_index;
21 } flow_report_sample_main_t;
22
23 flow_report_sample_main_t flow_report_sample_main;
24
25 static u8 * template_rewrite (flow_report_main_t * frm,
26                               flow_report_t * fr,
27                               ip4_address_t * collector_address,
28                               ip4_address_t * src_address)
29 {
30   vnet_classify_table_t * tblp;
31   vnet_classify_main_t * vcm = &vnet_classify_main;
32   flow_report_sample_main_t *fsm = 
33     (flow_report_sample_main_t *) fr->opaque;
34   ip4_header_t * ip;
35   udp_header_t * udp;
36   ipfix_message_header_t * h;
37   ipfix_set_header_t * s;
38   ipfix_template_header_t * t;
39   ipfix_field_specifier_t * f;
40   ipfix_field_specifier_t * first_field;
41   u8 * rewrite = 0;
42   ip4_ipfix_template_packet_t * tp;
43   i32 l3_offset = -2;  /* sizeof (ethernet_header_t) - sizeof (u32x4) */
44   u32 field_count = 0;
45   u32 field_index = 0;
46   
47   tblp = pool_elt_at_index (vcm->tables, fsm->classify_table_index);
48
49   /* 
50    * Mumble, assumes that we're not classifying on L2 or first 2 octets
51    * of L3..
52    */
53
54   ip = (ip4_header_t *)(((u8 *)(tblp->mask)) + l3_offset);
55   udp = (udp_header_t *)(ip+1);
56
57   /* Determine field count */
58 #define _(field,mask,item,length)                                       \
59   if ((field) == (mask))                                                \
60     {                                                                   \
61       field_count++;                                                    \
62                                                                         \
63       fr->fields_to_send = clib_bitmap_set (fr->fields_to_send,         \
64                                             field_index, 1);            \
65     }                                                                   \
66   field_index++;
67   
68   foreach_ipfix_field;
69 #undef _
70   /* Add packetTotalCount manually */
71   field_count += 1;
72
73   /* $$$ enterprise fields, at some later date */
74
75   /* allocate rewrite space */
76   vec_validate_aligned (rewrite, 
77                         sizeof (ip4_ipfix_template_packet_t) 
78                         + field_count * sizeof (ipfix_field_specifier_t) - 1,
79                         CLIB_CACHE_LINE_BYTES);
80
81   tp = (ip4_ipfix_template_packet_t *) rewrite;
82   ip = (ip4_header_t *) &tp->ip4;
83   udp = (udp_header_t *) (ip+1);
84   h = (ipfix_message_header_t *)(udp+1);
85   s = (ipfix_set_header_t *)(h+1);
86   t = (ipfix_template_header_t *)(s+1);
87   first_field = f = (ipfix_field_specifier_t *)(t+1);
88
89   ip->ip_version_and_header_length = 0x45;
90   ip->ttl = 254;
91   ip->protocol = IP_PROTOCOL_UDP;
92   ip->src_address.as_u32 = src_address->as_u32;
93   ip->dst_address.as_u32 = collector_address->as_u32;
94   udp->src_port = clib_host_to_net_u16 (4739 /* $$FIXME */);
95   udp->dst_port = clib_host_to_net_u16 (UDP_DST_PORT_ipfix);
96   udp->length = clib_host_to_net_u16 (vec_len(rewrite) - sizeof (*ip));
97
98   /* FIXUP: message header export_time */ 
99   /* FIXUP: message header sequence_number */
100   h->domain_id = clib_host_to_net_u32 (fr->domain_id);
101
102   /* Take another trip through the mask and build the template */
103   ip = (ip4_header_t *)(((u8 *)(tblp->mask)) + l3_offset);
104   udp = (udp_header_t *)(ip+1);
105 #define _(field,mask,item,length)                               \
106   if ((field) == (mask))                                        \
107     {                                                           \
108       f->e_id_length = ipfix_e_id_length (0 /* enterprise */,   \
109                                           item, length);        \
110       f++;                                                      \
111     }
112   foreach_ipfix_field;
113 #undef _
114
115   /* Add packetTotalCount manually */
116   f->e_id_length = ipfix_e_id_length (0 /* enterprise */, packetTotalCount, 8);
117   f++;
118
119   /* Back to the template packet... */
120   ip = (ip4_header_t *) &tp->ip4;
121   udp = (udp_header_t *) (ip+1);
122   
123   ASSERT (f - first_field);
124   /* Field count in this template */
125   t->id_count = ipfix_id_count (256 /* template_id */, f - first_field);
126
127   /* set length in octets*/
128   s->set_id_length = ipfix_set_id_length (2 /* set_id */, (u8 *) f - (u8 *)s);
129
130   /* message length in octets */
131   h->version_length = version_length ((u8 *)f - (u8 *)h);
132
133   ip->length = clib_host_to_net_u16 ((u8 *)f - (u8 *)ip);
134   ip->checksum = ip4_header_checksum (ip);
135
136   return rewrite;
137 }
138
139 static vlib_frame_t * send_flows (flow_report_main_t * frm, 
140                                   flow_report_t * fr,
141                                   vlib_frame_t * f, u32 * to_next, 
142                                   u32 node_index)
143 {
144   vnet_classify_main_t * vcm = &vnet_classify_main;
145   flow_report_sample_main_t * fsm = 
146     (flow_report_sample_main_t *) fr->opaque;
147   vnet_classify_table_t * t = 
148     pool_elt_at_index (vcm->tables, fsm->classify_table_index);
149   vnet_classify_bucket_t * b;
150   vnet_classify_entry_t * v, * save_v;
151   vlib_buffer_t *b0 = 0;
152   u32 next_offset = 0;
153   u32 bi0 = ~0;
154   int i, j, k;
155   ip4_ipfix_template_packet_t * tp;
156   ipfix_message_header_t * h = 0;
157   ipfix_set_header_t * s = 0;
158   ip4_header_t * ip;
159   udp_header_t * udp;
160   int field_index;
161   ip4_header_t * match;
162   u32 records_this_buffer;
163   u16 new_l0, old_l0;
164   ip_csum_t sum0;
165   vlib_main_t * vm = frm->vlib_main;
166   
167   while (__sync_lock_test_and_set (t->writer_lock, 1))
168     ; 
169   
170   for (i = 0; i < t->nbuckets; i++)
171     {
172       b = &t->buckets [i];
173       if (b->offset == 0)
174         continue;
175       
176       save_v = vnet_classify_get_entry (t, b->offset);
177       for (j = 0; j < (1<<b->log2_pages); j++)
178         {
179           for (k = 0; k < t->entries_per_page; k++)
180             {
181               v = vnet_classify_entry_at_index 
182                 (t, save_v, j*t->entries_per_page + k);
183               
184               if (vnet_classify_entry_is_free (v))
185                 continue;
186               
187               /* OK, we have something to send... */
188               if (PREDICT_FALSE (b0 == 0))
189                 {
190                   if (vlib_buffer_alloc (vm, &bi0, 1) != 1)
191                     goto flush;
192                   b0 = vlib_get_buffer (vm, bi0);
193                   
194                   u32 copy_len = sizeof(ip4_header_t) +
195                                  sizeof(udp_header_t) +
196                                  sizeof(ipfix_message_header_t);
197                   clib_memcpy (b0->data, fr->rewrite, copy_len);
198                   b0->current_data = 0;
199                   b0->current_length = copy_len;
200                   b0->flags |= VLIB_BUFFER_TOTAL_LENGTH_VALID;
201                   vnet_buffer (b0)->sw_if_index[VLIB_RX] = 0;
202                   /* $$$ for now, look up in fib-0. Later: arbitrary TX fib */
203                   vnet_buffer (b0)->sw_if_index[VLIB_TX] = ~0;
204                   
205                   tp = vlib_buffer_get_current (b0);
206                   ip = (ip4_header_t *) &tp->ip4;
207                   udp = (udp_header_t *) (ip+1);
208                   h = (ipfix_message_header_t *)(udp+1);
209                   s = (ipfix_set_header_t *)(h+1);
210                   
211                   /* FIXUP: message header export_time */ 
212                   h->export_time = (u32) 
213                     (((f64)frm->unix_time_0) + 
214                      (vlib_time_now(frm->vlib_main) - frm->vlib_time_0));
215                   h->export_time = clib_host_to_net_u32(h->export_time);
216                   
217                   /* FIXUP: message header sequence_number */
218                   h->sequence_number = fr->sequence_number;
219                   h->sequence_number = clib_host_to_net_u32 (h->sequence_number);
220
221                   next_offset = (u32) (((u8 *)(s+1)) - (u8 *)tp);
222                   records_this_buffer = 0;
223                 }
224               
225               field_index = 0;
226               match = (ip4_header_t *) (((u8 *)v->key) - 2);
227               ip = match;
228               udp = (udp_header_t * )(ip+1);
229               
230 #define _(field,mask,item,length)                                       \
231               if (clib_bitmap_get (fr->fields_to_send, field_index))    \
232                 {                                                       \
233                   clib_memcpy (b0->data + next_offset, &field,          \
234                           length);                                      \
235                   next_offset += length;                                \
236                 }                                                       \
237               field_index++;
238               foreach_ipfix_field;
239 #undef _
240               
241               /* Add packetTotalCount manually */
242               {
243                 u64 packets = clib_host_to_net_u64 (v->hits);
244                 clib_memcpy (b0->data + next_offset, &packets, sizeof (packets));
245                 next_offset += sizeof (packets);
246               }
247               records_this_buffer++;
248               fr->sequence_number++;
249               
250               if (next_offset > 1450)
251                 {
252                   s->set_id_length = ipfix_set_id_length (256 /* template ID*/, 
253                                                           next_offset - 
254                                                           (sizeof (*ip) + sizeof (*udp) +
255                                                            sizeof (*h)));
256                   h->version_length = version_length (next_offset -
257                                                       (sizeof (*ip) + sizeof (*udp)));
258                   b0->current_length = next_offset;
259                   b0->flags |= VLIB_BUFFER_TOTAL_LENGTH_VALID;
260                   
261                   tp = vlib_buffer_get_current (b0);
262                   ip = (ip4_header_t *) &tp->ip4;
263                   udp = (udp_header_t *) (ip+1);
264                   
265                   sum0 = ip->checksum;
266                   old_l0 = ip->length;
267                   new_l0 = 
268                     clib_host_to_net_u16 ((u16)next_offset);
269                   
270                   sum0 = ip_csum_update (sum0, old_l0, new_l0, ip4_header_t,
271                                          length /* changed member */);
272                   
273                   ip->checksum = ip_csum_fold (sum0);
274                   ip->length = new_l0;
275                   udp->length = 
276                       clib_host_to_net_u16 (b0->current_length - sizeof (*ip));
277                   
278                   ASSERT (ip->checksum == ip4_header_checksum (ip));
279
280                   to_next[0] = bi0;
281                   f->n_vectors++;
282                   to_next++;
283                   
284                   if (f->n_vectors == VLIB_FRAME_SIZE)
285                     {
286                       vlib_put_frame_to_node (vm, node_index, f);
287                       f = vlib_get_frame_to_node (vm, node_index);
288                       f->n_vectors = 0;
289                       to_next = vlib_frame_vector_args (f);
290                     }
291                   b0 = 0;
292                   bi0 = ~0;
293                 }
294             }
295         }
296     }
297   
298  flush:
299   if (b0)
300     {
301         s->set_id_length = ipfix_set_id_length (256 /* template ID*/, 
302                                                 next_offset - 
303                                                 (sizeof (*ip) + sizeof (*udp) +
304                                                  sizeof (*h)));
305         h->version_length = version_length (next_offset -
306                                             (sizeof (*ip) + sizeof (*udp)));
307       b0->current_length = next_offset;
308       b0->flags |= VLIB_BUFFER_TOTAL_LENGTH_VALID;
309       
310       tp = vlib_buffer_get_current (b0);
311       ip = (ip4_header_t *) &tp->ip4;
312       udp = (udp_header_t *) (ip+1);
313       
314       sum0 = ip->checksum;
315       old_l0 = ip->length;
316       new_l0 = clib_host_to_net_u16 ((u16)next_offset);
317       
318       sum0 = ip_csum_update (sum0, old_l0, new_l0, ip4_header_t,
319                              length /* changed member */);
320       
321       ip->checksum = ip_csum_fold (sum0);
322       ip->length = new_l0;
323       udp->length = clib_host_to_net_u16 (b0->current_length - sizeof (*ip));
324
325       ASSERT (ip->checksum == ip4_header_checksum (ip));
326       
327       to_next[0] = bi0;
328       f->n_vectors++;
329       
330       b0 = 0;
331       bi0 = ~0;
332     }
333   
334   *(t->writer_lock) = 0;
335   return f;
336 }
337
338
339 static clib_error_t *
340 flow_sample_command_fn (vlib_main_t * vm,
341                  unformat_input_t * input,
342                  vlib_cli_command_t * cmd)
343 {
344   flow_report_sample_main_t *fsm = &flow_report_sample_main;
345   flow_report_main_t *frm = &flow_report_main;
346   vnet_flow_report_add_del_args_t args;
347   int rv;
348   int is_add = 1;
349   u32 domain_id = 0;
350
351   domain_id = 0;
352   fsm->classify_table_index = ~0;
353   memset (&args, 0, sizeof (args));
354
355   while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT) {
356     if (unformat (input, "table %d", &fsm->classify_table_index))
357       ;
358     else if (unformat (input, "domain %d", &domain_id))
359       ;
360     else if (unformat (input, "del"))
361       is_add = 0;
362     else
363       return clib_error_return (0, "unknown input `%U'",
364                                 format_unformat_error, input);
365   }
366
367   if (fsm->classify_table_index == ~0)
368     return clib_error_return (0, "classifier table not specified");
369
370   args.opaque = (void *) fsm;
371   args.rewrite_callback = template_rewrite;
372   args.flow_data_callback = send_flows;
373   args.is_add = is_add;
374   args.domain_id = domain_id;
375
376   rv = vnet_flow_report_add_del (frm, &args);
377
378   switch (rv)
379     {
380     case 0:
381       break;
382     case VNET_API_ERROR_NO_SUCH_ENTRY:
383       return clib_error_return (0, "registration not found...");
384     default:
385       return clib_error_return (0, "vnet_flow_report_add_del returned %d", rv);
386     }
387
388   return 0;
389 }
390
391 VLIB_CLI_COMMAND (flow_sample_command, static) = {
392   .path = "flow sample",
393   .short_help = "flow sample",
394   .function = flow_sample_command_fn,
395 };
396
397 static clib_error_t *
398 flow_report_sample_init (vlib_main_t *vm)
399 {
400   clib_error_t * error;
401
402   if ((error = vlib_call_init_function (vm, flow_report_init)))
403     return error;
404
405   return 0;
406 }
407
408 VLIB_INIT_FUNCTION (flow_report_sample_init);