ipsec: compress ipsec_sa_t so data used by dataplane code fits in a cache line
[vpp.git] / src / plugins / dpdk / ipsec / esp_encrypt.c
index 8e94850..25815d9 100644 (file)
@@ -1,7 +1,7 @@
 /*
  * esp_encrypt.c : IPSec ESP encrypt node using DPDK Cryptodev
  *
- * Copyright (c) 2016 Intel and/or its affiliates.
+ * Copyright (c) 2017 Intel and/or its affiliates.
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at:
 #include <vnet/ip/ip.h>
 
 #include <vnet/ipsec/ipsec.h>
+#include <vnet/ipsec/esp.h>
+#include <vnet/udp/udp.h>
+#include <dpdk/buffer.h>
 #include <dpdk/ipsec/ipsec.h>
-#include <dpdk/ipsec/esp.h>
 #include <dpdk/device/dpdk.h>
 #include <dpdk/device/dpdk_priv.h>
 
@@ -41,10 +43,11 @@ typedef enum
 
 #define foreach_esp_encrypt_error                   \
  _(RX_PKTS, "ESP pkts received")                    \
- _(SEQ_CYCLED, "sequence number cycled")            \
- _(ENQ_FAIL, "Enqueue failed (buffer full)")        \
- _(NO_CRYPTODEV, "Cryptodev not configured")        \
- _(UNSUPPORTED, "Cipher/Auth not supported")
+ _(SEQ_CYCLED, "Sequence number cycled")            \
+ _(ENQ_FAIL, "Enqueue failed to crypto device")     \
+ _(DISCARD, "Not enough crypto operations, discarding frame")  \
+ _(SESSION, "Failed to get crypto session")         \
+ _(NOSUP, "Cipher/Auth not supported")
 
 
 typedef enum
@@ -61,14 +64,14 @@ static char *esp_encrypt_error_strings[] = {
 #undef _
 };
 
-vlib_node_registration_t dpdk_esp_encrypt_node;
+extern vlib_node_registration_t dpdk_esp4_encrypt_node;
+extern vlib_node_registration_t dpdk_esp6_encrypt_node;
 
 typedef struct
 {
-  u32 spi;
-  u32 seq;
   ipsec_crypto_alg_t crypto_alg;
   ipsec_integ_alg_t integ_alg;
+  u8 packet_data[64];
 } esp_encrypt_trace_t;
 
 /* packet trace format function */
@@ -78,55 +81,69 @@ format_esp_encrypt_trace (u8 * s, va_list * args)
   CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
   CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
   esp_encrypt_trace_t *t = va_arg (*args, esp_encrypt_trace_t *);
+  ip4_header_t *ih4 = (ip4_header_t *) t->packet_data;
+  u32 indent = format_get_indent (s), offset;
 
-  s = format (s, "esp: spi %u seq %u crypto %U integrity %U",
-             t->spi, t->seq,
+  s = format (s, "cipher %U auth %U\n",
              format_ipsec_crypto_alg, t->crypto_alg,
              format_ipsec_integ_alg, t->integ_alg);
+
+  if ((ih4->ip_version_and_header_length & 0xF0) == 0x60)
+    {
+      s = format (s, "%U%U", format_white_space, indent,
+                 format_ip6_header, ih4);
+      offset = sizeof (ip6_header_t);
+    }
+  else
+    {
+      s = format (s, "%U%U", format_white_space, indent,
+                 format_ip4_header, ih4);
+      offset = ip4_header_bytes (ih4);
+    }
+
+  s = format (s, "\n%U%U", format_white_space, indent,
+             format_esp_header, t->packet_data + offset);
+
   return s;
 }
 
-static uword
-dpdk_esp_encrypt_node_fn (vlib_main_t * vm,
-                         vlib_node_runtime_t * node,
-                         vlib_frame_t * from_frame)
+always_inline uword
+dpdk_esp_encrypt_inline (vlib_main_t * vm,
+                        vlib_node_runtime_t * node,
+                        vlib_frame_t * from_frame, int is_ip6)
 {
-  u32 n_left_from, *from, *to_next, next_index;
+  u32 n_left_from, *from, *to_next, next_index, thread_index;
   ipsec_main_t *im = &ipsec_main;
-  u32 thread_index = vlib_get_thread_index ();
+  u32 thread_idx = vlib_get_thread_index ();
   dpdk_crypto_main_t *dcm = &dpdk_crypto_main;
-  dpdk_esp_main_t *em = &dpdk_esp_main;
-  u32 i;
+  crypto_resource_t *res = 0;
+  ipsec_sa_t *sa0 = 0;
+  crypto_alg_t *cipher_alg = 0, *auth_alg = 0;
+  struct rte_cryptodev_sym_session *session = 0;
+  u32 ret, last_sa_index = ~0;
+  u8 numa = rte_socket_id ();
+  u8 is_aead = 0;
+  crypto_worker_main_t *cwm =
+    vec_elt_at_index (dcm->workers_main, thread_idx);
+  struct rte_crypto_op **ops = cwm->ops;
 
   from = vlib_frame_vector_args (from_frame);
   n_left_from = from_frame->n_vectors;
+  thread_index = vm->thread_index;
 
-  if (PREDICT_FALSE (!dcm->workers_main))
+  ret = crypto_alloc_ops (numa, ops, n_left_from);
+  if (ret)
     {
-      /* Likely there are not enough cryptodevs, so drop frame */
-      vlib_node_increment_counter (vm, dpdk_esp_encrypt_node.index,
-                                  ESP_ENCRYPT_ERROR_NO_CRYPTODEV,
-                                  n_left_from);
-      vlib_buffer_free (vm, from, n_left_from);
+      if (is_ip6)
+       vlib_node_increment_counter (vm, dpdk_esp6_encrypt_node.index,
+                                    ESP_ENCRYPT_ERROR_DISCARD, 1);
+      else
+       vlib_node_increment_counter (vm, dpdk_esp4_encrypt_node.index,
+                                    ESP_ENCRYPT_ERROR_DISCARD, 1);
+      /* Discard whole frame */
       return n_left_from;
     }
 
-  crypto_worker_main_t *cwm =
-    vec_elt_at_index (dcm->workers_main, thread_index);
-  u32 n_qps = vec_len (cwm->qp_data);
-  struct rte_crypto_op **cops_to_enq[n_qps];
-  u32 n_cop_qp[n_qps], *bi_to_enq[n_qps];
-
-  for (i = 0; i < n_qps; i++)
-    {
-      bi_to_enq[i] = cwm->qp_data[i].bi;
-      cops_to_enq[i] = cwm->qp_data[i].cops;
-    }
-
-  memset (n_cop_qp, 0, n_qps * sizeof (u32));
-
-  crypto_alloc_cops ();
-
   next_index = ESP_ENCRYPT_NEXT_DROP;
 
   while (n_left_from > 0)
@@ -137,471 +154,470 @@ dpdk_esp_encrypt_node_fn (vlib_main_t * vm,
 
       while (n_left_from > 0 && n_left_to_next > 0)
        {
-         u32 bi0, next0;
+         clib_error_t *error;
+         u32 bi0;
          vlib_buffer_t *b0 = 0;
          u32 sa_index0;
-         ipsec_sa_t *sa0;
          ip4_and_esp_header_t *ih0, *oh0 = 0;
          ip6_and_esp_header_t *ih6_0, *oh6_0 = 0;
-         struct rte_mbuf *mb0 = 0;
+         ip4_and_udp_and_esp_header_t *ouh0 = 0;
+         esp_header_t *esp0;
          esp_footer_t *f0;
-         u8 is_ipv6;
-         u8 ip_hdr_size;
          u8 next_hdr_type;
-         u8 transport_mode = 0;
-         const int BLOCK_SIZE = 16;
          u32 iv_size;
          u16 orig_sz;
-         crypto_sa_session_t *sa_sess;
-         void *sess;
-         struct rte_crypto_op *cop = 0;
-         u16 qp_index;
+         u8 trunc_size;
+         u16 rewrite_len;
+         u16 udp_encap_adv = 0;
+         struct rte_mbuf *mb0 = 0;
+         struct rte_crypto_op *op;
+         u16 res_idx;
 
          bi0 = from[0];
          from += 1;
          n_left_from -= 1;
 
          b0 = vlib_get_buffer (vm, bi0);
+         ih0 = vlib_buffer_get_current (b0);
+         mb0 = rte_mbuf_from_vlib_buffer (b0);
+
+         /* ih0/ih6_0 */
+         CLIB_PREFETCH (ih0, sizeof (ih6_0[0]), LOAD);
+         /* f0 */
+         CLIB_PREFETCH (vlib_buffer_get_tail (b0), 20, STORE);
+         /* mb0 */
+         CLIB_PREFETCH (mb0, CLIB_CACHE_LINE_BYTES, STORE);
+
+         op = ops[0];
+         ops += 1;
+         ASSERT (op->status == RTE_CRYPTO_OP_STATUS_NOT_PROCESSED);
+
+         dpdk_op_priv_t *priv = crypto_op_get_priv (op);
+         /* store bi in op private */
+         priv->bi = bi0;
+
+         u16 op_len =
+           sizeof (op[0]) + sizeof (op[0].sym[0]) + sizeof (priv[0]);
+         CLIB_PREFETCH (op, op_len, STORE);
+
          sa_index0 = vnet_buffer (b0)->ipsec.sad_index;
-         sa0 = pool_elt_at_index (im->sad, sa_index0);
 
-         if (PREDICT_FALSE (esp_seq_advance (sa0)))
+         if (sa_index0 != last_sa_index)
            {
-             clib_warning ("sequence number counter has cycled SPI %u",
-                           sa0->spi);
-             vlib_node_increment_counter (vm, dpdk_esp_encrypt_node.index,
-                                          ESP_ENCRYPT_ERROR_SEQ_CYCLED, 1);
-             //TODO: rekey SA
-             to_next[0] = bi0;
-             to_next += 1;
-             n_left_to_next -= 1;
-             goto trace;
-           }
+             sa0 = pool_elt_at_index (im->sad, sa_index0);
 
-         sa0->total_data_size += b0->current_length;
+             cipher_alg =
+               vec_elt_at_index (dcm->cipher_algs, sa0->crypto_alg);
+             auth_alg = vec_elt_at_index (dcm->auth_algs, sa0->integ_alg);
 
-         sa_sess = pool_elt_at_index (cwm->sa_sess_d[1], sa_index0);
-         if (PREDICT_FALSE (!sa_sess->sess))
-           {
-             int ret = create_sym_sess (sa0, sa_sess, 1);
+             is_aead = (cipher_alg->type == RTE_CRYPTO_SYM_XFORM_AEAD);
+
+             if (is_aead)
+               auth_alg = cipher_alg;
 
-             if (PREDICT_FALSE (ret))
+             res_idx = get_resource (cwm, sa0);
+
+             if (PREDICT_FALSE (res_idx == (u16) ~ 0))
                {
+                 clib_warning ("unsupported SA by thread index %u",
+                               thread_idx);
+                 if (is_ip6)
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp6_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_NOSUP, 1);
+                 else
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp4_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_NOSUP, 1);
                  to_next[0] = bi0;
                  to_next += 1;
                  n_left_to_next -= 1;
                  goto trace;
                }
-           }
-
-         qp_index = sa_sess->qp_index;
-         sess = sa_sess->sess;
+             res = vec_elt_at_index (dcm->resource, res_idx);
 
-         ASSERT (vec_len (vec_elt (cwm->qp_data, qp_index).free_cops) > 0);
-         cop = vec_pop (vec_elt (cwm->qp_data, qp_index).free_cops);
-         ASSERT (cop->status == RTE_CRYPTO_OP_STATUS_NOT_PROCESSED);
-
-         cops_to_enq[qp_index][0] = cop;
-         cops_to_enq[qp_index] += 1;
-         n_cop_qp[qp_index] += 1;
-         bi_to_enq[qp_index][0] = bi0;
-         bi_to_enq[qp_index] += 1;
+             error = crypto_get_session (&session, sa_index0, res, cwm, 1);
+             if (PREDICT_FALSE (error || !session))
+               {
+                 clib_warning ("failed to get crypto session");
+                 if (is_ip6)
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp6_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_SESSION,
+                                                1);
+                 else
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp4_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_SESSION,
+                                                1);
+                 to_next[0] = bi0;
+                 to_next += 1;
+                 n_left_to_next -= 1;
+                 goto trace;
+               }
 
-         ssize_t adv;
-         iv_size = em->esp_crypto_algs[sa0->crypto_alg].iv_len;
-         ih0 = vlib_buffer_get_current (b0);
-         orig_sz = b0->current_length;
-         is_ipv6 = (ih0->ip4.ip_version_and_header_length & 0xF0) == 0x60;
-         /* is ipv6 */
-         if (PREDICT_TRUE (sa0->is_tunnel))
-           {
-             if (PREDICT_TRUE (!is_ipv6))
-               adv = -sizeof (ip4_and_esp_header_t);
-             else
-               adv = -sizeof (ip6_and_esp_header_t);
+             last_sa_index = sa_index0;
            }
-         else
+
+         if (PREDICT_FALSE (esp_seq_advance (sa0)))
            {
-             adv = -sizeof (esp_header_t);
-             if (PREDICT_TRUE (!is_ipv6))
-               orig_sz -= sizeof (ip4_header_t);
+             clib_warning ("sequence number counter has cycled SPI %u",
+                           sa0->spi);
+             if (is_ip6)
+               vlib_node_increment_counter (vm,
+                                            dpdk_esp6_encrypt_node.index,
+                                            ESP_ENCRYPT_ERROR_SEQ_CYCLED, 1);
              else
-               orig_sz -= sizeof (ip6_header_t);
+               vlib_node_increment_counter (vm,
+                                            dpdk_esp4_encrypt_node.index,
+                                            ESP_ENCRYPT_ERROR_SEQ_CYCLED, 1);
+             //TODO: rekey SA
+             to_next[0] = bi0;
+             to_next += 1;
+             n_left_to_next -= 1;
+             goto trace;
            }
 
-         /*transport mode save the eth header before it is overwritten */
-         if (PREDICT_FALSE (!sa0->is_tunnel))
-           {
-             ethernet_header_t *ieh0 = (ethernet_header_t *)
-               ((u8 *) vlib_buffer_get_current (b0) -
-                sizeof (ethernet_header_t));
-             ethernet_header_t *oeh0 =
-               (ethernet_header_t *) ((u8 *) ieh0 + (adv - iv_size));
-             clib_memcpy (oeh0, ieh0, sizeof (ethernet_header_t));
-           }
+         orig_sz = b0->current_length;
 
-         vlib_buffer_advance (b0, adv - iv_size);
+         /* TODO multi-seg support - total_length_not_including_first_buffer */
+         vlib_increment_combined_counter
+           (&ipsec_sa_counters, thread_index, sa_index0,
+            1, b0->current_length);
 
-         /* XXX IP6/ip4 and IP4/IP6 not supported, only IP4/IP4 and IP6/IP6 */
+         res->ops[res->n_ops] = op;
+         res->bi[res->n_ops] = bi0;
+         res->n_ops += 1;
 
-         /* is ipv6 */
-         if (PREDICT_FALSE (is_ipv6))
-           {
-             ih6_0 = (ip6_and_esp_header_t *) ih0;
-             ip_hdr_size = sizeof (ip6_header_t);
-             oh6_0 = vlib_buffer_get_current (b0);
+         dpdk_gcm_cnt_blk *icb = &priv->cb;
 
-             if (PREDICT_TRUE (sa0->is_tunnel))
+         crypto_set_icb (icb, sa0->salt, sa0->seq, sa0->seq_hi);
+
+         iv_size = cipher_alg->iv_len;
+         trunc_size = auth_alg->trunc_size;
+
+         /* if UDP encapsulation is used adjust the address of the IP header */
+         if (ipsec_sa_is_set_UDP_ENCAP (sa0) && !is_ip6)
+           udp_encap_adv = sizeof (udp_header_t);
+
+         if (ipsec_sa_is_set_IS_TUNNEL (sa0))
+           {
+             rewrite_len = 0;
+             if (!is_ip6 && !ipsec_sa_is_set_IS_TUNNEL_V6 (sa0))       /* ip4inip4 */
+               {
+                 /* in tunnel mode send it back to FIB */
+                 priv->next = DPDK_CRYPTO_INPUT_NEXT_IP4_LOOKUP;
+                 u8 adv = sizeof (ip4_header_t) + udp_encap_adv +
+                   sizeof (esp_header_t) + iv_size;
+                 vlib_buffer_advance (b0, -adv);
+                 oh0 = vlib_buffer_get_current (b0);
+                 ouh0 = vlib_buffer_get_current (b0);
+                 next_hdr_type = IP_PROTOCOL_IP_IN_IP;
+                 /*
+                  * oh0->ip4.ip_version_and_header_length = 0x45;
+                  * oh0->ip4.tos = ih0->ip4.tos;
+                  * oh0->ip4.fragment_id = 0;
+                  * oh0->ip4.flags_and_fragment_offset = 0;
+                  */
+                 oh0->ip4.checksum_data_64[0] =
+                   clib_host_to_net_u64 (0x45ULL << 56);
+                 /*
+                  * oh0->ip4.ttl = 254;
+                  * oh0->ip4.protocol = IP_PROTOCOL_IPSEC_ESP;
+                  */
+                 oh0->ip4.checksum_data_32[2] =
+                   clib_host_to_net_u32 (0xfe320000);
+
+                 oh0->ip4.src_address.as_u32 =
+                   sa0->tunnel_src_addr.ip4.as_u32;
+                 oh0->ip4.dst_address.as_u32 =
+                   sa0->tunnel_dst_addr.ip4.as_u32;
+
+                 if (ipsec_sa_is_set_UDP_ENCAP (sa0))
+                   {
+                     oh0->ip4.protocol = IP_PROTOCOL_UDP;
+                     esp0 = &ouh0->esp;
+                   }
+                 else
+                   esp0 = &oh0->esp;
+                 esp0->spi = clib_host_to_net_u32 (sa0->spi);
+                 esp0->seq = clib_host_to_net_u32 (sa0->seq);
+               }
+             else if (is_ip6 && ipsec_sa_is_set_IS_TUNNEL_V6 (sa0))
                {
+                 /* ip6inip6 */
+                 /* in tunnel mode send it back to FIB */
+                 priv->next = DPDK_CRYPTO_INPUT_NEXT_IP6_LOOKUP;
+
+                 u8 adv =
+                   sizeof (ip6_header_t) + sizeof (esp_header_t) + iv_size;
+                 vlib_buffer_advance (b0, -adv);
+                 ih6_0 = (ip6_and_esp_header_t *) ih0;
+                 oh6_0 = vlib_buffer_get_current (b0);
+
                  next_hdr_type = IP_PROTOCOL_IPV6;
+
                  oh6_0->ip6.ip_version_traffic_class_and_flow_label =
                    ih6_0->ip6.ip_version_traffic_class_and_flow_label;
+
+                 oh6_0->ip6.protocol = IP_PROTOCOL_IPSEC_ESP;
+                 oh6_0->ip6.hop_limit = 254;
+                 oh6_0->ip6.src_address.as_u64[0] =
+                   sa0->tunnel_src_addr.ip6.as_u64[0];
+                 oh6_0->ip6.src_address.as_u64[1] =
+                   sa0->tunnel_src_addr.ip6.as_u64[1];
+                 oh6_0->ip6.dst_address.as_u64[0] =
+                   sa0->tunnel_dst_addr.ip6.as_u64[0];
+                 oh6_0->ip6.dst_address.as_u64[1] =
+                   sa0->tunnel_dst_addr.ip6.as_u64[1];
+                 esp0 = &oh6_0->esp;
+                 oh6_0->esp.spi = clib_host_to_net_u32 (sa0->spi);
+                 oh6_0->esp.seq = clib_host_to_net_u32 (sa0->seq);
                }
-             else
+             else              /* unsupported ip4inip6, ip6inip4 */
                {
-                 next_hdr_type = ih6_0->ip6.protocol;
-                 memmove (oh6_0, ih6_0, sizeof (ip6_header_t));
+                 if (is_ip6)
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp6_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_NOSUP, 1);
+                 else
+                   vlib_node_increment_counter (vm,
+                                                dpdk_esp4_encrypt_node.index,
+                                                ESP_ENCRYPT_ERROR_NOSUP, 1);
+                 to_next[0] = bi0;
+                 to_next += 1;
+                 n_left_to_next -= 1;
+                 goto trace;
                }
-
-             oh6_0->ip6.protocol = IP_PROTOCOL_IPSEC_ESP;
-             oh6_0->ip6.hop_limit = 254;
-             oh6_0->esp.spi = clib_net_to_host_u32 (sa0->spi);
-             oh6_0->esp.seq = clib_net_to_host_u32 (sa0->seq);
+             vnet_buffer (b0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
            }
-         else
+         else                  /* transport mode */
            {
-             ip_hdr_size = sizeof (ip4_header_t);
-             oh0 = vlib_buffer_get_current (b0);
-
-             if (PREDICT_TRUE (sa0->is_tunnel))
+             priv->next = DPDK_CRYPTO_INPUT_NEXT_INTERFACE_OUTPUT;
+             rewrite_len = vnet_buffer (b0)->ip.save_rewrite_length;
+             u16 adv = sizeof (esp_header_t) + iv_size + udp_encap_adv;
+             vlib_buffer_advance (b0, -adv - rewrite_len);
+             u8 *src = ((u8 *) ih0) - rewrite_len;
+             u8 *dst = vlib_buffer_get_current (b0);
+             oh0 = vlib_buffer_get_current (b0) + rewrite_len;
+
+             if (is_ip6)
                {
-                 next_hdr_type = IP_PROTOCOL_IP_IN_IP;
-                 oh0->ip4.tos = ih0->ip4.tos;
+                 orig_sz -= sizeof (ip6_header_t);
+                 ih6_0 = (ip6_and_esp_header_t *) ih0;
+                 next_hdr_type = ih6_0->ip6.protocol;
+                 memmove (dst, src, rewrite_len + sizeof (ip6_header_t));
+                 oh6_0 = (ip6_and_esp_header_t *) oh0;
+                 oh6_0->ip6.protocol = IP_PROTOCOL_IPSEC_ESP;
+                 esp0 = &oh6_0->esp;
                }
-             else
+             else              /* ipv4 */
                {
+                 u16 ip_size = ip4_header_bytes (&ih0->ip4);
+                 orig_sz -= ip_size;
                  next_hdr_type = ih0->ip4.protocol;
-                 memmove (oh0, ih0, sizeof (ip4_header_t));
+                 memmove (dst, src, rewrite_len + ip_size);
+                 oh0->ip4.protocol = IP_PROTOCOL_IPSEC_ESP;
+                 esp0 = (esp_header_t *) (((u8 *) oh0) + ip_size);
+                 if (ipsec_sa_is_set_UDP_ENCAP (sa0))
+                   {
+                     oh0->ip4.protocol = IP_PROTOCOL_UDP;
+                     esp0 = (esp_header_t *)
+                       (((u8 *) oh0) + ip_size + udp_encap_adv);
+                   }
+                 else
+                   {
+                     oh0->ip4.protocol = IP_PROTOCOL_IPSEC_ESP;
+                     esp0 = (esp_header_t *) (((u8 *) oh0) + ip_size);
+                   }
                }
-
-             oh0->ip4.ip_version_and_header_length = 0x45;
-             oh0->ip4.fragment_id = 0;
-             oh0->ip4.flags_and_fragment_offset = 0;
-             oh0->ip4.ttl = 254;
-             oh0->ip4.protocol = IP_PROTOCOL_IPSEC_ESP;
-             oh0->esp.spi = clib_net_to_host_u32 (sa0->spi);
-             oh0->esp.seq = clib_net_to_host_u32 (sa0->seq);
+             esp0->spi = clib_host_to_net_u32 (sa0->spi);
+             esp0->seq = clib_host_to_net_u32 (sa0->seq);
            }
 
-         if (PREDICT_TRUE
-             (!is_ipv6 && sa0->is_tunnel && !sa0->is_tunnel_ip6))
-           {
-             oh0->ip4.src_address.as_u32 = sa0->tunnel_src_addr.ip4.as_u32;
-             oh0->ip4.dst_address.as_u32 = sa0->tunnel_dst_addr.ip4.as_u32;
-
-             /* in tunnel mode send it back to FIB */
-             next0 = ESP_ENCRYPT_NEXT_IP4_LOOKUP;
-             vnet_buffer (b0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
-           }
-         else if (is_ipv6 && sa0->is_tunnel && sa0->is_tunnel_ip6)
-           {
-             oh6_0->ip6.src_address.as_u64[0] =
-               sa0->tunnel_src_addr.ip6.as_u64[0];
-             oh6_0->ip6.src_address.as_u64[1] =
-               sa0->tunnel_src_addr.ip6.as_u64[1];
-             oh6_0->ip6.dst_address.as_u64[0] =
-               sa0->tunnel_dst_addr.ip6.as_u64[0];
-             oh6_0->ip6.dst_address.as_u64[1] =
-               sa0->tunnel_dst_addr.ip6.as_u64[1];
-
-             /* in tunnel mode send it back to FIB */
-             next0 = ESP_ENCRYPT_NEXT_IP6_LOOKUP;
-             vnet_buffer (b0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
-           }
-         else
+         if (ipsec_sa_is_set_UDP_ENCAP (sa0) && ouh0)
            {
-             next0 = ESP_ENCRYPT_NEXT_INTERFACE_OUTPUT;
-             transport_mode = 1;
+             ouh0->udp.src_port = clib_host_to_net_u16 (UDP_DST_PORT_ipsec);
+             ouh0->udp.dst_port = clib_host_to_net_u16 (UDP_DST_PORT_ipsec);
+             ouh0->udp.checksum = 0;
            }
+         ASSERT (is_pow2 (cipher_alg->boundary));
+         u16 mask = cipher_alg->boundary - 1;
+         u16 pad_payload_len = ((orig_sz + 2) + mask) & ~mask;
+         u8 pad_bytes = pad_payload_len - 2 - orig_sz;
 
-         ASSERT (sa0->crypto_alg < IPSEC_CRYPTO_N_ALG);
-         ASSERT (sa0->crypto_alg != IPSEC_CRYPTO_ALG_NONE);
-
-         int blocks = 1 + (orig_sz + 1) / BLOCK_SIZE;
+         u8 *padding =
+           vlib_buffer_put_uninit (b0, pad_bytes + 2 + trunc_size);
 
-         /* pad packet in input buffer */
-         u8 pad_bytes = BLOCK_SIZE * blocks - 2 - orig_sz;
-         u8 i;
-         u8 *padding = vlib_buffer_get_current (b0) + b0->current_length;
+         /* The extra pad bytes would be overwritten by the digest */
+         if (pad_bytes)
+           clib_memcpy_fast (padding, pad_data, 16);
 
-         for (i = 0; i < pad_bytes; ++i)
-           padding[i] = i + 1;
-
-         f0 = vlib_buffer_get_current (b0) + b0->current_length + pad_bytes;
+         f0 = (esp_footer_t *) (padding + pad_bytes);
          f0->pad_length = pad_bytes;
          f0->next_header = next_hdr_type;
-         b0->current_length += pad_bytes + 2 +
-           em->esp_integ_algs[sa0->integ_alg].trunc_size;
-
-         vnet_buffer (b0)->sw_if_index[VLIB_RX] =
-           vnet_buffer (b0)->sw_if_index[VLIB_RX];
-         b0->flags |= VLIB_BUFFER_TOTAL_LENGTH_VALID;
-
-         struct rte_crypto_sym_op *sym_cop;
-         sym_cop = (struct rte_crypto_sym_op *) (cop + 1);
-
-         dpdk_cop_priv_t *priv = (dpdk_cop_priv_t *) (sym_cop + 1);
-
-         vnet_buffer (b0)->unused[0] = next0;
 
-         mb0 = rte_mbuf_from_vlib_buffer (b0);
-         mb0->data_len = b0->current_length;
-         mb0->pkt_len = b0->current_length;
-         mb0->data_off = RTE_PKTMBUF_HEADROOM + b0->current_data;
-
-         rte_crypto_op_attach_sym_session (cop, sess);
-
-         sym_cop->m_src = mb0;
-
-         dpdk_gcm_cnt_blk *icb = &priv->cb;
-         icb->salt = sa0->salt;
-         icb->iv[0] = sa0->seq;
-         icb->iv[1] = sa0->seq_hi;
-
-         if (sa0->crypto_alg == IPSEC_CRYPTO_ALG_AES_GCM_128)
+         if (is_ip6)
            {
-             icb->cnt = clib_host_to_net_u32 (1);
-             clib_memcpy (vlib_buffer_get_current (b0) + ip_hdr_size +
-                          sizeof (esp_header_t), icb->iv, 8);
-             sym_cop->cipher.data.offset =
-               ip_hdr_size + sizeof (esp_header_t) + iv_size;
-             sym_cop->cipher.data.length = BLOCK_SIZE * blocks;
-             sym_cop->cipher.iv.length = 16;
+             u16 len = b0->current_length - sizeof (ip6_header_t);
+             oh6_0->ip6.payload_length =
+               clib_host_to_net_u16 (len - rewrite_len);
            }
          else
            {
-             sym_cop->cipher.data.offset =
-               ip_hdr_size + sizeof (esp_header_t);
-             sym_cop->cipher.data.length = BLOCK_SIZE * blocks + iv_size;
-             sym_cop->cipher.iv.length = iv_size;
+             oh0->ip4.length =
+               clib_host_to_net_u16 (b0->current_length - rewrite_len);
+             oh0->ip4.checksum = ip4_header_checksum (&oh0->ip4);
+             if (ipsec_sa_is_set_UDP_ENCAP (sa0) && ouh0)
+               {
+                 ouh0->udp.length =
+                   clib_host_to_net_u16 (clib_net_to_host_u16
+                                         (ouh0->ip4.length) -
+                                         ip4_header_bytes (&ouh0->ip4));
+               }
            }
 
-         sym_cop->cipher.iv.data = (u8 *) icb;
-         sym_cop->cipher.iv.phys_addr = cop->phys_addr + (uintptr_t) icb
-           - (uintptr_t) cop;
+         b0->flags |= VLIB_BUFFER_TOTAL_LENGTH_VALID;
+
+         /* mbuf packet starts at ESP header */
+         mb0->data_len = vlib_buffer_get_tail (b0) - ((u8 *) esp0);
+         mb0->pkt_len = vlib_buffer_get_tail (b0) - ((u8 *) esp0);
+         mb0->data_off = ((void *) esp0) - mb0->buf_addr;
 
+         u32 cipher_off, cipher_len, auth_len = 0;
+         u32 *aad = NULL;
 
-         ASSERT (sa0->integ_alg < IPSEC_INTEG_N_ALG);
-         ASSERT (sa0->integ_alg != IPSEC_INTEG_ALG_NONE);
+         u8 *digest = vlib_buffer_get_tail (b0) - trunc_size;
+         u64 digest_paddr =
+           mb0->buf_physaddr + digest - ((u8 *) mb0->buf_addr);
 
-         if (PREDICT_FALSE (sa0->integ_alg == IPSEC_INTEG_ALG_AES_GCM_128))
+         if (!is_aead && cipher_alg->alg == RTE_CRYPTO_CIPHER_AES_CBC)
            {
-             u8 *aad = priv->aad;
-             clib_memcpy (aad, vlib_buffer_get_current (b0) + ip_hdr_size,
-                          8);
-             sym_cop->auth.aad.data = aad;
-             sym_cop->auth.aad.phys_addr = cop->phys_addr +
-               (uintptr_t) aad - (uintptr_t) cop;
-
-             if (PREDICT_FALSE (sa0->use_esn))
-               {
-                 *((u32 *) & aad[8]) = sa0->seq_hi;
-                 sym_cop->auth.aad.length = 12;
-               }
-             else
-               {
-                 sym_cop->auth.aad.length = 8;
-               }
+             cipher_off = sizeof (esp_header_t);
+             cipher_len = iv_size + pad_payload_len;
            }
-         else
+         else                  /* CTR/GCM */
            {
-             sym_cop->auth.data.offset = ip_hdr_size;
-             sym_cop->auth.data.length = b0->current_length - ip_hdr_size
-               - em->esp_integ_algs[sa0->integ_alg].trunc_size;
+             u32 *esp_iv = (u32 *) (esp0 + 1);
+             esp_iv[0] = sa0->seq;
+             esp_iv[1] = sa0->seq_hi;
 
-             if (PREDICT_FALSE (sa0->use_esn))
-               {
-                 u8 *payload_end =
-                   vlib_buffer_get_current (b0) + b0->current_length;
-                 *((u32 *) payload_end) = sa0->seq_hi;
-                 sym_cop->auth.data.length += sizeof (sa0->seq_hi);
-               }
+             cipher_off = sizeof (esp_header_t) + iv_size;
+             cipher_len = pad_payload_len;
            }
-         sym_cop->auth.digest.data = vlib_buffer_get_current (b0) +
-           b0->current_length -
-           em->esp_integ_algs[sa0->integ_alg].trunc_size;
-         sym_cop->auth.digest.phys_addr = rte_pktmbuf_mtophys_offset (mb0,
-                                                                      b0->current_length
-                                                                      -
-                                                                      em->esp_integ_algs
-                                                                      [sa0->integ_alg].trunc_size);
-         sym_cop->auth.digest.length =
-           em->esp_integ_algs[sa0->integ_alg].trunc_size;
-
-
-         if (PREDICT_FALSE (is_ipv6))
+
+         if (is_aead)
            {
-             oh6_0->ip6.payload_length =
-               clib_host_to_net_u16 (vlib_buffer_length_in_chain (vm, b0) -
-                                     sizeof (ip6_header_t));
+             aad = (u32 *) priv->aad;
+             aad[0] = clib_host_to_net_u32 (sa0->spi);
+             aad[1] = clib_host_to_net_u32 (sa0->seq);
+
+             /* aad[3] should always be 0 */
+             if (PREDICT_FALSE (ipsec_sa_is_set_USE_EXTENDED_SEQ_NUM (sa0)))
+               aad[2] = clib_host_to_net_u32 (sa0->seq_hi);
+             else
+               aad[2] = 0;
            }
          else
            {
-             oh0->ip4.length =
-               clib_host_to_net_u16 (vlib_buffer_length_in_chain (vm, b0));
-             oh0->ip4.checksum = ip4_header_checksum (&oh0->ip4);
+             auth_len =
+               vlib_buffer_get_tail (b0) - ((u8 *) esp0) - trunc_size;
+             if (ipsec_sa_is_set_USE_EXTENDED_SEQ_NUM (sa0))
+               {
+                 u32 *_digest = (u32 *) digest;
+                 _digest[0] = clib_host_to_net_u32 (sa0->seq_hi);
+                 auth_len += 4;
+               }
            }
 
-         if (transport_mode)
-           vlib_buffer_advance (b0, -sizeof (ethernet_header_t));
+         crypto_op_setup (is_aead, mb0, op, session, cipher_off, cipher_len,
+                          0, auth_len, (u8 *) aad, digest, digest_paddr);
 
        trace:
          if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED))
            {
              esp_encrypt_trace_t *tr =
                vlib_add_trace (vm, node, b0, sizeof (*tr));
-             tr->spi = sa0->spi;
-             tr->seq = sa0->seq - 1;
              tr->crypto_alg = sa0->crypto_alg;
              tr->integ_alg = sa0->integ_alg;
+             u8 *p = vlib_buffer_get_current (b0);
+             if (!ipsec_sa_is_set_IS_TUNNEL (sa0))
+               p += vnet_buffer (b0)->ip.save_rewrite_length;
+             clib_memcpy_fast (tr->packet_data, p, sizeof (tr->packet_data));
            }
        }
       vlib_put_next_frame (vm, node, next_index, n_left_to_next);
     }
-  vlib_node_increment_counter (vm, dpdk_esp_encrypt_node.index,
-                              ESP_ENCRYPT_ERROR_RX_PKTS,
-                              from_frame->n_vectors);
-  crypto_qp_data_t *qpd;
-  /* *INDENT-OFF* */
-  vec_foreach_index (i, cwm->qp_data)
+  if (is_ip6)
     {
-      u32 enq;
+      vlib_node_increment_counter (vm, dpdk_esp6_encrypt_node.index,
+                                  ESP_ENCRYPT_ERROR_RX_PKTS,
+                                  from_frame->n_vectors);
 
-      qpd = vec_elt_at_index(cwm->qp_data, i);
-      enq = rte_cryptodev_enqueue_burst(qpd->dev_id, qpd->qp_id,
-                                       qpd->cops, n_cop_qp[i]);
-      qpd->inflights += enq;
-
-      if (PREDICT_FALSE(enq < n_cop_qp[i]))
-       {
-         crypto_free_cop (qpd, &qpd->cops[enq], n_cop_qp[i] - enq);
-         vlib_buffer_free (vm, &qpd->bi[enq], n_cop_qp[i] - enq);
+      crypto_enqueue_ops (vm, cwm, dpdk_esp6_encrypt_node.index,
+                         ESP_ENCRYPT_ERROR_ENQ_FAIL, numa);
+    }
+  else
+    {
+      vlib_node_increment_counter (vm, dpdk_esp4_encrypt_node.index,
+                                  ESP_ENCRYPT_ERROR_RX_PKTS,
+                                  from_frame->n_vectors);
 
-          vlib_node_increment_counter (vm, dpdk_esp_encrypt_node.index,
-                                      ESP_ENCRYPT_ERROR_ENQ_FAIL,
-                                      n_cop_qp[i] - enq);
-        }
+      crypto_enqueue_ops (vm, cwm, dpdk_esp4_encrypt_node.index,
+                         ESP_ENCRYPT_ERROR_ENQ_FAIL, numa);
     }
-  /* *INDENT-ON* */
+
+  crypto_free_ops (numa, ops, cwm->ops + from_frame->n_vectors - ops);
 
   return from_frame->n_vectors;
 }
 
-VLIB_REGISTER_NODE (dpdk_esp_encrypt_node) =
+VLIB_NODE_FN (dpdk_esp4_encrypt_node) (vlib_main_t * vm,
+                                      vlib_node_runtime_t * node,
+                                      vlib_frame_t * from_frame)
 {
-  .function = dpdk_esp_encrypt_node_fn,.name = "dpdk-esp-encrypt",.flags =
-    VLIB_NODE_FLAG_IS_OUTPUT,.vector_size = sizeof (u32),.format_trace =
-    format_esp_encrypt_trace,.n_errors =
-    ARRAY_LEN (esp_encrypt_error_strings),.error_strings =
-    esp_encrypt_error_strings,.n_next_nodes = 1,.next_nodes =
-  {
-  [ESP_ENCRYPT_NEXT_DROP] = "error-drop",}
-};
-
-VLIB_NODE_FUNCTION_MULTIARCH (dpdk_esp_encrypt_node, dpdk_esp_encrypt_node_fn)
-/*
- * ESP Encrypt Post Node
- */
-#define foreach_esp_encrypt_post_error              \
- _(PKTS, "ESP post pkts")
-     typedef enum
-     {
-#define _(sym,str) ESP_ENCRYPT_POST_ERROR_##sym,
-       foreach_esp_encrypt_post_error
-#undef _
-        ESP_ENCRYPT_POST_N_ERROR,
-     } esp_encrypt_post_error_t;
-
-     static char *esp_encrypt_post_error_strings[] = {
-#define _(sym,string) string,
-       foreach_esp_encrypt_post_error
-#undef _
-     };
-
-vlib_node_registration_t dpdk_esp_encrypt_post_node;
-
-static u8 *
-format_esp_encrypt_post_trace (u8 * s, va_list * args)
-{
-  return s;
+  return dpdk_esp_encrypt_inline (vm, node, from_frame, 0 /*is_ip6 */ );
 }
 
-static uword
-dpdk_esp_encrypt_post_node_fn (vlib_main_t * vm,
-                              vlib_node_runtime_t * node,
-                              vlib_frame_t * from_frame)
-{
-  u32 n_left_from, *from, *to_next = 0, next_index;
-
-  from = vlib_frame_vector_args (from_frame);
-  n_left_from = from_frame->n_vectors;
-
-  next_index = node->cached_next_index;
-
-  while (n_left_from > 0)
+/* *INDENT-OFF* */
+VLIB_REGISTER_NODE (dpdk_esp4_encrypt_node) = {
+  .name = "dpdk-esp4-encrypt",
+  .flags = VLIB_NODE_FLAG_IS_OUTPUT,
+  .vector_size = sizeof (u32),
+  .format_trace = format_esp_encrypt_trace,
+  .n_errors = ARRAY_LEN (esp_encrypt_error_strings),
+  .error_strings = esp_encrypt_error_strings,
+  .n_next_nodes = 1,
+  .next_nodes =
     {
-      u32 n_left_to_next;
-
-      vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
-
-      while (n_left_from > 0 && n_left_to_next > 0)
-       {
-         u32 bi0, next0;
-         vlib_buffer_t *b0 = 0;
-
-         bi0 = from[0];
-         from += 1;
-         n_left_from -= 1;
-         n_left_to_next -= 1;
-
-         b0 = vlib_get_buffer (vm, bi0);
-
-         to_next[0] = bi0;
-         to_next += 1;
-
-         next0 = vnet_buffer (b0)->unused[0];
-
-         vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
-                                          to_next, n_left_to_next, bi0,
-                                          next0);
-       }
-      vlib_put_next_frame (vm, node, next_index, n_left_to_next);
+      [ESP_ENCRYPT_NEXT_DROP] = "error-drop",
     }
+};
+/* *INDENT-ON* */
 
-  vlib_node_increment_counter (vm, dpdk_esp_encrypt_post_node.index,
-                              ESP_ENCRYPT_POST_ERROR_PKTS,
-                              from_frame->n_vectors);
-
-  return from_frame->n_vectors;
+VLIB_NODE_FN (dpdk_esp6_encrypt_node) (vlib_main_t * vm,
+                                      vlib_node_runtime_t * node,
+                                      vlib_frame_t * from_frame)
+{
+  return dpdk_esp_encrypt_inline (vm, node, from_frame, 1 /*is_ip6 */ );
 }
 
-VLIB_REGISTER_NODE (dpdk_esp_encrypt_post_node) =
-{
-  .function = dpdk_esp_encrypt_post_node_fn,.name =
-    "dpdk-esp-encrypt-post",.vector_size = sizeof (u32),.format_trace =
-    format_esp_encrypt_post_trace,.type = VLIB_NODE_TYPE_INTERNAL,.n_errors =
-    ARRAY_LEN (esp_encrypt_post_error_strings),.error_strings =
-    esp_encrypt_post_error_strings,.n_next_nodes =
-    ESP_ENCRYPT_N_NEXT,.next_nodes =
-  {
-#define _(s,n) [ESP_ENCRYPT_NEXT_##s] = n,
-    foreach_esp_encrypt_next
-#undef _
-  }
+/* *INDENT-OFF* */
+VLIB_REGISTER_NODE (dpdk_esp6_encrypt_node) = {
+  .name = "dpdk-esp6-encrypt",
+  .flags = VLIB_NODE_FLAG_IS_OUTPUT,
+  .vector_size = sizeof (u32),
+  .format_trace = format_esp_encrypt_trace,
+  .n_errors = ARRAY_LEN (esp_encrypt_error_strings),
+  .error_strings = esp_encrypt_error_strings,
+  .n_next_nodes = 1,
+  .next_nodes =
+    {
+      [ESP_ENCRYPT_NEXT_DROP] = "error-drop",
+    }
 };
+/* *INDENT-ON* */
 
-VLIB_NODE_FUNCTION_MULTIARCH (dpdk_esp_encrypt_post_node,
-                             dpdk_esp_encrypt_post_node_fn)
 /*
  * fd.io coding-style-patch-verification: ON
  *