/* SPDX-License-Identifier: BSD-3-Clause * Copyright(c) 2017 Cavium, Inc */ #ifndef _TEST_PERF_COMMON_ #define _TEST_PERF_COMMON_ #include #include #include #include #include #include #include #include #include #include #include #include "evt_common.h" #include "evt_options.h" #include "evt_test.h" struct test_perf; struct worker_data { uint64_t processed_pkts; uint64_t latency; uint8_t dev_id; uint8_t port_id; struct test_perf *t; } __rte_cache_aligned; struct prod_data { uint8_t dev_id; uint8_t port_id; uint8_t queue_id; struct test_perf *t; } __rte_cache_aligned; struct test_perf { /* Don't change the offset of "done". Signal handler use this memory * to terminate all lcores work. */ int done; uint64_t outstand_pkts; uint8_t nb_workers; enum evt_test_result result; uint32_t nb_flows; uint64_t nb_pkts; struct rte_mempool *pool; struct prod_data prod[EVT_MAX_PORTS]; struct worker_data worker[EVT_MAX_PORTS]; struct evt_options *opt; uint8_t sched_type_list[EVT_MAX_STAGES] __rte_cache_aligned; } __rte_cache_aligned; struct perf_elt { uint64_t timestamp; } __rte_cache_aligned; #define BURST_SIZE 16 #define PERF_WORKER_INIT\ struct worker_data *w = arg;\ struct test_perf *t = w->t;\ struct evt_options *opt = t->opt;\ const uint8_t dev = w->dev_id;\ const uint8_t port = w->port_id;\ uint8_t *const sched_type_list = &t->sched_type_list[0];\ struct rte_mempool *const pool = t->pool;\ const uint8_t nb_stages = t->opt->nb_stages;\ const uint8_t laststage = nb_stages - 1;\ uint8_t cnt = 0;\ void *bufs[16] __rte_cache_aligned;\ int const sz = RTE_DIM(bufs);\ if (opt->verbose_level > 1)\ printf("%s(): lcore %d dev_id %d port=%d\n", __func__,\ rte_lcore_id(), dev, port) static inline __attribute__((always_inline)) int perf_process_last_stage(struct rte_mempool *const pool, struct rte_event *const ev, struct worker_data *const w, void *bufs[], int const buf_sz, uint8_t count) { bufs[count++] = ev->event_ptr; w->processed_pkts++; rte_smp_wmb(); if (unlikely(count == buf_sz)) { count = 0; rte_mempool_put_bulk(pool, bufs, buf_sz); } return count; } static inline __attribute__((always_inline)) uint8_t perf_process_last_stage_latency(struct rte_mempool *const pool, struct rte_event *const ev, struct worker_data *const w, void *bufs[], int const buf_sz, uint8_t count) { uint64_t latency; struct perf_elt *const m = ev->event_ptr; bufs[count++] = ev->event_ptr; w->processed_pkts++; if (unlikely(count == buf_sz)) { count = 0; latency = rte_get_timer_cycles() - m->timestamp; rte_mempool_put_bulk(pool, bufs, buf_sz); } else { latency = rte_get_timer_cycles() - m->timestamp; } w->latency += latency; rte_smp_wmb(); return count; } static inline int perf_nb_event_ports(struct evt_options *opt) { return evt_nr_active_lcores(opt->wlcores) + evt_nr_active_lcores(opt->plcores); } int perf_test_result(struct evt_test *test, struct evt_options *opt); int perf_opt_check(struct evt_options *opt, uint64_t nb_queues); int perf_test_setup(struct evt_test *test, struct evt_options *opt); int perf_ethdev_setup(struct evt_test *test, struct evt_options *opt); int perf_mempool_setup(struct evt_test *test, struct evt_options *opt); int perf_event_dev_port_setup(struct evt_test *test, struct evt_options *opt, uint8_t stride, uint8_t nb_queues, const struct rte_event_port_conf *port_conf); int perf_event_dev_service_setup(uint8_t dev_id); int perf_launch_lcores(struct evt_test *test, struct evt_options *opt, int (*worker)(void *)); void perf_opt_dump(struct evt_options *opt, uint8_t nb_queues); void perf_test_destroy(struct evt_test *test, struct evt_options *opt); void perf_eventdev_destroy(struct evt_test *test, struct evt_options *opt); void perf_ethdev_destroy(struct evt_test *test, struct evt_options *opt); void perf_mempool_destroy(struct evt_test *test, struct evt_options *opt); #endif /* _TEST_PERF_COMMON_ */