/* SPDX-License-Identifier: BSD-3-Clause
 * Copyright(c) 2017 Cavium, Inc
 */
42bfe3f2eSlogwang
52bfe3f2eSlogwang #ifndef _TEST_PERF_COMMON_
62bfe3f2eSlogwang #define _TEST_PERF_COMMON_
72bfe3f2eSlogwang
82bfe3f2eSlogwang #include <stdio.h>
92bfe3f2eSlogwang #include <stdbool.h>
102bfe3f2eSlogwang #include <unistd.h>
112bfe3f2eSlogwang
122bfe3f2eSlogwang #include <rte_cycles.h>
13d30ea906Sjfb8856606 #include <rte_ethdev.h>
142bfe3f2eSlogwang #include <rte_eventdev.h>
15d30ea906Sjfb8856606 #include <rte_event_eth_rx_adapter.h>
16d30ea906Sjfb8856606 #include <rte_event_timer_adapter.h>
172bfe3f2eSlogwang #include <rte_lcore.h>
182bfe3f2eSlogwang #include <rte_malloc.h>
192bfe3f2eSlogwang #include <rte_mempool.h>
202bfe3f2eSlogwang #include <rte_prefetch.h>
212bfe3f2eSlogwang
222bfe3f2eSlogwang #include "evt_common.h"
232bfe3f2eSlogwang #include "evt_options.h"
242bfe3f2eSlogwang #include "evt_test.h"
252bfe3f2eSlogwang
262bfe3f2eSlogwang struct test_perf;
272bfe3f2eSlogwang
/* Per-worker state; PERF_WORKER_INIT receives a pointer to one of these. */
struct worker_data {
	/* Incremented once per event by the perf_process_last_stage*() helpers. */
	uint64_t processed_pkts;
	/* Running sum of timer-cycle deltas added by
	 * perf_process_last_stage_latency().
	 */
	uint64_t latency;
	/* Read by PERF_WORKER_INIT into the locals "dev" and "port". */
	uint8_t dev_id;
	uint8_t port_id;
	/* Back pointer to the owning test context. */
	struct test_perf *t;
} __rte_cache_aligned;
352bfe3f2eSlogwang
/* Per-producer state.
 * NOTE(review): the fields are not used in this header; presumably they name
 * the event device, port and queue a producer works on - confirm against the
 * producer code.
 */
struct prod_data {
	uint8_t dev_id;
	uint8_t port_id;
	uint8_t queue_id;
	/* Back pointer to the owning test context. */
	struct test_perf *t;
} __rte_cache_aligned;
422bfe3f2eSlogwang
43d30ea906Sjfb8856606
442bfe3f2eSlogwang struct test_perf {
452bfe3f2eSlogwang /* Don't change the offset of "done". Signal handler use this memory
462bfe3f2eSlogwang * to terminate all lcores work.
472bfe3f2eSlogwang */
482bfe3f2eSlogwang int done;
492bfe3f2eSlogwang uint64_t outstand_pkts;
502bfe3f2eSlogwang uint8_t nb_workers;
512bfe3f2eSlogwang enum evt_test_result result;
522bfe3f2eSlogwang uint32_t nb_flows;
532bfe3f2eSlogwang uint64_t nb_pkts;
542bfe3f2eSlogwang struct rte_mempool *pool;
552bfe3f2eSlogwang struct prod_data prod[EVT_MAX_PORTS];
562bfe3f2eSlogwang struct worker_data worker[EVT_MAX_PORTS];
572bfe3f2eSlogwang struct evt_options *opt;
582bfe3f2eSlogwang uint8_t sched_type_list[EVT_MAX_STAGES] __rte_cache_aligned;
59d30ea906Sjfb8856606 struct rte_event_timer_adapter *timer_adptr[
60d30ea906Sjfb8856606 RTE_EVENT_TIMER_ADAPTER_NUM_MAX] __rte_cache_aligned;
612bfe3f2eSlogwang } __rte_cache_aligned;
622bfe3f2eSlogwang
632bfe3f2eSlogwang struct perf_elt {
64d30ea906Sjfb8856606 union {
65d30ea906Sjfb8856606 struct rte_event_timer tim;
66d30ea906Sjfb8856606 struct {
67d30ea906Sjfb8856606 char pad[offsetof(struct rte_event_timer, user_meta)];
682bfe3f2eSlogwang uint64_t timestamp;
69d30ea906Sjfb8856606 };
70d30ea906Sjfb8856606 };
712bfe3f2eSlogwang } __rte_cache_aligned;
722bfe3f2eSlogwang
/* Burst size constant; not referenced elsewhere in this header. */
#define BURST_SIZE 16
742bfe3f2eSlogwang
/*
 * Declares and initialises the locals shared by the perf worker functions.
 *
 * Requires an identifier "arg" in scope that converts to
 * struct worker_data *. Introduces w, t, opt, dev, port, prod_timer_type,
 * sched_type_list, pool, nb_stages, laststage, cnt, bufs and sz, then prints
 * the lcore, device and port when opt->verbose_level is greater than 1.
 *
 * The expansion deliberately ends without a semicolon; the user supplies it.
 */
#define PERF_WORKER_INIT \
	struct worker_data *w = arg; \
	struct test_perf *t = w->t; \
	struct evt_options *opt = t->opt; \
	const uint8_t dev = w->dev_id; \
	const uint8_t port = w->port_id; \
	const uint8_t prod_timer_type = \
		(opt->prod_type == EVT_PROD_TYPE_EVENT_TIMER_ADPTR); \
	uint8_t *const sched_type_list = t->sched_type_list; \
	struct rte_mempool *const pool = t->pool; \
	const uint8_t nb_stages = opt->nb_stages; \
	const uint8_t laststage = nb_stages - 1; \
	uint8_t cnt = 0; \
	void *bufs[16] __rte_cache_aligned; \
	int const sz = RTE_DIM(bufs); \
	if (opt->verbose_level > 1) \
		printf("%s(): lcore %d dev_id %d port=%d\n", __func__, \
				rte_lcore_id(), dev, port)
932bfe3f2eSlogwang
94*2d9fd380Sjfb8856606 static __rte_always_inline int
perf_process_last_stage(struct rte_mempool * const pool,struct rte_event * const ev,struct worker_data * const w,void * bufs[],int const buf_sz,uint8_t count)952bfe3f2eSlogwang perf_process_last_stage(struct rte_mempool *const pool,
962bfe3f2eSlogwang struct rte_event *const ev, struct worker_data *const w,
972bfe3f2eSlogwang void *bufs[], int const buf_sz, uint8_t count)
982bfe3f2eSlogwang {
992bfe3f2eSlogwang bufs[count++] = ev->event_ptr;
1002bfe3f2eSlogwang w->processed_pkts++;
1012bfe3f2eSlogwang rte_smp_wmb();
1022bfe3f2eSlogwang
1032bfe3f2eSlogwang if (unlikely(count == buf_sz)) {
1042bfe3f2eSlogwang count = 0;
1052bfe3f2eSlogwang rte_mempool_put_bulk(pool, bufs, buf_sz);
1062bfe3f2eSlogwang }
1072bfe3f2eSlogwang return count;
1082bfe3f2eSlogwang }
1092bfe3f2eSlogwang
110*2d9fd380Sjfb8856606 static __rte_always_inline uint8_t
perf_process_last_stage_latency(struct rte_mempool * const pool,struct rte_event * const ev,struct worker_data * const w,void * bufs[],int const buf_sz,uint8_t count)1112bfe3f2eSlogwang perf_process_last_stage_latency(struct rte_mempool *const pool,
1122bfe3f2eSlogwang struct rte_event *const ev, struct worker_data *const w,
1132bfe3f2eSlogwang void *bufs[], int const buf_sz, uint8_t count)
1142bfe3f2eSlogwang {
1152bfe3f2eSlogwang uint64_t latency;
1162bfe3f2eSlogwang struct perf_elt *const m = ev->event_ptr;
1172bfe3f2eSlogwang
1182bfe3f2eSlogwang bufs[count++] = ev->event_ptr;
1192bfe3f2eSlogwang w->processed_pkts++;
1202bfe3f2eSlogwang
1212bfe3f2eSlogwang if (unlikely(count == buf_sz)) {
1222bfe3f2eSlogwang count = 0;
1232bfe3f2eSlogwang latency = rte_get_timer_cycles() - m->timestamp;
1242bfe3f2eSlogwang rte_mempool_put_bulk(pool, bufs, buf_sz);
1252bfe3f2eSlogwang } else {
1262bfe3f2eSlogwang latency = rte_get_timer_cycles() - m->timestamp;
1272bfe3f2eSlogwang }
1282bfe3f2eSlogwang
1292bfe3f2eSlogwang w->latency += latency;
1302bfe3f2eSlogwang rte_smp_wmb();
1312bfe3f2eSlogwang return count;
1322bfe3f2eSlogwang }
1332bfe3f2eSlogwang
1342bfe3f2eSlogwang
1352bfe3f2eSlogwang static inline int
perf_nb_event_ports(struct evt_options * opt)1362bfe3f2eSlogwang perf_nb_event_ports(struct evt_options *opt)
1372bfe3f2eSlogwang {
1382bfe3f2eSlogwang return evt_nr_active_lcores(opt->wlcores) +
1392bfe3f2eSlogwang evt_nr_active_lcores(opt->plcores);
1402bfe3f2eSlogwang }
1412bfe3f2eSlogwang
/*
 * Declarations only: the functions below are defined outside this header, so
 * their exact semantics are not visible here. They are grouped by name.
 */

/* Option checking and dumping. */
int perf_opt_check(struct evt_options *opt, uint64_t nb_queues);
void perf_opt_dump(struct evt_options *opt, uint8_t nb_queues);

/* *_setup() functions. */
int perf_test_setup(struct evt_test *test, struct evt_options *opt);
int perf_ethdev_setup(struct evt_test *test, struct evt_options *opt);
int perf_mempool_setup(struct evt_test *test, struct evt_options *opt);
int perf_event_dev_port_setup(struct evt_test *test,
		struct evt_options *opt, uint8_t stride, uint8_t nb_queues,
		const struct rte_event_port_conf *port_conf);
int perf_event_dev_service_setup(uint8_t dev_id);

/* Launching and result. */
int perf_launch_lcores(struct evt_test *test, struct evt_options *opt,
		int (*worker)(void *));
int perf_test_result(struct evt_test *test, struct evt_options *opt);

/* *_destroy() functions. */
void perf_test_destroy(struct evt_test *test, struct evt_options *opt);
void perf_eventdev_destroy(struct evt_test *test, struct evt_options *opt);
void perf_ethdev_destroy(struct evt_test *test, struct evt_options *opt);
void perf_mempool_destroy(struct evt_test *test, struct evt_options *opt);
1582bfe3f2eSlogwang
1592bfe3f2eSlogwang #endif /* _TEST_PERF_COMMON_ */
160