de2bc16e1b
In crypto producer mode, producer core enqueues cryptodev with software generated crypto ops and worker core dequeues crypto completion events from the eventdev. Event crypto metadata used for above processing is pre-populated in each crypto session. Parameter --prod_type_cryptodev can be used to enable crypto producer mode. Parameter --crypto_adptr_mode can be set to select the crypto adapter mode, 0 for OP_NEW and 1 for OP_FORWARD. This mode can be used to measure the performance of crypto adapter. Example: ./dpdk-test-eventdev -l 0-2 -w <EVENTDEV> -w <CRYPTODEV> -- \ --prod_type_cryptodev --crypto_adptr_mode 1 --test=perf_atq \ --stlist=a --wlcores 1 --plcores 2 Signed-off-by: Shijith Thotton <sthotton@marvell.com> Acked-by: Akhil Goyal <gakhil@marvell.com> Acked-by: Abhinandan Gujjar <abhinandan.gujjar@intel.com>
187 lines
5.3 KiB
C
187 lines
5.3 KiB
C
/* SPDX-License-Identifier: BSD-3-Clause
|
|
* Copyright(c) 2017 Cavium, Inc
|
|
*/
|
|
|
|
#ifndef _TEST_PERF_COMMON_
|
|
#define _TEST_PERF_COMMON_
|
|
|
|
#include <stdio.h>
|
|
#include <stdbool.h>
|
|
#include <unistd.h>
|
|
|
|
#include <rte_cryptodev.h>
|
|
#include <rte_cycles.h>
|
|
#include <rte_ethdev.h>
|
|
#include <rte_eventdev.h>
|
|
#include <rte_event_crypto_adapter.h>
|
|
#include <rte_event_eth_rx_adapter.h>
|
|
#include <rte_event_timer_adapter.h>
|
|
#include <rte_lcore.h>
|
|
#include <rte_malloc.h>
|
|
#include <rte_mempool.h>
|
|
#include <rte_prefetch.h>
|
|
|
|
#include "evt_common.h"
|
|
#include "evt_options.h"
|
|
#include "evt_test.h"
|
|
|
|
#define TEST_PERF_CA_ID 0
|
|
|
|
struct test_perf;
|
|
|
|
struct worker_data {
|
|
uint64_t processed_pkts;
|
|
uint64_t latency;
|
|
uint8_t dev_id;
|
|
uint8_t port_id;
|
|
struct test_perf *t;
|
|
} __rte_cache_aligned;
|
|
|
|
struct crypto_adptr_data {
|
|
uint8_t cdev_id;
|
|
uint16_t cdev_qp_id;
|
|
struct rte_cryptodev_sym_session **crypto_sess;
|
|
};
|
|
struct prod_data {
|
|
uint8_t dev_id;
|
|
uint8_t port_id;
|
|
uint8_t queue_id;
|
|
struct crypto_adptr_data ca;
|
|
struct test_perf *t;
|
|
} __rte_cache_aligned;
|
|
|
|
struct test_perf {
|
|
/* Don't change the offset of "done". Signal handler use this memory
|
|
* to terminate all lcores work.
|
|
*/
|
|
int done;
|
|
uint64_t outstand_pkts;
|
|
uint8_t nb_workers;
|
|
enum evt_test_result result;
|
|
uint32_t nb_flows;
|
|
uint64_t nb_pkts;
|
|
struct rte_mempool *pool;
|
|
struct prod_data prod[EVT_MAX_PORTS];
|
|
struct worker_data worker[EVT_MAX_PORTS];
|
|
struct evt_options *opt;
|
|
uint8_t sched_type_list[EVT_MAX_STAGES] __rte_cache_aligned;
|
|
struct rte_event_timer_adapter *timer_adptr[
|
|
RTE_EVENT_TIMER_ADAPTER_NUM_MAX] __rte_cache_aligned;
|
|
struct rte_mempool *ca_op_pool;
|
|
struct rte_mempool *ca_sess_pool;
|
|
struct rte_mempool *ca_sess_priv_pool;
|
|
} __rte_cache_aligned;
|
|
|
|
struct perf_elt {
|
|
union {
|
|
struct rte_event_timer tim;
|
|
struct {
|
|
char pad[offsetof(struct rte_event_timer, user_meta)];
|
|
uint64_t timestamp;
|
|
};
|
|
};
|
|
} __rte_cache_aligned;
|
|
|
|
#define BURST_SIZE 16
|
|
#define MAX_PROD_ENQ_BURST_SIZE 128
|
|
|
|
#define PERF_WORKER_INIT\
|
|
struct worker_data *w = arg;\
|
|
struct test_perf *t = w->t;\
|
|
struct evt_options *opt = t->opt;\
|
|
const uint8_t dev = w->dev_id;\
|
|
const uint8_t port = w->port_id;\
|
|
const uint8_t prod_timer_type = \
|
|
opt->prod_type == EVT_PROD_TYPE_EVENT_TIMER_ADPTR;\
|
|
const uint8_t prod_crypto_type = \
|
|
opt->prod_type == EVT_PROD_TYPE_EVENT_CRYPTO_ADPTR;\
|
|
uint8_t *const sched_type_list = &t->sched_type_list[0];\
|
|
struct rte_mempool *const pool = t->pool;\
|
|
const uint8_t nb_stages = t->opt->nb_stages;\
|
|
const uint8_t laststage = nb_stages - 1;\
|
|
uint8_t cnt = 0;\
|
|
void *bufs[16] __rte_cache_aligned;\
|
|
int const sz = RTE_DIM(bufs);\
|
|
if (opt->verbose_level > 1)\
|
|
printf("%s(): lcore %d dev_id %d port=%d\n", __func__,\
|
|
rte_lcore_id(), dev, port)
|
|
|
|
static __rte_always_inline int
|
|
perf_process_last_stage(struct rte_mempool *const pool,
|
|
struct rte_event *const ev, struct worker_data *const w,
|
|
void *bufs[], int const buf_sz, uint8_t count)
|
|
{
|
|
bufs[count++] = ev->event_ptr;
|
|
|
|
/* release fence here ensures event_prt is
|
|
* stored before updating the number of
|
|
* processed packets for worker lcores
|
|
*/
|
|
rte_atomic_thread_fence(__ATOMIC_RELEASE);
|
|
w->processed_pkts++;
|
|
|
|
if (unlikely(count == buf_sz)) {
|
|
count = 0;
|
|
rte_mempool_put_bulk(pool, bufs, buf_sz);
|
|
}
|
|
return count;
|
|
}
|
|
|
|
static __rte_always_inline uint8_t
|
|
perf_process_last_stage_latency(struct rte_mempool *const pool,
|
|
struct rte_event *const ev, struct worker_data *const w,
|
|
void *bufs[], int const buf_sz, uint8_t count)
|
|
{
|
|
uint64_t latency;
|
|
struct perf_elt *const m = ev->event_ptr;
|
|
|
|
bufs[count++] = ev->event_ptr;
|
|
|
|
/* release fence here ensures event_prt is
|
|
* stored before updating the number of
|
|
* processed packets for worker lcores
|
|
*/
|
|
rte_atomic_thread_fence(__ATOMIC_RELEASE);
|
|
w->processed_pkts++;
|
|
|
|
if (unlikely(count == buf_sz)) {
|
|
count = 0;
|
|
latency = rte_get_timer_cycles() - m->timestamp;
|
|
rte_mempool_put_bulk(pool, bufs, buf_sz);
|
|
} else {
|
|
latency = rte_get_timer_cycles() - m->timestamp;
|
|
}
|
|
|
|
w->latency += latency;
|
|
return count;
|
|
}
|
|
|
|
|
|
static inline int
|
|
perf_nb_event_ports(struct evt_options *opt)
|
|
{
|
|
return evt_nr_active_lcores(opt->wlcores) +
|
|
evt_nr_active_lcores(opt->plcores);
|
|
}
|
|
|
|
int perf_test_result(struct evt_test *test, struct evt_options *opt);
|
|
int perf_opt_check(struct evt_options *opt, uint64_t nb_queues);
|
|
int perf_test_setup(struct evt_test *test, struct evt_options *opt);
|
|
int perf_ethdev_setup(struct evt_test *test, struct evt_options *opt);
|
|
int perf_cryptodev_setup(struct evt_test *test, struct evt_options *opt);
|
|
int perf_mempool_setup(struct evt_test *test, struct evt_options *opt);
|
|
int perf_event_dev_port_setup(struct evt_test *test, struct evt_options *opt,
|
|
uint8_t stride, uint8_t nb_queues,
|
|
const struct rte_event_port_conf *port_conf);
|
|
int perf_event_dev_service_setup(uint8_t dev_id);
|
|
int perf_launch_lcores(struct evt_test *test, struct evt_options *opt,
|
|
int (*worker)(void *));
|
|
void perf_opt_dump(struct evt_options *opt, uint8_t nb_queues);
|
|
void perf_test_destroy(struct evt_test *test, struct evt_options *opt);
|
|
void perf_eventdev_destroy(struct evt_test *test, struct evt_options *opt);
|
|
void perf_cryptodev_destroy(struct evt_test *test, struct evt_options *opt);
|
|
void perf_ethdev_destroy(struct evt_test *test, struct evt_options *opt);
|
|
void perf_mempool_destroy(struct evt_test *test, struct evt_options *opt);
|
|
|
|
#endif /* _TEST_PERF_COMMON_ */
|