numam-dpdk/lib/librte_ring/rte_ring_peek_zc.h
Honnappa Nagarahalli 47bec9a5ca ring: add zero copy API
Add zero-copy APIs. These APIs provide the capability to
copy the data to/from the ring memory directly, without
having a temporary copy (for ex: an array of mbufs on
the stack). Use cases that involve copying large amount
of data to/from the ring can benefit from these APIs.

Signed-off-by: Honnappa Nagarahalli <honnappa.nagarahalli@arm.com>
Reviewed-by: Dharmik Thakkar <dharmik.thakkar@arm.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2020-10-29 14:13:31 +01:00

550 lines
17 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
*
* Copyright (c) 2020 Arm Limited
* Copyright (c) 2007-2009 Kip Macy kmacy@freebsd.org
* All rights reserved.
* Derived from FreeBSD's bufring.h
* Used as BSD-3 Licensed with permission from Kip Macy.
*/
#ifndef _RTE_RING_PEEK_ZC_H_
#define _RTE_RING_PEEK_ZC_H_
/**
* @file
* @b EXPERIMENTAL: this API may change without prior notice
* It is not recommended to include this file directly.
* Please include <rte_ring_elem.h> instead.
*
* Ring Peek Zero Copy APIs
* These APIs make it possible to split public enqueue/dequeue API
* into 3 parts:
* - enqueue/dequeue start
* - copy data to/from the ring
* - enqueue/dequeue finish
* Along with the advantages of the peek APIs, these APIs provide the ability
* to avoid copying of the data to temporary area (for ex: array of mbufs
* on the stack).
*
* Note that currently these APIs are available only for two sync modes:
* 1) Single Producer/Single Consumer (RTE_RING_SYNC_ST)
* 2) Serialized Producer/Serialized Consumer (RTE_RING_SYNC_MT_HTS).
* It is user's responsibility to create/init ring with appropriate sync
* modes selected.
*
* Following are some examples showing the API usage.
* 1)
* struct elem_obj {uint64_t a; uint32_t b, c;};
* struct elem_obj *obj;
*
* // Create ring with sync type RTE_RING_SYNC_ST or RTE_RING_SYNC_MT_HTS
* // Reserve space on the ring
* n = rte_ring_enqueue_zc_bulk_elem_start(r, sizeof(elem_obj), 1, &zcd, NULL);
*
* // Produce the data directly on the ring memory
* obj = (struct elem_obj *)zcd->ptr1;
* obj->a = rte_get_a();
* obj->b = rte_get_b();
* obj->c = rte_get_c();
* rte_ring_enqueue_zc_elem_finish(ring, n);
*
* 2)
* // Create ring with sync type RTE_RING_SYNC_ST or RTE_RING_SYNC_MT_HTS
* // Reserve space on the ring
* n = rte_ring_enqueue_zc_burst_start(r, 32, &zcd, NULL);
*
* // Pkt I/O core polls packets from the NIC
* if (n != 0) {
* nb_rx = rte_eth_rx_burst(portid, queueid, zcd->ptr1, zcd->n1);
* if (nb_rx == zcd->n1 && n != zcd->n1)
* nb_rx = rte_eth_rx_burst(portid, queueid,
* zcd->ptr2, n - zcd->n1);
*
* // Provide packets to the packet processing cores
* rte_ring_enqueue_zc_finish(r, nb_rx);
* }
*
* Note that between _start_ and _finish_ none other thread can proceed
* with enqueue/dequeue operation till _finish_ completes.
*/
#ifdef __cplusplus
extern "C" {
#endif
#include <rte_ring_peek_c11_mem.h>
/**
* Ring zero-copy information structure.
*
* This structure contains the pointers and length of the space
* reserved on the ring storage.
*/
struct rte_ring_zc_data {
/* Pointer to the first space in the ring */
void *ptr1;
/* Pointer to the second space in the ring if there is wrap-around.
* It contains valid value only if wrap-around happens.
*/
void *ptr2;
/* Number of elements in the first pointer. If this is equal to
* the number of elements requested, then ptr2 is NULL.
* Otherwise, subtracting n1 from number of elements requested
* will give the number of elements available at ptr2.
*/
unsigned int n1;
} __rte_cache_aligned;
static __rte_always_inline void
__rte_ring_get_elem_addr(struct rte_ring *r, uint32_t head,
uint32_t esize, uint32_t num, void **dst1, uint32_t *n1, void **dst2)
{
uint32_t idx, scale, nr_idx;
uint32_t *ring = (uint32_t *)&r[1];
/* Normalize to uint32_t */
scale = esize / sizeof(uint32_t);
idx = head & r->mask;
nr_idx = idx * scale;
*dst1 = ring + nr_idx;
*n1 = num;
if (idx + num > r->size) {
*n1 = r->size - idx;
*dst2 = ring;
} else {
*dst2 = NULL;
}
}
/**
* @internal This function moves prod head value.
*/
static __rte_always_inline unsigned int
__rte_ring_do_enqueue_zc_elem_start(struct rte_ring *r, unsigned int esize,
uint32_t n, enum rte_ring_queue_behavior behavior,
struct rte_ring_zc_data *zcd, unsigned int *free_space)
{
uint32_t free, head, next;
switch (r->prod.sync_type) {
case RTE_RING_SYNC_ST:
n = __rte_ring_move_prod_head(r, RTE_RING_SYNC_ST, n,
behavior, &head, &next, &free);
break;
case RTE_RING_SYNC_MT_HTS:
n = __rte_ring_hts_move_prod_head(r, n, behavior, &head, &free);
break;
case RTE_RING_SYNC_MT:
case RTE_RING_SYNC_MT_RTS:
default:
/* unsupported mode, shouldn't be here */
RTE_ASSERT(0);
n = 0;
free = 0;
return n;
}
__rte_ring_get_elem_addr(r, head, esize, n, &zcd->ptr1,
&zcd->n1, &zcd->ptr2);
if (free_space != NULL)
*free_space = free - n;
return n;
}
/**
* Start to enqueue several objects on the ring.
* Note that no actual objects are put in the queue by this function,
* it just reserves space for the user on the ring.
* User has to copy objects into the queue using the returned pointers.
* User should call rte_ring_enqueue_zc_elem_finish to complete the
* enqueue operation.
*
* @param r
* A pointer to the ring structure.
* @param esize
* The size of ring element, in bytes. It must be a multiple of 4.
* @param n
* The number of objects to add in the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param free_space
* If non-NULL, returns the amount of space in the ring after the
* reservation operation has finished.
* @return
* The number of objects that can be enqueued, either 0 or n
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_enqueue_zc_bulk_elem_start(struct rte_ring *r, unsigned int esize,
unsigned int n, struct rte_ring_zc_data *zcd, unsigned int *free_space)
{
return __rte_ring_do_enqueue_zc_elem_start(r, esize, n,
RTE_RING_QUEUE_FIXED, zcd, free_space);
}
/**
* Start to enqueue several pointers to objects on the ring.
* Note that no actual pointers are put in the queue by this function,
* it just reserves space for the user on the ring.
* User has to copy pointers to objects into the queue using the
* returned pointers.
* User should call rte_ring_enqueue_zc_finish to complete the
* enqueue operation.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to add in the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param free_space
* If non-NULL, returns the amount of space in the ring after the
* reservation operation has finished.
* @return
* The number of objects that can be enqueued, either 0 or n
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_enqueue_zc_bulk_start(struct rte_ring *r, unsigned int n,
struct rte_ring_zc_data *zcd, unsigned int *free_space)
{
return rte_ring_enqueue_zc_bulk_elem_start(r, sizeof(uintptr_t), n,
zcd, free_space);
}
/**
* Start to enqueue several objects on the ring.
* Note that no actual objects are put in the queue by this function,
* it just reserves space for the user on the ring.
* User has to copy objects into the queue using the returned pointers.
* User should call rte_ring_enqueue_zc_elem_finish to complete the
* enqueue operation.
*
* @param r
* A pointer to the ring structure.
* @param esize
* The size of ring element, in bytes. It must be a multiple of 4.
* @param n
* The number of objects to add in the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param free_space
* If non-NULL, returns the amount of space in the ring after the
* reservation operation has finished.
* @return
* The number of objects that can be enqueued, either 0 or n
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_enqueue_zc_burst_elem_start(struct rte_ring *r, unsigned int esize,
unsigned int n, struct rte_ring_zc_data *zcd, unsigned int *free_space)
{
return __rte_ring_do_enqueue_zc_elem_start(r, esize, n,
RTE_RING_QUEUE_VARIABLE, zcd, free_space);
}
/**
* Start to enqueue several pointers to objects on the ring.
* Note that no actual pointers are put in the queue by this function,
* it just reserves space for the user on the ring.
* User has to copy pointers to objects into the queue using the
* returned pointers.
* User should call rte_ring_enqueue_zc_finish to complete the
* enqueue operation.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to add in the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param free_space
* If non-NULL, returns the amount of space in the ring after the
* reservation operation has finished.
* @return
* The number of objects that can be enqueued, either 0 or n.
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_enqueue_zc_burst_start(struct rte_ring *r, unsigned int n,
struct rte_ring_zc_data *zcd, unsigned int *free_space)
{
return rte_ring_enqueue_zc_burst_elem_start(r, sizeof(uintptr_t), n,
zcd, free_space);
}
/**
* Complete enqueuing several objects on the ring.
* Note that number of objects to enqueue should not exceed previous
* enqueue_start return value.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to add to the ring.
*/
__rte_experimental
static __rte_always_inline void
rte_ring_enqueue_zc_elem_finish(struct rte_ring *r, unsigned int n)
{
uint32_t tail;
switch (r->prod.sync_type) {
case RTE_RING_SYNC_ST:
n = __rte_ring_st_get_tail(&r->prod, &tail, n);
__rte_ring_st_set_head_tail(&r->prod, tail, n, 1);
break;
case RTE_RING_SYNC_MT_HTS:
n = __rte_ring_hts_get_tail(&r->hts_prod, &tail, n);
__rte_ring_hts_set_head_tail(&r->hts_prod, tail, n, 1);
break;
case RTE_RING_SYNC_MT:
case RTE_RING_SYNC_MT_RTS:
default:
/* unsupported mode, shouldn't be here */
RTE_ASSERT(0);
}
}
/**
* Complete enqueuing several pointers to objects on the ring.
* Note that number of objects to enqueue should not exceed previous
* enqueue_start return value.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of pointers to objects to add to the ring.
*/
__rte_experimental
static __rte_always_inline void
rte_ring_enqueue_zc_finish(struct rte_ring *r, unsigned int n)
{
rte_ring_enqueue_zc_elem_finish(r, n);
}
/**
* @internal This function moves cons head value and copies up to *n*
* objects from the ring to the user provided obj_table.
*/
static __rte_always_inline unsigned int
__rte_ring_do_dequeue_zc_elem_start(struct rte_ring *r,
uint32_t esize, uint32_t n, enum rte_ring_queue_behavior behavior,
struct rte_ring_zc_data *zcd, unsigned int *available)
{
uint32_t avail, head, next;
switch (r->cons.sync_type) {
case RTE_RING_SYNC_ST:
n = __rte_ring_move_cons_head(r, RTE_RING_SYNC_ST, n,
behavior, &head, &next, &avail);
break;
case RTE_RING_SYNC_MT_HTS:
n = __rte_ring_hts_move_cons_head(r, n, behavior,
&head, &avail);
break;
case RTE_RING_SYNC_MT:
case RTE_RING_SYNC_MT_RTS:
default:
/* unsupported mode, shouldn't be here */
RTE_ASSERT(0);
n = 0;
avail = 0;
return n;
}
__rte_ring_get_elem_addr(r, head, esize, n, &zcd->ptr1,
&zcd->n1, &zcd->ptr2);
if (available != NULL)
*available = avail - n;
return n;
}
/**
* Start to dequeue several objects from the ring.
* Note that no actual objects are copied from the queue by this function.
* User has to copy objects from the queue using the returned pointers.
* User should call rte_ring_dequeue_zc_elem_finish to complete the
* dequeue operation.
*
* @param r
* A pointer to the ring structure.
* @param esize
* The size of ring element, in bytes. It must be a multiple of 4.
* @param n
* The number of objects to remove from the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param available
* If non-NULL, returns the number of remaining ring entries after the
* dequeue has finished.
* @return
* The number of objects that can be dequeued, either 0 or n.
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_dequeue_zc_bulk_elem_start(struct rte_ring *r, unsigned int esize,
unsigned int n, struct rte_ring_zc_data *zcd, unsigned int *available)
{
return __rte_ring_do_dequeue_zc_elem_start(r, esize, n,
RTE_RING_QUEUE_FIXED, zcd, available);
}
/**
* Start to dequeue several pointers to objects from the ring.
* Note that no actual pointers are removed from the queue by this function.
* User has to copy pointers to objects from the queue using the
* returned pointers.
* User should call rte_ring_dequeue_zc_finish to complete the
* dequeue operation.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to remove from the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param available
* If non-NULL, returns the number of remaining ring entries after the
* dequeue has finished.
* @return
* The number of objects that can be dequeued, either 0 or n.
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_dequeue_zc_bulk_start(struct rte_ring *r, unsigned int n,
struct rte_ring_zc_data *zcd, unsigned int *available)
{
return rte_ring_dequeue_zc_bulk_elem_start(r, sizeof(uintptr_t),
n, zcd, available);
}
/**
* Start to dequeue several objects from the ring.
* Note that no actual objects are copied from the queue by this function.
* User has to copy objects from the queue using the returned pointers.
* User should call rte_ring_dequeue_zc_elem_finish to complete the
* dequeue operation.
*
* @param r
* A pointer to the ring structure.
* @param esize
* The size of ring element, in bytes. It must be a multiple of 4.
* This must be the same value used while creating the ring. Otherwise
* the results are undefined.
* @param n
* The number of objects to dequeue from the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param available
* If non-NULL, returns the number of remaining ring entries after the
* dequeue has finished.
* @return
* The number of objects that can be dequeued, either 0 or n.
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_dequeue_zc_burst_elem_start(struct rte_ring *r, unsigned int esize,
unsigned int n, struct rte_ring_zc_data *zcd, unsigned int *available)
{
return __rte_ring_do_dequeue_zc_elem_start(r, esize, n,
RTE_RING_QUEUE_VARIABLE, zcd, available);
}
/**
* Start to dequeue several pointers to objects from the ring.
* Note that no actual pointers are removed from the queue by this function.
* User has to copy pointers to objects from the queue using the
* returned pointers.
* User should call rte_ring_dequeue_zc_finish to complete the
* dequeue operation.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to remove from the ring.
* @param zcd
* Structure containing the pointers and length of the space
* reserved on the ring storage.
* @param available
* If non-NULL, returns the number of remaining ring entries after the
* dequeue has finished.
* @return
* The number of objects that can be dequeued, either 0 or n.
*/
__rte_experimental
static __rte_always_inline unsigned int
rte_ring_dequeue_zc_burst_start(struct rte_ring *r, unsigned int n,
struct rte_ring_zc_data *zcd, unsigned int *available)
{
return rte_ring_dequeue_zc_burst_elem_start(r, sizeof(uintptr_t), n,
zcd, available);
}
/**
* Complete dequeuing several objects from the ring.
* Note that number of objects to dequeued should not exceed previous
* dequeue_start return value.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to remove from the ring.
*/
__rte_experimental
static __rte_always_inline void
rte_ring_dequeue_zc_elem_finish(struct rte_ring *r, unsigned int n)
{
uint32_t tail;
switch (r->cons.sync_type) {
case RTE_RING_SYNC_ST:
n = __rte_ring_st_get_tail(&r->cons, &tail, n);
__rte_ring_st_set_head_tail(&r->cons, tail, n, 0);
break;
case RTE_RING_SYNC_MT_HTS:
n = __rte_ring_hts_get_tail(&r->hts_cons, &tail, n);
__rte_ring_hts_set_head_tail(&r->hts_cons, tail, n, 0);
break;
case RTE_RING_SYNC_MT:
case RTE_RING_SYNC_MT_RTS:
default:
/* unsupported mode, shouldn't be here */
RTE_ASSERT(0);
}
}
/**
* Complete dequeuing several objects from the ring.
* Note that number of objects to dequeued should not exceed previous
* dequeue_start return value.
*
* @param r
* A pointer to the ring structure.
* @param n
* The number of objects to remove from the ring.
*/
__rte_experimental
static __rte_always_inline void
rte_ring_dequeue_zc_finish(struct rte_ring *r, unsigned int n)
{
rte_ring_dequeue_elem_finish(r, n);
}
#ifdef __cplusplus
}
#endif
#endif /* _RTE_RING_PEEK_ZC_H_ */