numam-dpdk/drivers/raw/ntb/ntb_hw_intel.c
Xiaoyun Li 11b5c7daf0 raw/ntb: add enqueue and dequeue functions
Introduce enqueue and dequeue functions to support packet based
processing. And enable write-combining for ntb driver since it
can improve the performance a lot.

Signed-off-by: Xiaoyun Li <xiaoyun.li@intel.com>
Acked-by: Jingjing Wu <jingjing.wu@intel.com>
2019-10-21 15:41:18 +02:00

392 lines
8.9 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(c) 2019 Intel Corporation.
*/
#include <stdint.h>
#include <stdio.h>
#include <errno.h>
#include <rte_io.h>
#include <rte_eal.h>
#include <rte_pci.h>
#include <rte_bus_pci.h>
#include <rte_rawdev.h>
#include <rte_rawdev_pmd.h>
#include "ntb.h"
#include "ntb_hw_intel.h"
enum xeon_ntb_bar {
XEON_NTB_BAR23 = 2,
XEON_NTB_BAR45 = 4,
};
static enum xeon_ntb_bar intel_ntb_bar[] = {
XEON_NTB_BAR23,
XEON_NTB_BAR45,
};
static int
intel_ntb_dev_init(const struct rte_rawdev *dev)
{
struct ntb_hw *hw = dev->dev_private;
uint8_t reg_val, bar;
int ret, i;
if (hw == NULL) {
NTB_LOG(ERR, "Invalid device.");
return -EINVAL;
}
ret = rte_pci_read_config(hw->pci_dev, &reg_val,
sizeof(reg_val), XEON_PPD_OFFSET);
if (ret < 0) {
NTB_LOG(ERR, "Cannot get NTB PPD (PCIe port definition).");
return -EIO;
}
/* Check connection topo type. Only support B2B. */
switch (reg_val & XEON_PPD_CONN_MASK) {
case XEON_PPD_CONN_B2B:
NTB_LOG(INFO, "Topo B2B (back to back) is using.");
break;
case XEON_PPD_CONN_TRANSPARENT:
case XEON_PPD_CONN_RP:
default:
NTB_LOG(ERR, "Not supported conn topo. Please use B2B.");
return -EINVAL;
}
/* Check device type. */
if (reg_val & XEON_PPD_DEV_DSD) {
NTB_LOG(INFO, "DSD, Downstream Device.");
hw->topo = NTB_TOPO_B2B_DSD;
} else {
NTB_LOG(INFO, "USD, Upstream device.");
hw->topo = NTB_TOPO_B2B_USD;
}
/* Check if bar4 is split. Do not support split bar. */
if (reg_val & XEON_PPD_SPLIT_BAR_MASK) {
NTB_LOG(ERR, "Do not support split bar.");
return -EINVAL;
}
hw->hw_addr = (char *)hw->pci_dev->mem_resource[0].addr;
hw->mw_cnt = XEON_MW_COUNT;
hw->db_cnt = XEON_DB_COUNT;
hw->spad_cnt = XEON_SPAD_COUNT;
hw->mw_size = rte_zmalloc("ntb_mw_size",
hw->mw_cnt * sizeof(uint64_t), 0);
for (i = 0; i < hw->mw_cnt; i++) {
bar = intel_ntb_bar[i];
hw->mw_size[i] = hw->pci_dev->mem_resource[bar].len;
}
/* Reserve the last 2 spad registers for users. */
for (i = 0; i < NTB_SPAD_USER_MAX_NUM; i++)
hw->spad_user_list[i] = hw->spad_cnt;
hw->spad_user_list[0] = hw->spad_cnt - 2;
hw->spad_user_list[1] = hw->spad_cnt - 1;
return 0;
}
static void *
intel_ntb_get_peer_mw_addr(const struct rte_rawdev *dev, int mw_idx)
{
struct ntb_hw *hw = dev->dev_private;
uint8_t bar;
if (hw == NULL) {
NTB_LOG(ERR, "Invalid device.");
return 0;
}
if (mw_idx < 0 || mw_idx >= hw->mw_cnt) {
NTB_LOG(ERR, "Invalid memory window index (0 - %u).",
hw->mw_cnt - 1);
return 0;
}
bar = intel_ntb_bar[mw_idx];
return hw->pci_dev->mem_resource[bar].addr;
}
static int
intel_ntb_mw_set_trans(const struct rte_rawdev *dev, int mw_idx,
uint64_t addr, uint64_t size)
{
struct ntb_hw *hw = dev->dev_private;
void *xlat_addr, *limit_addr;
uint64_t xlat_off, limit_off;
uint64_t base, limit;
uint8_t bar;
if (hw == NULL) {
NTB_LOG(ERR, "Invalid device.");
return -EINVAL;
}
if (mw_idx < 0 || mw_idx >= hw->mw_cnt) {
NTB_LOG(ERR, "Invalid memory window index (0 - %u).",
hw->mw_cnt - 1);
return -EINVAL;
}
bar = intel_ntb_bar[mw_idx];
xlat_off = XEON_IMBAR1XBASE_OFFSET + mw_idx * XEON_BAR_INTERVAL_OFFSET;
limit_off = XEON_IMBAR1XLMT_OFFSET + mw_idx * XEON_BAR_INTERVAL_OFFSET;
xlat_addr = hw->hw_addr + xlat_off;
limit_addr = hw->hw_addr + limit_off;
/* Limit reg val should be EMBAR base address plus MW size. */
base = addr;
limit = hw->pci_dev->mem_resource[bar].phys_addr + size;
rte_write64(base, xlat_addr);
rte_write64(limit, limit_addr);
/* Setup the external point so that remote can access. */
xlat_off = XEON_EMBAR1_OFFSET + 8 * mw_idx;
xlat_addr = hw->hw_addr + xlat_off;
limit_off = XEON_EMBAR1XLMT_OFFSET + mw_idx * XEON_BAR_INTERVAL_OFFSET;
limit_addr = hw->hw_addr + limit_off;
base = rte_read64(xlat_addr);
base &= ~0xf;
limit = base + size;
rte_write64(limit, limit_addr);
return 0;
}
static void *
intel_ntb_ioremap(const struct rte_rawdev *dev, uint64_t addr)
{
struct ntb_hw *hw = dev->dev_private;
void *mapped = NULL;
void *base;
int i;
for (i = 0; i < hw->peer_used_mws; i++) {
if (addr >= hw->peer_mw_base[i] &&
addr <= hw->peer_mw_base[i] + hw->mw_size[i]) {
base = intel_ntb_get_peer_mw_addr(dev, i);
mapped = (void *)(size_t)(addr - hw->peer_mw_base[i] +
(size_t)base);
break;
}
}
return mapped;
}
static int
intel_ntb_get_link_status(const struct rte_rawdev *dev)
{
struct ntb_hw *hw = dev->dev_private;
uint16_t reg_val;
int ret;
if (hw == NULL) {
NTB_LOG(ERR, "Invalid device.");
return -EINVAL;
}
ret = rte_pci_read_config(hw->pci_dev, &reg_val,
sizeof(reg_val), XEON_LINK_STATUS_OFFSET);
if (ret < 0) {
NTB_LOG(ERR, "Unable to get link status.");
return -EIO;
}
hw->link_status = NTB_LNK_STA_ACTIVE(reg_val);
if (hw->link_status) {
hw->link_speed = NTB_LNK_STA_SPEED(reg_val);
hw->link_width = NTB_LNK_STA_WIDTH(reg_val);
} else {
hw->link_speed = NTB_SPEED_NONE;
hw->link_width = NTB_WIDTH_NONE;
}
return 0;
}
static int
intel_ntb_set_link(const struct rte_rawdev *dev, bool up)
{
struct ntb_hw *hw = dev->dev_private;
uint32_t ntb_ctrl, reg_off;
void *reg_addr;
reg_off = XEON_NTBCNTL_OFFSET;
reg_addr = hw->hw_addr + reg_off;
ntb_ctrl = rte_read32(reg_addr);
if (up) {
ntb_ctrl &= ~(NTB_CTL_DISABLE | NTB_CTL_CFG_LOCK);
ntb_ctrl |= NTB_CTL_P2S_BAR2_SNOOP | NTB_CTL_S2P_BAR2_SNOOP;
ntb_ctrl |= NTB_CTL_P2S_BAR4_SNOOP | NTB_CTL_S2P_BAR4_SNOOP;
} else {
ntb_ctrl &= ~(NTB_CTL_P2S_BAR2_SNOOP | NTB_CTL_S2P_BAR2_SNOOP);
ntb_ctrl &= ~(NTB_CTL_P2S_BAR4_SNOOP | NTB_CTL_S2P_BAR4_SNOOP);
ntb_ctrl |= NTB_CTL_DISABLE | NTB_CTL_CFG_LOCK;
}
rte_write32(ntb_ctrl, reg_addr);
return 0;
}
static uint32_t
intel_ntb_spad_read(const struct rte_rawdev *dev, int spad, bool peer)
{
struct ntb_hw *hw = dev->dev_private;
uint32_t spad_v, reg_off;
void *reg_addr;
if (spad < 0 || spad >= hw->spad_cnt) {
NTB_LOG(ERR, "Invalid spad reg index.");
return 0;
}
/* When peer is true, read peer spad reg */
reg_off = peer ? XEON_B2B_SPAD_OFFSET : XEON_IM_SPAD_OFFSET;
reg_addr = hw->hw_addr + reg_off + (spad << 2);
spad_v = rte_read32(reg_addr);
return spad_v;
}
static int
intel_ntb_spad_write(const struct rte_rawdev *dev, int spad,
bool peer, uint32_t spad_v)
{
struct ntb_hw *hw = dev->dev_private;
uint32_t reg_off;
void *reg_addr;
if (spad < 0 || spad >= hw->spad_cnt) {
NTB_LOG(ERR, "Invalid spad reg index.");
return -EINVAL;
}
/* When peer is true, write peer spad reg */
reg_off = peer ? XEON_B2B_SPAD_OFFSET : XEON_IM_SPAD_OFFSET;
reg_addr = hw->hw_addr + reg_off + (spad << 2);
rte_write32(spad_v, reg_addr);
return 0;
}
static uint64_t
intel_ntb_db_read(const struct rte_rawdev *dev)
{
struct ntb_hw *hw = dev->dev_private;
uint64_t db_off, db_bits;
void *db_addr;
db_off = XEON_IM_INT_STATUS_OFFSET;
db_addr = hw->hw_addr + db_off;
db_bits = rte_read64(db_addr);
return db_bits;
}
static int
intel_ntb_db_clear(const struct rte_rawdev *dev, uint64_t db_bits)
{
struct ntb_hw *hw = dev->dev_private;
uint64_t db_off;
void *db_addr;
db_off = XEON_IM_INT_STATUS_OFFSET;
db_addr = hw->hw_addr + db_off;
rte_write64(db_bits, db_addr);
return 0;
}
static int
intel_ntb_db_set_mask(const struct rte_rawdev *dev, uint64_t db_mask)
{
struct ntb_hw *hw = dev->dev_private;
uint64_t db_m_off;
void *db_m_addr;
db_m_off = XEON_IM_INT_DISABLE_OFFSET;
db_m_addr = hw->hw_addr + db_m_off;
db_mask |= hw->db_mask;
rte_write64(db_mask, db_m_addr);
hw->db_mask = db_mask;
return 0;
}
static int
intel_ntb_peer_db_set(const struct rte_rawdev *dev, uint8_t db_idx)
{
struct ntb_hw *hw = dev->dev_private;
uint32_t db_off;
void *db_addr;
if (((uint64_t)1 << db_idx) & ~hw->db_valid_mask) {
NTB_LOG(ERR, "Invalid doorbell.");
return -EINVAL;
}
db_off = XEON_IM_DOORBELL_OFFSET + db_idx * 4;
db_addr = hw->hw_addr + db_off;
rte_write32(1, db_addr);
return 0;
}
static int
intel_ntb_vector_bind(const struct rte_rawdev *dev, uint8_t intr, uint8_t msix)
{
struct ntb_hw *hw = dev->dev_private;
uint8_t reg_off;
void *reg_addr;
if (intr >= hw->db_cnt) {
NTB_LOG(ERR, "Invalid intr source.");
return -EINVAL;
}
/* Bind intr source to msix vector */
reg_off = XEON_INTVEC_OFFSET;
reg_addr = hw->hw_addr + reg_off + intr;
rte_write8(msix, reg_addr);
return 0;
}
/* operations for primary side of local ntb */
const struct ntb_dev_ops intel_ntb_ops = {
.ntb_dev_init = intel_ntb_dev_init,
.get_peer_mw_addr = intel_ntb_get_peer_mw_addr,
.mw_set_trans = intel_ntb_mw_set_trans,
.ioremap = intel_ntb_ioremap,
.get_link_status = intel_ntb_get_link_status,
.set_link = intel_ntb_set_link,
.spad_read = intel_ntb_spad_read,
.spad_write = intel_ntb_spad_write,
.db_read = intel_ntb_db_read,
.db_clear = intel_ntb_db_clear,
.db_set_mask = intel_ntb_db_set_mask,
.peer_db_set = intel_ntb_peer_db_set,
.vector_bind = intel_ntb_vector_bind,
};