Reimplement doorbell register emulation for NTB_SB01BASE_LOCKUP.

This allows at least first three doorbells to work very close to normal
hardware, properly signaling events to upper layers without spurious or
lost events.  Doorbells above the first three may still report spurious
events due to lack of reliable information, but they are rarely used.
This commit is contained in:
mav 2016-07-09 11:57:21 +00:00
parent b2ef28faa5
commit 4353c90d6c
2 changed files with 50 additions and 61 deletions

View File

@ -44,6 +44,7 @@ __FBSDID("$FreeBSD$");
#include <sys/systm.h> #include <sys/systm.h>
#include <sys/bus.h> #include <sys/bus.h>
#include <sys/endian.h> #include <sys/endian.h>
#include <sys/interrupt.h>
#include <sys/malloc.h> #include <sys/malloc.h>
#include <sys/module.h> #include <sys/module.h>
#include <sys/mutex.h> #include <sys/mutex.h>
@ -253,6 +254,7 @@ struct ntb_softc {
uint64_t db_valid_mask; uint64_t db_valid_mask;
uint64_t db_link_mask; uint64_t db_link_mask;
uint64_t db_mask; uint64_t db_mask;
uint64_t fake_db_bell; /* NTB_SB01BASE_LOCKUP*/
int last_ts; /* ticks @ last irq */ int last_ts; /* ticks @ last irq */
@ -357,7 +359,6 @@ static void xeon_set_pbar_xlat(struct ntb_softc *, uint64_t base_addr,
enum ntb_bar idx); enum ntb_bar idx);
static int xeon_setup_b2b_mw(struct ntb_softc *, static int xeon_setup_b2b_mw(struct ntb_softc *,
const struct ntb_b2b_addr *addr, const struct ntb_b2b_addr *peer_addr); const struct ntb_b2b_addr *addr, const struct ntb_b2b_addr *peer_addr);
static int xeon_setup_msix_bar(struct ntb_softc *);
static inline bool link_is_up(struct ntb_softc *ntb); static inline bool link_is_up(struct ntb_softc *ntb);
static inline bool _xeon_link_is_up(struct ntb_softc *ntb); static inline bool _xeon_link_is_up(struct ntb_softc *ntb);
static inline bool atom_link_is_err(struct ntb_softc *ntb); static inline bool atom_link_is_err(struct ntb_softc *ntb);
@ -1193,12 +1194,10 @@ ntb_db_set_mask(device_t dev, uint64_t bits)
{ {
struct ntb_softc *ntb = device_get_softc(dev); struct ntb_softc *ntb = device_get_softc(dev);
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))
return;
DB_MASK_LOCK(ntb); DB_MASK_LOCK(ntb);
ntb->db_mask |= bits; ntb->db_mask |= bits;
db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); if (!HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))
db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask);
DB_MASK_UNLOCK(ntb); DB_MASK_UNLOCK(ntb);
} }
@ -1206,18 +1205,26 @@ static void
ntb_db_clear_mask(device_t dev, uint64_t bits) ntb_db_clear_mask(device_t dev, uint64_t bits)
{ {
struct ntb_softc *ntb = device_get_softc(dev); struct ntb_softc *ntb = device_get_softc(dev);
uint64_t ibits;
int i;
KASSERT((bits & ~ntb->db_valid_mask) == 0, KASSERT((bits & ~ntb->db_valid_mask) == 0,
("%s: Invalid bits 0x%jx (valid: 0x%jx)", __func__, ("%s: Invalid bits 0x%jx (valid: 0x%jx)", __func__,
(uintmax_t)(bits & ~ntb->db_valid_mask), (uintmax_t)(bits & ~ntb->db_valid_mask),
(uintmax_t)ntb->db_valid_mask)); (uintmax_t)ntb->db_valid_mask));
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))
return;
DB_MASK_LOCK(ntb); DB_MASK_LOCK(ntb);
ibits = ntb->fake_db_bell & ntb->db_mask & bits;
ntb->db_mask &= ~bits; ntb->db_mask &= ~bits;
db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) {
/* Simulate fake interrupts if unmasked DB bits are set. */
for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) {
if ((ibits & ntb_db_vector_mask(dev, i)) != 0)
swi_sched(ntb->int_info[i].tag, 0);
}
} else {
db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask);
}
DB_MASK_UNLOCK(ntb); DB_MASK_UNLOCK(ntb);
} }
@ -1226,17 +1233,8 @@ ntb_db_read(device_t dev)
{ {
struct ntb_softc *ntb = device_get_softc(dev); struct ntb_softc *ntb = device_get_softc(dev);
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))
uint64_t res; return (ntb->fake_db_bell);
unsigned i;
res = 0;
for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) {
if (ntb->msix_vec[i].masked != 0)
res |= ntb_db_vector_mask(dev, i);
}
return (res);
}
return (db_ioread(ntb, ntb->self_reg->db_bell)); return (db_ioread(ntb, ntb->self_reg->db_bell));
} }
@ -1252,21 +1250,9 @@ ntb_db_clear(device_t dev, uint64_t bits)
(uintmax_t)ntb->db_valid_mask)); (uintmax_t)ntb->db_valid_mask));
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) {
unsigned i; DB_MASK_LOCK(ntb);
ntb->fake_db_bell &= ~bits;
for (i = 0; i < XEON_NONLINK_DB_MSIX_BITS; i++) { DB_MASK_UNLOCK(ntb);
if ((bits & ntb_db_vector_mask(dev, i)) != 0) {
DB_MASK_LOCK(ntb);
if (ntb->msix_vec[i].masked != 0) {
/* XXX These need a public API. */
#if 0
pci_unmask_msix(ntb->device, i);
#endif
ntb->msix_vec[i].masked = 0;
}
DB_MASK_UNLOCK(ntb);
}
}
return; return;
} }
@ -1278,6 +1264,19 @@ ntb_vec_mask(struct ntb_softc *ntb, uint64_t db_vector)
{ {
uint64_t shift, mask; uint64_t shift, mask;
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) {
/*
* Remap vectors in custom way to make at least first
* three doorbells to not generate stray events.
* This breaks Linux compatibility (if one existed)
* when more then one DB is used (not by if_ntb).
*/
if (db_vector < XEON_NONLINK_DB_MSIX_BITS - 1)
return (1 << db_vector);
if (db_vector == XEON_NONLINK_DB_MSIX_BITS - 1)
return (0x7ffc);
}
shift = ntb->db_vec_shift; shift = ntb->db_vec_shift;
mask = (1ull << shift) - 1; mask = (1ull << shift) - 1;
return (mask << (shift * db_vector)); return (mask << (shift * db_vector));
@ -1299,13 +1298,16 @@ ntb_interrupt(struct ntb_softc *ntb, uint32_t vec)
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP) && if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP) &&
(vec_mask & ntb->db_link_mask) == 0) { (vec_mask & ntb->db_link_mask) == 0) {
DB_MASK_LOCK(ntb); DB_MASK_LOCK(ntb);
if (ntb->msix_vec[vec].masked == 0) {
/* XXX These need a public API. */ /* Do not report same DB events again if not cleared yet. */
#if 0 vec_mask &= ~ntb->fake_db_bell;
pci_mask_msix(ntb->device, vec);
#endif /* Update our internal doorbell register. */
ntb->msix_vec[vec].masked = 1; ntb->fake_db_bell |= vec_mask;
}
/* Do not report masked DB events. */
vec_mask &= ~ntb->db_mask;
DB_MASK_UNLOCK(ntb); DB_MASK_UNLOCK(ntb);
} }
@ -1508,6 +1510,7 @@ ntb_xeon_init_dev(struct ntb_softc *ntb)
ntb->xlat_reg = &xeon_sec_xlat; ntb->xlat_reg = &xeon_sec_xlat;
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) {
ntb->fake_db_bell = 0;
ntb->msix_mw_idx = (ntb->mw_count + g_ntb_msix_idx) % ntb->msix_mw_idx = (ntb->mw_count + g_ntb_msix_idx) %
ntb->mw_count; ntb->mw_count;
ntb_printf(2, "Setting up MSIX mw idx %d means %u\n", ntb_printf(2, "Setting up MSIX mw idx %d means %u\n",
@ -1564,10 +1567,6 @@ ntb_xeon_init_dev(struct ntb_softc *ntb)
db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask); db_iowrite(ntb, ntb->self_reg->db_mask, ntb->db_mask);
DB_MASK_UNLOCK(ntb); DB_MASK_UNLOCK(ntb);
rc = xeon_setup_msix_bar(ntb);
if (rc != 0)
return (rc);
rc = ntb_init_isr(ntb); rc = ntb_init_isr(ntb);
return (rc); return (rc);
} }
@ -1729,19 +1728,6 @@ xeon_set_pbar_xlat(struct ntb_softc *ntb, uint64_t base_addr, enum ntb_bar idx)
(void)base_addr; (void)base_addr;
} }
static int
xeon_setup_msix_bar(struct ntb_softc *ntb)
{
enum ntb_bar bar_num;
if (!HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP))
return (0);
bar_num = ntb_mw_to_bar(ntb, ntb->msix_mw_idx);
ntb->peer_lapic_bar = &ntb->bar_info[bar_num];
return (0);
}
static int static int
xeon_setup_b2b_mw(struct ntb_softc *ntb, const struct ntb_b2b_addr *addr, xeon_setup_b2b_mw(struct ntb_softc *ntb, const struct ntb_b2b_addr *addr,
const struct ntb_b2b_addr *peer_addr) const struct ntb_b2b_addr *peer_addr)
@ -1822,8 +1808,10 @@ xeon_setup_b2b_mw(struct ntb_softc *ntb, const struct ntb_b2b_addr *addr,
if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) { if (HAS_FEATURE(ntb, NTB_SB01BASE_LOCKUP)) {
size_t size, xlatoffset; size_t size, xlatoffset;
enum ntb_bar bar_num;
switch (ntb_mw_to_bar(ntb, ntb->msix_mw_idx)) { bar_num = ntb_mw_to_bar(ntb, ntb->msix_mw_idx);
switch (bar_num) {
case NTB_B2B_BAR_1: case NTB_B2B_BAR_1:
size = 8; size = 8;
xlatoffset = XEON_SBAR2XLAT_OFFSET; xlatoffset = XEON_SBAR2XLAT_OFFSET;
@ -1856,6 +1844,8 @@ xeon_setup_b2b_mw(struct ntb_softc *ntb, const struct ntb_b2b_addr *addr,
ntb_reg_write(8, xlatoffset, MSI_INTEL_ADDR_BASE); ntb_reg_write(8, xlatoffset, MSI_INTEL_ADDR_BASE);
ntb->msix_xlat = ntb_reg_read(8, xlatoffset); ntb->msix_xlat = ntb_reg_read(8, xlatoffset);
} }
ntb->peer_lapic_bar = &ntb->bar_info[bar_num];
} }
(void)ntb_reg_read(8, XEON_SBAR2XLAT_OFFSET); (void)ntb_reg_read(8, XEON_SBAR2XLAT_OFFSET);
(void)ntb_reg_read(8, XEON_SBAR4XLAT_OFFSET); (void)ntb_reg_read(8, XEON_SBAR4XLAT_OFFSET);

View File

@ -1215,7 +1215,6 @@ ntb_qp_link_work(void *arg)
qp->event_handler(qp->cb_data, NTB_LINK_UP); qp->event_handler(qp->cb_data, NTB_LINK_UP);
NTB_DB_CLEAR_MASK(ntb, 1ull << qp->qp_num); NTB_DB_CLEAR_MASK(ntb, 1ull << qp->qp_num);
taskqueue_enqueue(qp->rxc_tq, &qp->rxc_db_work);
} else if (nt->link_is_up) } else if (nt->link_is_up)
callout_reset(&qp->link_work, callout_reset(&qp->link_work,
NTB_LINK_DOWN_TIMEOUT * hz / 1000, ntb_qp_link_work, qp); NTB_LINK_DOWN_TIMEOUT * hz / 1000, ntb_qp_link_work, qp);