PowerNV: initial support for PCIe host controller

Provide initial support for PCIe host controller as
well as for IOMMU mapping. This commit allows proper
bus enumeration, but does not guarantee DMA operations
are working.

Created by:            Nathan Whitehorn <nwhitehorn@freebsd.org>
Submitted by:          Wojciech Macek <wma@semihalf.com>
Sponsored by:          FreeBSD Foundation
This commit is contained in:
Wojciech Macek 2018-01-12 07:55:49 +00:00
parent 4ce147895c
commit ac9b43252a
3 changed files with 612 additions and 7 deletions

View File

@ -185,6 +185,8 @@ powerpc/powermac/uninorthpci.c optional powermac pci
powerpc/powermac/vcoregpio.c optional powermac
powerpc/powernv/opal.c optional powernv
powerpc/powernv/opal_console.c optional powernv
powerpc/powernv/opal_dev.c optional powernv
powerpc/powernv/opal_pci.c optional powernv pci
powerpc/powernv/opalcall.S optional powernv
powerpc/powernv/platform_powernv.c optional powernv
powerpc/powerpc/altivec.c optional powerpc | powerpc64

View File

@ -38,13 +38,40 @@ int opal_check(void);
/* Call an OPAL method. Any pointers passed must be real-mode accessible! */
int opal_call(uint64_t token, ...);
#define OPAL_CONSOLE_WRITE 1
#define OPAL_CONSOLE_READ 2
#define OPAL_CEC_POWER_DOWN 5
#define OPAL_CEC_REBOOT 6
#define OPAL_START_CPU 41
#define OPAL_CONSOLE_WRITE 1
#define OPAL_CONSOLE_READ 2
#define OPAL_CEC_POWER_DOWN 5
#define OPAL_CEC_REBOOT 6
#define OPAL_HANDLE_INTERRUPT 9
#define OPAL_PCI_CONFIG_READ_BYTE 13
#define OPAL_PCI_CONFIG_READ_HALF_WORD 14
#define OPAL_PCI_CONFIG_READ_WORD 15
#define OPAL_PCI_CONFIG_WRITE_BYTE 16
#define OPAL_PCI_CONFIG_WRITE_HALF_WORD 17
#define OPAL_PCI_CONFIG_WRITE_WORD 18
#define OPAL_PCI_EEH_FREEZE_CLEAR 26
#define OPAL_PCI_PHB_MMIO_ENABLE 27
#define OPAL_PCI_SET_PHB_MEM_WINDOW 28
#define OPAL_PCI_MAP_PE_MMIO_WINDOW 29
#define OPAL_PCI_SET_XIVE_PE 37
#define OPAL_PCI_RESET 49
#define OPAL_PCI_POLL 62
#define OPAL_PCI_SET_PE 31
#define OPAL_START_CPU 41
#define OPAL_GET_MSI_32 39
#define OPAL_GET_MSI_64 40
#define OPAL_PCI_MSI_EOI 63
#define OPAL_PCI_MAP_PE_DMA_WINDOW_REAL 45
#define OPAL_RETURN_CPU 69
#define OPAL_REINIT_CPUS 70
#define OPAL_SUCCESS 0
#define OPAL_BUSY_EVENT -12
/* For OPAL_PCI_SET_PE */
#define OPAL_UNMAP_PE 0
#define OPAL_MAP_PE 1
#define OPAL_SUCCESS 0
#define OPAL_PARAMETER -1
#define OPAL_CLOSED -5
#define OPAL_BUSY_EVENT -12
#endif

View File

@ -0,0 +1,576 @@
/*-
* Copyright (c) 2015-2016 Nathan Whitehorn
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/module.h>
#include <sys/bus.h>
#include <sys/conf.h>
#include <sys/kernel.h>
#include <sys/pciio.h>
#include <sys/endian.h>
#include <sys/rman.h>
#include <sys/vmem.h>
#include <dev/ofw/openfirm.h>
#include <dev/ofw/ofw_pci.h>
#include <dev/ofw/ofw_bus.h>
#include <dev/ofw/ofw_bus_subr.h>
#include <dev/ofw/ofwpci.h>
#include <dev/pci/pcivar.h>
#include <dev/pci/pcireg.h>
#include <machine/bus.h>
#include <machine/intr_machdep.h>
#include <machine/md_var.h>
#include <vm/vm.h>
#include <vm/pmap.h>
#include "pcib_if.h"
#include "pic_if.h"
#include "iommu_if.h"
#include "opal.h"
/*
* Device interface.
*/
static int opalpci_probe(device_t);
static int opalpci_attach(device_t);
/*
* pcib interface.
*/
static uint32_t opalpci_read_config(device_t, u_int, u_int, u_int,
u_int, int);
static void opalpci_write_config(device_t, u_int, u_int, u_int,
u_int, u_int32_t, int);
static int opalpci_alloc_msi(device_t dev, device_t child,
int count, int maxcount, int *irqs);
static int opalpci_release_msi(device_t dev, device_t child,
int count, int *irqs);
static int opalpci_alloc_msix(device_t dev, device_t child,
int *irq);
static int opalpci_release_msix(device_t dev, device_t child,
int irq);
static int opalpci_map_msi(device_t dev, device_t child,
int irq, uint64_t *addr, uint32_t *data);
static int opalpci_route_interrupt(device_t bus, device_t dev, int pin);
/*
* MSI PIC interface.
*/
static void opalpic_pic_enable(device_t dev, u_int irq, u_int vector);
static void opalpic_pic_eoi(device_t dev, u_int irq);
static void opalpic_pic_mask(device_t dev, u_int irq);
static void opalpic_pic_unmask(device_t dev, u_int irq);
/*
* Commands
*/
#define OPAL_M32_WINDOW_TYPE 1
#define OPAL_M64_WINDOW_TYPE 2
#define OPAL_IO_WINDOW_TYPE 3
#define OPAL_RESET_PHB_COMPLETE 1
#define OPAL_RESET_PCI_IODA_TABLE 6
#define OPAL_DISABLE_M64 0
#define OPAL_ENABLE_M64_SPLIT 1
#define OPAL_ENABLE_M64_NON_SPLIT 2
#define OPAL_EEH_ACTION_CLEAR_FREEZE_MMIO 1
#define OPAL_EEH_ACTION_CLEAR_FREEZE_DMA 2
#define OPAL_EEH_ACTION_CLEAR_FREEZE_ALL 3
/*
* Constants
*/
#define OPAL_PCI_DEFAULT_PE 1
/*
* Driver methods.
*/
static device_method_t opalpci_methods[] = {
/* Device interface */
DEVMETHOD(device_probe, opalpci_probe),
DEVMETHOD(device_attach, opalpci_attach),
/* pcib interface */
DEVMETHOD(pcib_read_config, opalpci_read_config),
DEVMETHOD(pcib_write_config, opalpci_write_config),
DEVMETHOD(pcib_alloc_msi, opalpci_alloc_msi),
DEVMETHOD(pcib_release_msi, opalpci_release_msi),
DEVMETHOD(pcib_alloc_msix, opalpci_alloc_msix),
DEVMETHOD(pcib_release_msix, opalpci_release_msix),
DEVMETHOD(pcib_map_msi, opalpci_map_msi),
DEVMETHOD(pcib_route_interrupt, opalpci_route_interrupt),
/* PIC interface for MSIs */
DEVMETHOD(pic_enable, opalpic_pic_enable),
DEVMETHOD(pic_eoi, opalpic_pic_eoi),
DEVMETHOD(pic_mask, opalpic_pic_mask),
DEVMETHOD(pic_unmask, opalpic_pic_unmask),
DEVMETHOD_END
};
struct opalpci_softc {
struct ofw_pci_softc ofw_sc;
uint64_t phb_id;
vmem_t *msi_vmem;
int msi_base; /* Base XIVE number */
int base_msi_irq; /* Base IRQ assigned by FreeBSD to this PIC */
};
static devclass_t opalpci_devclass;
DEFINE_CLASS_1(pcib, opalpci_driver, opalpci_methods,
sizeof(struct opalpci_softc), ofw_pci_driver);
EARLY_DRIVER_MODULE(opalpci, ofwbus, opalpci_driver, opalpci_devclass, 0, 0,
BUS_PASS_BUS);
static int
opalpci_probe(device_t dev)
{
const char *type;
if (opal_check() != 0)
return (ENXIO);
type = ofw_bus_get_type(dev);
if (type == NULL || (strcmp(type, "pci") != 0 &&
strcmp(type, "pciex") != 0))
return (ENXIO);
if (!OF_hasprop(ofw_bus_get_node(dev), "ibm,opal-phbid"))
return (ENXIO);
device_set_desc(dev, "OPAL Host-PCI bridge");
return (BUS_PROBE_GENERIC);
}
static int
opalpci_attach(device_t dev)
{
struct opalpci_softc *sc;
cell_t id[2], m64window[6], npe;
int i, err;
sc = device_get_softc(dev);
switch (OF_getproplen(ofw_bus_get_node(dev), "ibm,opal-phbid")) {
case 8:
OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-phbid", id, 8);
sc->phb_id = ((uint64_t)id[0] << 32) | id[1];
break;
case 4:
OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-phbid", id, 4);
sc->phb_id = id[0];
break;
default:
device_printf(dev, "PHB ID property had wrong length (%zd)\n",
OF_getproplen(ofw_bus_get_node(dev), "ibm,opal-phbid"));
return (ENXIO);
}
if (bootverbose)
device_printf(dev, "OPAL ID %#lx\n", sc->phb_id);
/*
* Reset PCI IODA table
*/
err = opal_call(OPAL_PCI_RESET, sc->phb_id, OPAL_RESET_PCI_IODA_TABLE,
1);
if (err != 0) {
device_printf(dev, "IODA table reset failed: %d\n", err);
return (ENXIO);
}
while ((err = opal_call(OPAL_PCI_POLL, sc->phb_id)) > 0)
DELAY(1000*err); /* Returns expected delay in ms */
if (err < 0) {
device_printf(dev, "PHB IODA reset poll failed: %d\n", err);
return (ENXIO);
}
/*
* Reset everything. Especially important if we have inherited the
* system from Linux by kexec()
*/
#ifdef NOTYET
if (bootverbose)
device_printf(dev, "Resetting PCI bus\n");
err = opal_call(OPAL_PCI_RESET, sc->phb_id, OPAL_RESET_PHB_COMPLETE, 1);
if (err < 0) {
device_printf(dev, "PHB reset failed: %d\n", err);
return (ENXIO);
}
while ((err = opal_call(OPAL_PCI_POLL, sc->phb_id)) > 0)
DELAY(1000*err); /* Returns expected delay in ms */
if (err < 0) {
device_printf(dev, "PHB reset poll failed: %d\n", err);
return (ENXIO);
}
DELAY(10000);
err = opal_call(OPAL_PCI_RESET, sc->phb_id, OPAL_RESET_PHB_COMPLETE, 0);
if (err < 0) {
device_printf(dev, "PHB reset completion failed: %d\n", err);
return (ENXIO);
}
while ((err = opal_call(OPAL_PCI_POLL, sc->phb_id)) > 0)
DELAY(1000*err); /* Returns expected delay in ms */
if (err < 0) {
device_printf(dev, "PHB reset completion poll failed: %d\n",
err);
return (ENXIO);
}
DELAY(10000);
#endif
/*
* Map all devices on the bus to partitionable endpoint one until
* such time as we start wanting to do things like bhyve.
*/
err = opal_call(OPAL_PCI_SET_PE, sc->phb_id, OPAL_PCI_DEFAULT_PE,
0, 0, 0, 0, /* All devices */
OPAL_MAP_PE);
if (err != 0) {
device_printf(dev, "PE mapping failed: %d\n", err);
return (ENXIO);
}
/*
* Turn on MMIO, mapped to PE 1
*/
if (OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-num-pes", &npe, 4)
!= 4)
npe = 1;
for (i = 0; i < npe; i++) {
err = opal_call(OPAL_PCI_MAP_PE_MMIO_WINDOW, sc->phb_id,
OPAL_PCI_DEFAULT_PE, OPAL_M32_WINDOW_TYPE, 0, i);
if (err != 0)
device_printf(dev, "MMIO %d map failed: %d\n", i, err);
}
/* XXX: multiple M64 windows? */
if (OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-m64-window",
m64window, sizeof(m64window)) == sizeof(m64window)) {
opal_call(OPAL_PCI_SET_PHB_MEM_WINDOW, sc->phb_id,
OPAL_M64_WINDOW_TYPE, 0 /* index */,
((uint64_t)m64window[2] << 32) | m64window[3], 0,
((uint64_t)m64window[4] << 32) | m64window[5]);
opal_call(OPAL_PCI_MAP_PE_MMIO_WINDOW, sc->phb_id,
OPAL_PCI_DEFAULT_PE, OPAL_M64_WINDOW_TYPE,
0 /* index */, 0);
opal_call(OPAL_PCI_PHB_MMIO_ENABLE, sc->phb_id,
OPAL_M64_WINDOW_TYPE, 0, OPAL_ENABLE_M64_NON_SPLIT);
}
/*
* Also disable the IOMMU for the time being for PE 1 (everything)
*/
if (bootverbose)
device_printf(dev, "Mapping 0-%#lx for DMA\n",
roundup2(powerpc_ptob(Maxmem), 16*1024*1024));
err = opal_call(OPAL_PCI_MAP_PE_DMA_WINDOW_REAL, sc->phb_id,
OPAL_PCI_DEFAULT_PE, OPAL_PCI_DEFAULT_PE << 1,
0 /* start address */, roundup2(powerpc_ptob(Maxmem),
16*1024*1024)/* all RAM */);
if (err != 0) {
device_printf(dev, "DMA mapping failed: %d\n", err);
return (ENXIO);
}
/*
* Get MSI properties
*/
sc->msi_vmem = NULL;
if (OF_getproplen(ofw_bus_get_node(dev), "ibm,opal-msi-ranges") > 0) {
cell_t msi_ranges[2];
OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-msi-ranges",
msi_ranges, sizeof(msi_ranges));
sc->msi_base = msi_ranges[0];
sc->msi_vmem = vmem_create("OPAL MSI", msi_ranges[0],
msi_ranges[1], 1, 16, M_BESTFIT | M_WAITOK);
sc->base_msi_irq = powerpc_register_pic(dev,
OF_xref_from_node(ofw_bus_get_node(dev)),
msi_ranges[0] + msi_ranges[1], 0, FALSE);
if (bootverbose)
device_printf(dev, "Supports %d MSIs starting at %d\n",
msi_ranges[1], msi_ranges[0]);
}
/*
* General OFW PCI attach
*/
err = ofw_pci_init(dev);
if (err != 0)
return (err);
/*
* Unfreeze non-config-space PCI operations. Let this fail silently
* if e.g. there is no current freeze.
*/
opal_call(OPAL_PCI_EEH_FREEZE_CLEAR, sc->phb_id, OPAL_PCI_DEFAULT_PE,
OPAL_EEH_ACTION_CLEAR_FREEZE_ALL);
/*
* OPAL stores 64-bit BARs in a special property rather than "ranges"
*/
if (OF_getencprop(ofw_bus_get_node(dev), "ibm,opal-m64-window",
m64window, sizeof(m64window)) == sizeof(m64window)) {
struct ofw_pci_range *rp;
sc->ofw_sc.sc_nrange++;
sc->ofw_sc.sc_range = realloc(sc->ofw_sc.sc_range,
sc->ofw_sc.sc_nrange * sizeof(sc->ofw_sc.sc_range[0]),
M_DEVBUF, M_WAITOK);
rp = &sc->ofw_sc.sc_range[sc->ofw_sc.sc_nrange-1];
rp->pci_hi = OFW_PCI_PHYS_HI_SPACE_MEM64 |
OFW_PCI_PHYS_HI_PREFETCHABLE;
rp->pci = ((uint64_t)m64window[0] << 32) | m64window[1];
rp->host = ((uint64_t)m64window[2] << 32) | m64window[3];
rp->size = ((uint64_t)m64window[4] << 32) | m64window[5];
rman_manage_region(&sc->ofw_sc.sc_mem_rman, rp->pci,
rp->pci + rp->size - 1);
}
return (ofw_pci_attach(dev));
}
static uint32_t
opalpci_read_config(device_t dev, u_int bus, u_int slot, u_int func, u_int reg,
int width)
{
struct opalpci_softc *sc;
uint64_t config_addr;
uint8_t byte;
uint16_t half;
uint32_t word;
int error;
sc = device_get_softc(dev);
config_addr = (bus << 8) | ((slot & 0x1f) << 3) | (func & 0x7);
switch (width) {
case 1:
error = opal_call(OPAL_PCI_CONFIG_READ_BYTE, sc->phb_id,
config_addr, reg, vtophys(&byte));
word = byte;
break;
case 2:
error = opal_call(OPAL_PCI_CONFIG_READ_HALF_WORD, sc->phb_id,
config_addr, reg, vtophys(&half));
word = half;
break;
case 4:
error = opal_call(OPAL_PCI_CONFIG_READ_WORD, sc->phb_id,
config_addr, reg, vtophys(&word));
break;
default:
word = 0xffffffff;
}
/*
* Poking config state for non-existant devices can make
* the host bridge hang up. Clear any errors.
*
* XXX: Make this conditional on the existence of a freeze
*/
opal_call(OPAL_PCI_EEH_FREEZE_CLEAR, sc->phb_id, OPAL_PCI_DEFAULT_PE,
OPAL_EEH_ACTION_CLEAR_FREEZE_ALL);
if (error != OPAL_SUCCESS)
word = 0xffffffff;
return (word);
}
static void
opalpci_write_config(device_t dev, u_int bus, u_int slot, u_int func,
u_int reg, uint32_t val, int width)
{
struct opalpci_softc *sc;
uint64_t config_addr;
int error = OPAL_SUCCESS;
sc = device_get_softc(dev);
config_addr = (bus << 8) | ((slot & 0x1f) << 3) | (func & 0x7);
switch (width) {
case 1:
error = opal_call(OPAL_PCI_CONFIG_WRITE_BYTE, sc->phb_id,
config_addr, reg, val);
break;
case 2:
error = opal_call(OPAL_PCI_CONFIG_WRITE_HALF_WORD, sc->phb_id,
config_addr, reg, val);
break;
case 4:
error = opal_call(OPAL_PCI_CONFIG_WRITE_WORD, sc->phb_id,
config_addr, reg, val);
break;
}
if (error != OPAL_SUCCESS) {
/*
* Poking config state for non-existant devices can make
* the host bridge hang up. Clear any errors.
*/
opal_call(OPAL_PCI_EEH_FREEZE_CLEAR, sc->phb_id,
OPAL_PCI_DEFAULT_PE, OPAL_EEH_ACTION_CLEAR_FREEZE_ALL);
}
}
static int
opalpci_route_interrupt(device_t bus, device_t dev, int pin)
{
return (pin);
}
static int
opalpci_alloc_msi(device_t dev, device_t child, int count, int maxcount,
int *irqs)
{
struct opalpci_softc *sc;
vmem_addr_t start;
phandle_t xref;
int err, i;
sc = device_get_softc(dev);
if (sc->msi_vmem == NULL)
return (ENODEV);
err = vmem_xalloc(sc->msi_vmem, count, powerof2(count), 0, 0,
VMEM_ADDR_MIN, VMEM_ADDR_MAX, M_BESTFIT | M_WAITOK, &start);
if (err)
return (err);
xref = OF_xref_from_node(ofw_bus_get_node(dev));
for (i = 0; i < count; i++)
irqs[i] = MAP_IRQ(xref, start + i);
return (0);
}
static int
opalpci_release_msi(device_t dev, device_t child, int count, int *irqs)
{
struct opalpci_softc *sc;
sc = device_get_softc(dev);
if (sc->msi_vmem == NULL)
return (ENODEV);
vmem_xfree(sc->msi_vmem, irqs[0] - sc->base_msi_irq, count);
return (0);
}
static int
opalpci_alloc_msix(device_t dev, device_t child, int *irq)
{
return (opalpci_alloc_msi(dev, child, 1, 1, irq));
}
static int
opalpci_release_msix(device_t dev, device_t child, int irq)
{
return (opalpci_release_msi(dev, child, 1, &irq));
}
static int
opalpci_map_msi(device_t dev, device_t child, int irq, uint64_t *addr,
uint32_t *data)
{
struct opalpci_softc *sc;
struct pci_devinfo *dinfo;
int err, xive;
sc = device_get_softc(dev);
if (sc->msi_vmem == NULL)
return (ENODEV);
xive = irq - sc->base_msi_irq - sc->msi_base;
opal_call(OPAL_PCI_SET_XIVE_PE, sc->phb_id, OPAL_PCI_DEFAULT_PE, xive);
dinfo = device_get_ivars(child);
if (dinfo->cfg.msi.msi_alloc > 0 &&
(dinfo->cfg.msi.msi_ctrl & PCIM_MSICTRL_64BIT) == 0) {
uint32_t msi32;
err = opal_call(OPAL_GET_MSI_32, sc->phb_id,
OPAL_PCI_DEFAULT_PE, xive, 1, vtophys(&msi32),
vtophys(data));
*addr = be32toh(msi32);
} else {
err = opal_call(OPAL_GET_MSI_64, sc->phb_id,
OPAL_PCI_DEFAULT_PE, xive, 1, vtophys(addr), vtophys(data));
*addr = be64toh(*addr);
}
*data = be32toh(*data);
if (bootverbose && err != 0)
device_printf(child, "OPAL MSI mapping error: %d\n", err);
return ((err == 0) ? 0 : ENXIO);
}
static void
opalpic_pic_enable(device_t dev, u_int irq, u_int vector)
{
PIC_ENABLE(root_pic, irq, vector);
}
static void opalpic_pic_eoi(device_t dev, u_int irq)
{
struct opalpci_softc *sc;
sc = device_get_softc(dev);
opal_call(OPAL_PCI_MSI_EOI, sc->phb_id, irq);
PIC_EOI(root_pic, irq);
}
static void opalpic_pic_mask(device_t dev, u_int irq)
{
PIC_MASK(root_pic, irq);
}
static void opalpic_pic_unmask(device_t dev, u_int irq)
{
PIC_UNMASK(root_pic, irq);
}