50c202c592
- Modules and kernel code alike may use DPCPU_DEFINE(), DPCPU_GET(), DPCPU_SET(), etc. akin to the statically defined PCPU_*. Requires only one extra instruction more than PCPU_* and is virtually the same as __thread for builtin and much faster for shared objects. DPCPU variables can be initialized when defined. - Modules are supported by relocating the module's per-cpu linker set over space reserved in the kernel. Modules may fail to load if there is insufficient space available. - Track space available for modules with a one-off extent allocator. Free may block for memory to allocate space for an extent. Reviewed by: jhb, rwatson, kan, sam, grehan, marius, marcel, stas
486 lines
14 KiB
C
486 lines
14 KiB
C
/* $NetBSD: hpc_machdep.c,v 1.70 2003/09/16 08:18:22 agc Exp $ */
|
|
|
|
/*-
|
|
* Copyright (c) 1994-1998 Mark Brinicombe.
|
|
* Copyright (c) 1994 Brini.
|
|
* All rights reserved.
|
|
*
|
|
* This code is derived from software written for Brini by Mark Brinicombe
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. All advertising materials mentioning features or use of this software
|
|
* must display the following acknowledgement:
|
|
* This product includes software developed by Brini.
|
|
* 4. The name of the company nor the name of the author may be used to
|
|
* endorse or promote products derived from this software without specific
|
|
* prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY BRINI ``AS IS'' AND ANY EXPRESS OR IMPLIED
|
|
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
|
|
* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
* IN NO EVENT SHALL BRINI OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT,
|
|
* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*
|
|
* RiscBSD kernel project
|
|
*
|
|
* machdep.c
|
|
*
|
|
* Machine dependant functions for kernel setup
|
|
*
|
|
* This file needs a lot of work.
|
|
*
|
|
* Created : 17/09/94
|
|
*/
|
|
|
|
#include "opt_msgbuf.h"
|
|
|
|
#include <sys/cdefs.h>
|
|
__FBSDID("$FreeBSD$");
|
|
|
|
#define _ARM32_BUS_DMA_PRIVATE
|
|
#include <sys/param.h>
|
|
#include <sys/systm.h>
|
|
#include <sys/sysproto.h>
|
|
#include <sys/signalvar.h>
|
|
#include <sys/imgact.h>
|
|
#include <sys/kernel.h>
|
|
#include <sys/ktr.h>
|
|
#include <sys/linker.h>
|
|
#include <sys/lock.h>
|
|
#include <sys/malloc.h>
|
|
#include <sys/mutex.h>
|
|
#include <sys/pcpu.h>
|
|
#include <sys/proc.h>
|
|
#include <sys/ptrace.h>
|
|
#include <sys/cons.h>
|
|
#include <sys/bio.h>
|
|
#include <sys/bus.h>
|
|
#include <sys/buf.h>
|
|
#include <sys/exec.h>
|
|
#include <sys/kdb.h>
|
|
#include <sys/msgbuf.h>
|
|
#include <machine/reg.h>
|
|
#include <machine/cpu.h>
|
|
|
|
#include <vm/vm.h>
|
|
#include <vm/pmap.h>
|
|
#include <vm/vm_object.h>
|
|
#include <vm/vm_page.h>
|
|
#include <vm/vm_pager.h>
|
|
#include <vm/vm_map.h>
|
|
#include <vm/vnode_pager.h>
|
|
#include <machine/pmap.h>
|
|
#include <machine/vmparam.h>
|
|
#include <machine/pcb.h>
|
|
#include <machine/undefined.h>
|
|
#include <machine/machdep.h>
|
|
#include <machine/metadata.h>
|
|
#include <machine/armreg.h>
|
|
#include <machine/bus.h>
|
|
#include <sys/reboot.h>
|
|
|
|
#include <arm/xscale/i80321/i80321reg.h>
|
|
#include <arm/xscale/i80321/i80321var.h>
|
|
#include <arm/xscale/i80321/iq80321reg.h>
|
|
#include <arm/xscale/i80321/obiovar.h>
|
|
|
|
#define KERNEL_PT_SYS 0 /* Page table for mapping proc0 zero page */
|
|
#define KERNEL_PT_IOPXS 1
|
|
#define KERNEL_PT_BEFOREKERN 2
|
|
#define KERNEL_PT_AFKERNEL 3 /* L2 table for mapping after kernel */
|
|
#define KERNEL_PT_AFKERNEL_NUM 9
|
|
|
|
/* this should be evenly divisable by PAGE_SIZE / L2_TABLE_SIZE_REAL (or 4) */
|
|
#define NUM_KERNEL_PTS (KERNEL_PT_AFKERNEL + KERNEL_PT_AFKERNEL_NUM)
|
|
|
|
/* Define various stack sizes in pages */
|
|
#define IRQ_STACK_SIZE 1
|
|
#define ABT_STACK_SIZE 1
|
|
#define UND_STACK_SIZE 1
|
|
|
|
extern u_int data_abort_handler_address;
|
|
extern u_int prefetch_abort_handler_address;
|
|
extern u_int undefined_handler_address;
|
|
|
|
struct pv_addr kernel_pt_table[NUM_KERNEL_PTS];
|
|
|
|
extern void *_end;
|
|
|
|
extern int *end;
|
|
|
|
struct pcpu __pcpu;
|
|
struct pcpu *pcpup = &__pcpu;
|
|
|
|
/* Physical and virtual addresses for some global pages */
|
|
|
|
vm_paddr_t phys_avail[10];
|
|
vm_paddr_t dump_avail[4];
|
|
vm_offset_t physical_pages;
|
|
|
|
struct pv_addr systempage;
|
|
struct pv_addr msgbufpv;
|
|
struct pv_addr irqstack;
|
|
struct pv_addr undstack;
|
|
struct pv_addr abtstack;
|
|
struct pv_addr kernelstack;
|
|
struct pv_addr minidataclean;
|
|
|
|
static struct trapframe proc0_tf;
|
|
|
|
#define IQ80321_OBIO_BASE 0xfe800000UL
|
|
#define IQ80321_OBIO_SIZE 0x00100000UL
|
|
/* Static device mappings. */
|
|
static const struct pmap_devmap iq80321_devmap[] = {
|
|
/*
|
|
* Map the on-board devices VA == PA so that we can access them
|
|
* with the MMU on or off.
|
|
*/
|
|
{
|
|
IQ80321_OBIO_BASE,
|
|
IQ80321_OBIO_BASE,
|
|
IQ80321_OBIO_SIZE,
|
|
VM_PROT_READ|VM_PROT_WRITE,
|
|
PTE_NOCACHE,
|
|
},
|
|
{
|
|
IQ80321_IOW_VBASE,
|
|
VERDE_OUT_XLATE_IO_WIN0_BASE,
|
|
VERDE_OUT_XLATE_IO_WIN_SIZE,
|
|
VM_PROT_READ|VM_PROT_WRITE,
|
|
PTE_NOCACHE,
|
|
},
|
|
|
|
{
|
|
IQ80321_80321_VBASE,
|
|
VERDE_PMMR_BASE,
|
|
VERDE_PMMR_SIZE,
|
|
VM_PROT_READ|VM_PROT_WRITE,
|
|
PTE_NOCACHE,
|
|
},
|
|
{
|
|
0,
|
|
0,
|
|
0,
|
|
0,
|
|
0,
|
|
}
|
|
};
|
|
|
|
#define SDRAM_START 0xa0000000
|
|
|
|
extern vm_offset_t xscale_cache_clean_addr;
|
|
|
|
void *
|
|
initarm(void *arg, void *arg2)
|
|
{
|
|
struct pv_addr kernel_l1pt;
|
|
struct pv_addr dpcpu;
|
|
int loop, i;
|
|
u_int l1pagetable;
|
|
vm_offset_t freemempos;
|
|
vm_offset_t freemem_pt;
|
|
vm_offset_t afterkern;
|
|
vm_offset_t freemem_after;
|
|
vm_offset_t lastaddr;
|
|
uint32_t memsize, memstart;
|
|
|
|
set_cpufuncs();
|
|
lastaddr = fake_preload_metadata();
|
|
pcpu_init(pcpup, 0, sizeof(struct pcpu));
|
|
PCPU_SET(curthread, &thread0);
|
|
|
|
freemempos = 0xa0200000;
|
|
/* Define a macro to simplify memory allocation */
|
|
#define valloc_pages(var, np) \
|
|
alloc_pages((var).pv_pa, (np)); \
|
|
(var).pv_va = (var).pv_pa + 0x20000000;
|
|
|
|
#define alloc_pages(var, np) \
|
|
freemempos -= (np * PAGE_SIZE); \
|
|
(var) = freemempos; \
|
|
memset((char *)(var), 0, ((np) * PAGE_SIZE));
|
|
|
|
while (((freemempos - L1_TABLE_SIZE) & (L1_TABLE_SIZE - 1)) != 0)
|
|
freemempos -= PAGE_SIZE;
|
|
valloc_pages(kernel_l1pt, L1_TABLE_SIZE / PAGE_SIZE);
|
|
for (loop = 0; loop < NUM_KERNEL_PTS; ++loop) {
|
|
if (!(loop % (PAGE_SIZE / L2_TABLE_SIZE_REAL))) {
|
|
valloc_pages(kernel_pt_table[loop],
|
|
L2_TABLE_SIZE / PAGE_SIZE);
|
|
} else {
|
|
kernel_pt_table[loop].pv_pa = freemempos +
|
|
(loop % (PAGE_SIZE / L2_TABLE_SIZE_REAL)) *
|
|
L2_TABLE_SIZE_REAL;
|
|
kernel_pt_table[loop].pv_va =
|
|
kernel_pt_table[loop].pv_pa + 0x20000000;
|
|
}
|
|
}
|
|
freemem_pt = freemempos;
|
|
freemempos = 0xa0100000;
|
|
/*
|
|
* Allocate a page for the system page mapped to V0x00000000
|
|
* This page will just contain the system vectors and can be
|
|
* shared by all processes.
|
|
*/
|
|
valloc_pages(systempage, 1);
|
|
|
|
/* Allocate dynamic per-cpu area. */
|
|
valloc_pages(dpcpu, DPCPU_SIZE / PAGE_SIZE);
|
|
dpcpu_init((void *)dpcpu.pv_va, 0);
|
|
|
|
/* Allocate stacks for all modes */
|
|
valloc_pages(irqstack, IRQ_STACK_SIZE);
|
|
valloc_pages(abtstack, ABT_STACK_SIZE);
|
|
valloc_pages(undstack, UND_STACK_SIZE);
|
|
valloc_pages(kernelstack, KSTACK_PAGES);
|
|
alloc_pages(minidataclean.pv_pa, 1);
|
|
valloc_pages(msgbufpv, round_page(MSGBUF_SIZE) / PAGE_SIZE);
|
|
#ifdef ARM_USE_SMALL_ALLOC
|
|
freemempos -= PAGE_SIZE;
|
|
freemem_pt = trunc_page(freemem_pt);
|
|
freemem_after = freemempos - ((freemem_pt - 0xa0100000) /
|
|
PAGE_SIZE) * sizeof(struct arm_small_page);
|
|
arm_add_smallalloc_pages((void *)(freemem_after + 0x20000000)
|
|
, (void *)0xc0100000, freemem_pt - 0xa0100000, 1);
|
|
freemem_after -= ((freemem_after - 0xa0001000) / PAGE_SIZE) *
|
|
sizeof(struct arm_small_page);
|
|
arm_add_smallalloc_pages((void *)(freemem_after + 0x20000000)
|
|
, (void *)0xc0001000, trunc_page(freemem_after) - 0xa0001000, 0);
|
|
freemempos = trunc_page(freemem_after);
|
|
freemempos -= PAGE_SIZE;
|
|
#endif
|
|
/*
|
|
* Allocate memory for the l1 and l2 page tables. The scheme to avoid
|
|
* wasting memory by allocating the l1pt on the first 16k memory was
|
|
* taken from NetBSD rpc_machdep.c. NKPT should be greater than 12 for
|
|
* this to work (which is supposed to be the case).
|
|
*/
|
|
|
|
/*
|
|
* Now we start construction of the L1 page table
|
|
* We start by mapping the L2 page tables into the L1.
|
|
* This means that we can replace L1 mappings later on if necessary
|
|
*/
|
|
l1pagetable = kernel_l1pt.pv_va;
|
|
|
|
/* Map the L2 pages tables in the L1 page table */
|
|
pmap_link_l2pt(l1pagetable, ARM_VECTORS_HIGH & ~(0x00100000 - 1),
|
|
&kernel_pt_table[KERNEL_PT_SYS]);
|
|
pmap_link_l2pt(l1pagetable, IQ80321_IOPXS_VBASE,
|
|
&kernel_pt_table[KERNEL_PT_IOPXS]);
|
|
pmap_link_l2pt(l1pagetable, KERNBASE,
|
|
&kernel_pt_table[KERNEL_PT_BEFOREKERN]);
|
|
pmap_map_chunk(l1pagetable, KERNBASE, SDRAM_START, 0x100000,
|
|
VM_PROT_READ|VM_PROT_WRITE, PTE_CACHE);
|
|
pmap_map_chunk(l1pagetable, KERNBASE + 0x100000, SDRAM_START + 0x100000,
|
|
0x100000, VM_PROT_READ|VM_PROT_WRITE, PTE_PAGETABLE);
|
|
pmap_map_chunk(l1pagetable, KERNBASE + 0x200000, SDRAM_START + 0x200000,
|
|
(((uint32_t)(lastaddr) - KERNBASE - 0x200000) + L1_S_SIZE) & ~(L1_S_SIZE - 1),
|
|
VM_PROT_READ|VM_PROT_WRITE, PTE_CACHE);
|
|
freemem_after = ((int)lastaddr + PAGE_SIZE) & ~(PAGE_SIZE - 1);
|
|
afterkern = round_page(((vm_offset_t)lastaddr + L1_S_SIZE) & ~(L1_S_SIZE
|
|
- 1));
|
|
for (i = 0; i < KERNEL_PT_AFKERNEL_NUM; i++) {
|
|
pmap_link_l2pt(l1pagetable, afterkern + i * 0x00100000,
|
|
&kernel_pt_table[KERNEL_PT_AFKERNEL + i]);
|
|
}
|
|
pmap_map_entry(l1pagetable, afterkern, minidataclean.pv_pa,
|
|
VM_PROT_READ|VM_PROT_WRITE, PTE_CACHE);
|
|
|
|
|
|
#ifdef ARM_USE_SMALL_ALLOC
|
|
if ((freemem_after + 2 * PAGE_SIZE) <= afterkern) {
|
|
arm_add_smallalloc_pages((void *)(freemem_after),
|
|
(void*)(freemem_after + PAGE_SIZE),
|
|
afterkern - (freemem_after + PAGE_SIZE), 0);
|
|
|
|
}
|
|
#endif
|
|
|
|
/* Map the Mini-Data cache clean area. */
|
|
xscale_setup_minidata(l1pagetable, afterkern,
|
|
minidataclean.pv_pa);
|
|
|
|
/* Map the vector page. */
|
|
pmap_map_entry(l1pagetable, ARM_VECTORS_HIGH, systempage.pv_pa,
|
|
VM_PROT_READ|VM_PROT_WRITE, PTE_CACHE);
|
|
pmap_devmap_bootstrap(l1pagetable, iq80321_devmap);
|
|
/*
|
|
* Give the XScale global cache clean code an appropriately
|
|
* sized chunk of unmapped VA space starting at 0xff000000
|
|
* (our device mappings end before this address).
|
|
*/
|
|
xscale_cache_clean_addr = 0xff000000U;
|
|
|
|
cpu_domains((DOMAIN_CLIENT << (PMAP_DOMAIN_KERNEL*2)) | DOMAIN_CLIENT);
|
|
setttb(kernel_l1pt.pv_pa);
|
|
cpu_tlb_flushID();
|
|
cpu_domains(DOMAIN_CLIENT << (PMAP_DOMAIN_KERNEL*2));
|
|
/*
|
|
* Pages were allocated during the secondary bootstrap for the
|
|
* stacks for different CPU modes.
|
|
* We must now set the r13 registers in the different CPU modes to
|
|
* point to these stacks.
|
|
* Since the ARM stacks use STMFD etc. we must set r13 to the top end
|
|
* of the stack memory.
|
|
*/
|
|
|
|
|
|
set_stackptr(PSR_IRQ32_MODE,
|
|
irqstack.pv_va + IRQ_STACK_SIZE * PAGE_SIZE);
|
|
set_stackptr(PSR_ABT32_MODE,
|
|
abtstack.pv_va + ABT_STACK_SIZE * PAGE_SIZE);
|
|
set_stackptr(PSR_UND32_MODE,
|
|
undstack.pv_va + UND_STACK_SIZE * PAGE_SIZE);
|
|
|
|
|
|
|
|
/*
|
|
* We must now clean the cache again....
|
|
* Cleaning may be done by reading new data to displace any
|
|
* dirty data in the cache. This will have happened in setttb()
|
|
* but since we are boot strapping the addresses used for the read
|
|
* may have just been remapped and thus the cache could be out
|
|
* of sync. A re-clean after the switch will cure this.
|
|
* After booting there are no gross relocations of the kernel thus
|
|
* this problem will not occur after initarm().
|
|
*/
|
|
cpu_idcache_wbinv_all();
|
|
/*
|
|
* Fetch the SDRAM start/size from the i80321 SDRAM configration
|
|
* registers.
|
|
*/
|
|
i80321_calibrate_delay();
|
|
i80321_sdram_bounds(&obio_bs_tag, IQ80321_80321_VBASE + VERDE_MCU_BASE,
|
|
&memstart, &memsize);
|
|
physmem = memsize / PAGE_SIZE;
|
|
cninit();
|
|
|
|
/* Set stack for exception handlers */
|
|
|
|
data_abort_handler_address = (u_int)data_abort_handler;
|
|
prefetch_abort_handler_address = (u_int)prefetch_abort_handler;
|
|
undefined_handler_address = (u_int)undefinedinstruction_bounce;
|
|
undefined_init();
|
|
|
|
proc_linkup0(&proc0, &thread0);
|
|
thread0.td_kstack = kernelstack.pv_va;
|
|
thread0.td_pcb = (struct pcb *)
|
|
(thread0.td_kstack + KSTACK_PAGES * PAGE_SIZE) - 1;
|
|
thread0.td_pcb->pcb_flags = 0;
|
|
thread0.td_frame = &proc0_tf;
|
|
pcpup->pc_curpcb = thread0.td_pcb;
|
|
|
|
/* Enable MMU, I-cache, D-cache, write buffer. */
|
|
|
|
arm_vector_init(ARM_VECTORS_HIGH, ARM_VEC_ALL);
|
|
|
|
|
|
|
|
pmap_curmaxkvaddr = afterkern + PAGE_SIZE;
|
|
/*
|
|
* ARM_USE_SMALL_ALLOC uses dump_avail, so it must be filled before
|
|
* calling pmap_bootstrap.
|
|
*/
|
|
dump_avail[0] = 0xa0000000;
|
|
dump_avail[1] = 0xa0000000 + memsize;
|
|
dump_avail[2] = 0;
|
|
dump_avail[3] = 0;
|
|
|
|
pmap_bootstrap(pmap_curmaxkvaddr,
|
|
0xd0000000, &kernel_l1pt);
|
|
msgbufp = (void*)msgbufpv.pv_va;
|
|
msgbufinit(msgbufp, MSGBUF_SIZE);
|
|
mutex_init();
|
|
|
|
i = 0;
|
|
#ifdef ARM_USE_SMALL_ALLOC
|
|
phys_avail[i++] = 0xa0000000;
|
|
phys_avail[i++] = 0xa0001000; /*
|
|
*XXX: Gross hack to get our
|
|
* pages in the vm_page_array
|
|
. */
|
|
#endif
|
|
phys_avail[i++] = round_page(virtual_avail - KERNBASE + SDRAM_START);
|
|
phys_avail[i++] = trunc_page(0xa0000000 + memsize - 1);
|
|
phys_avail[i++] = 0;
|
|
phys_avail[i] = 0;
|
|
|
|
/* Do basic tuning, hz etc */
|
|
init_param1();
|
|
init_param2(physmem);
|
|
kdb_init();
|
|
return ((void *)(kernelstack.pv_va + USPACE_SVC_STACK_TOP -
|
|
sizeof(struct pcb)));
|
|
}
|
|
|
|
|
|
extern int
|
|
machdep_pci_route_interrupt(device_t pcib, device_t dev, int pin)
|
|
{
|
|
int bus;
|
|
int device;
|
|
int func;
|
|
uint32_t busno;
|
|
struct i80321_pci_softc *sc = device_get_softc(pcib);
|
|
bus = pci_get_bus(dev);
|
|
device = pci_get_slot(dev);
|
|
func = pci_get_function(dev);
|
|
busno = bus_space_read_4(sc->sc_st, sc->sc_atu_sh, ATU_PCIXSR);
|
|
busno = PCIXSR_BUSNO(busno);
|
|
if (busno == 0xff)
|
|
busno = 0;
|
|
if (bus != busno)
|
|
goto no_mapping;
|
|
switch (device) {
|
|
/* IQ31244 PCI */
|
|
case 1: /* PCIX-PCIX bridge */
|
|
/*
|
|
* The S-ATA chips are behind the bridge, and all of
|
|
* the S-ATA interrupts are wired together.
|
|
*/
|
|
return (ICU_INT_XINT(2));
|
|
case 2: /* PCI slot */
|
|
/* All pins are wired together. */
|
|
return (ICU_INT_XINT(3));
|
|
case 3: /* i82546 dual Gig-E */
|
|
if (pin == 1 || pin == 2)
|
|
return (ICU_INT_XINT(0));
|
|
goto no_mapping;
|
|
/* IQ80321 PCI */
|
|
case 4: /* i82544 Gig-E */
|
|
case 8: /*
|
|
* Apparently you can set the device for the ethernet adapter
|
|
* to 8 with a jumper, so handle that as well
|
|
*/
|
|
if (pin == 1)
|
|
return (ICU_INT_XINT(0));
|
|
goto no_mapping;
|
|
case 6: /* S-PCI-X slot */
|
|
if (pin == 1)
|
|
return (ICU_INT_XINT(2));
|
|
if (pin == 2)
|
|
return (ICU_INT_XINT(3));
|
|
goto no_mapping;
|
|
default:
|
|
no_mapping:
|
|
printf("No mapping for %d/%d/%d/%c\n", bus, device, func, pin);
|
|
|
|
}
|
|
return (0);
|
|
|
|
}
|