- We only lock the local per-CPU page in the local dTLB, so accessing the
foreign per-CPU pages in cpu_ipi_send() in order to get the module IDs of the other CPUs can cause a page fault. If this happens when doing a TLB shootdown while dealing with another page fault this causes a panic due to the recursive page fault. As I don't spot other code that assumes or requires that accessing foreign per-CPU pages must not page fault solve this by adding a statically allocated (and therefore locked in the kernel pages) array which establishes a FreeBSD CPU ID -> module ID relation and use that in cpu_ipi_selected() (instead of statically allocating the per-CPU pages which would just waste memory on say a dual CPU machine as sun4u theoretically supports up to 128 CPUs or wasting dTLB slots for the foreign per-CPU pages). [1] - Fix a potential race in cpu_ipi_send(); as we don't serialize the access to cpu_ipi_selected() between MI and MD use (only MI-MI and MD-MD) we might catch the NACK bit caused by sending another IPI. Solve this by checking the NACK bit in the contents of the interrupt dispatch status reg read while interrupts were still turned off instead of reading that reg anew after interrupts were turned on again. This is also what the CPU docs suggest to do. - Add a workaround for the SpitFire erratum #54 bug (affecting interrupt dispatch). While public info regarding what this CPU bug actually causes is not available testing shows that with the workaround in place it's less likely to get a "couldn't send ipi" panic, it doesn't solve these panics entirely though. [2] Reported by: kris [1] Some clue from: kmacy [1] Info from: Linux, OpenSolaris [2] Additional testing by: kris MFC after: 3 days
This commit is contained in:
parent
98a829e8ea
commit
ea86aa3726
@ -108,6 +108,7 @@ vm_offset_t mp_tramp;
|
||||
|
||||
u_int mp_boot_mid;
|
||||
|
||||
static u_int cpuid_to_mid[MAXCPU];
|
||||
static volatile u_int shutdown_cpus;
|
||||
|
||||
void cpu_mp_unleash(void *);
|
||||
@ -238,6 +239,8 @@ cpu_mp_start(void)
|
||||
-1, NULL, NULL);
|
||||
intr_setup(PIL_STOP, cpu_ipi_stop, -1, NULL, NULL);
|
||||
|
||||
cpuid_to_mid[PCPU_GET(cpuid)] = mp_boot_mid;
|
||||
|
||||
root = OF_peer(0);
|
||||
csa = &cpu_start_args;
|
||||
for (child = OF_child(root); child != 0; child = OF_peer(child)) {
|
||||
@ -266,6 +269,7 @@ cpu_mp_start(void)
|
||||
intr_restore(s);
|
||||
|
||||
cpuid = mp_ncpus++;
|
||||
cpuid_to_mid[cpuid] = mid;
|
||||
cpu_identify(csa->csa_ver, clock, cpuid);
|
||||
|
||||
va = kmem_alloc(kernel_map, PCPU_PAGES * PAGE_SIZE);
|
||||
@ -413,20 +417,19 @@ cpu_ipi_stop(struct trapframe *tf)
|
||||
void
|
||||
cpu_ipi_selected(u_int cpus, u_long d0, u_long d1, u_long d2)
|
||||
{
|
||||
struct pcpu *pc;
|
||||
u_int cpu;
|
||||
|
||||
while (cpus) {
|
||||
cpu = ffs(cpus) - 1;
|
||||
cpus &= ~(1 << cpu);
|
||||
pc = pcpu_find(cpu);
|
||||
cpu_ipi_send(pc->pc_mid, d0, d1, d2);
|
||||
cpu_ipi_send(cpuid_to_mid[cpu], d0, d1, d2);
|
||||
}
|
||||
}
|
||||
|
||||
void
|
||||
cpu_ipi_send(u_int mid, u_long d0, u_long d1, u_long d2)
|
||||
{
|
||||
u_long ids;
|
||||
u_long s;
|
||||
int i;
|
||||
|
||||
@ -438,11 +441,20 @@ cpu_ipi_send(u_int mid, u_long d0, u_long d1, u_long d2)
|
||||
stxa(AA_SDB_INTR_D1, ASI_SDB_INTR_W, d1);
|
||||
stxa(AA_SDB_INTR_D2, ASI_SDB_INTR_W, d2);
|
||||
stxa(AA_INTR_SEND | (mid << 14), ASI_SDB_INTR_W, 0);
|
||||
/*
|
||||
* Workaround for SpitFire erratum #54; do a dummy read
|
||||
* from a SDB internal register before the MEMBAR #Sync
|
||||
* for the write to ASI_SDB_INTR_W (requiring another
|
||||
* MEMBAR #Sync in order to make sure the write has
|
||||
* occurred before the load).
|
||||
*/
|
||||
membar(Sync);
|
||||
while (ldxa(0, ASI_INTR_DISPATCH_STATUS) & IDR_BUSY)
|
||||
(void)ldxa(AA_SDB_CNTL_HIGH, ASI_SDB_CONTROL_R);
|
||||
membar(Sync);
|
||||
while ((ids = ldxa(0, ASI_INTR_DISPATCH_STATUS)) & IDR_BUSY)
|
||||
;
|
||||
intr_restore(s);
|
||||
if ((ldxa(0, ASI_INTR_DISPATCH_STATUS) & IDR_NACK) == 0)
|
||||
if ((ids & IDR_NACK) == 0)
|
||||
return;
|
||||
}
|
||||
if (
|
||||
|
Loading…
x
Reference in New Issue
Block a user