ab0db651af
The x86-64 doesn't just add two levels to page tables to support 64 bit addresses, but is a different processor. For example, calling conventions, system calls, and segmentation are different from 32-bit x86. Segmentation is basically gone, but gs/fs in combination with MSRs can be used to hold a per-core pointer. In general, x86-64 is more straightforward than 32-bit x86. The port uses code from sv6 and the xv6 "rsc-amd64" branch. A summary of the changes is as follows: - Booting: switch to grub instead of xv6's bootloader (pass -kernel to qemu), because xv6's boot loader doesn't understand 64bit ELF files. And, we don't care anymore about booting. - Makefile: use -m64 instead of -m32 flag for gcc, delete boot loader, xv6.img, bochs, and memfs. For now dont' use -O2, since usertests with -O2 is bigger than MAXFILE! - Update gdb.tmpl to be for i386 or x86-64 - Console/printf: use stdarg.h and treat 64-bit addresses different from ints (32-bit) - Update elfhdr to be 64 bit - entry.S/entryother.S: add code to switch to 64-bit mode: build a simple page table in 32-bit mode before switching to 64-bit mode, share code for entering boot processor and APs, and tweak boot gdt. The boot gdt is the gdt that the kernel proper also uses. (In 64-bit mode, the gdt/segmentation and task state mostly disappear.) - exec.c: fix passing argv (64-bit now instead of 32-bit). - initcode.c: use syscall instead of int. - kernel.ld: load kernel very high, in top terabyte. 64 bits is a lot of address space! - proc.c: initial return is through new syscall path instead of trapret. - proc.h: update struct cpu to have some scratch space since syscall saves less state than int, update struct context to reflect x86-64 calling conventions. - swtch: simplify for x86-64 calling conventions. - syscall: add fetcharg to handle x86-64 calling convetions (6 arguments are passed through registers), and fetchaddr to read a 64-bit value from user space. - sysfile: update to handle pointers from user space (e.g., sys_exec), which are 64 bits. - trap.c: no special trap vector for sys calls, because x86-64 has a different plan for system calls. - trapasm: one plan for syscalls and one plan for traps (interrupt and exceptions). On x86-64, the kernel is responsible for switching user/kernel stacks. To do, xv6 keeps some scratch space in the cpu structure, and uses MSR GS_KERN_BASE to point to the core's cpu structure (using swapgs). - types.h: add uint64, and change pde_t to uint64 - usertests: exit() when fork fails, which helped in tracking down one of the bugs in the switch from 32-bit to 64-bit - vectors: update to make them 64 bits - vm.c: use bootgdt in kernel too, program MSRs for syscalls and core-local state (for swapgs), walk 4 levels in walkpgdir, add DEVSPACETOP, use task segment to set kernel stack for interrupts (but simpler than in 32-bit mode), add an extra argument to freevm (size of user part of address space) to avoid checking all entries till KERNBASE (there are MANY TB before the top 1TB). - x86: update trapframe to have 64-bit entries, which is what the processor pushes on syscalls and traps. simplify lgdt and lidt, using struct desctr, which needs the gcc directives packed and aligned. TODO: - use int32 instead of int? - simplify curproc(). xv6 has per-cpu state again, but this time it must have it. - avoid repetition in walkpgdir - fix validateint() in usertests.c - fix bugs (e.g., observed one a case of entering kernel with invalid gs or proc
139 lines
3.1 KiB
C
139 lines
3.1 KiB
C
// Multiprocessor support
|
|
// Search memory for MP description structures.
|
|
// http://developer.intel.com/design/pentium/datashts/24201606.pdf
|
|
|
|
#include "types.h"
|
|
#include "defs.h"
|
|
#include "param.h"
|
|
#include "memlayout.h"
|
|
#include "mp.h"
|
|
#include "x86.h"
|
|
#include "mmu.h"
|
|
#include "proc.h"
|
|
|
|
struct cpu cpus[NCPU];
|
|
int ncpu;
|
|
uchar ioapicid;
|
|
|
|
static uchar
|
|
sum(uchar *addr, int len)
|
|
{
|
|
int i, sum;
|
|
|
|
sum = 0;
|
|
for(i=0; i<len; i++)
|
|
sum += addr[i];
|
|
return sum;
|
|
}
|
|
|
|
// Look for an MP structure in the len bytes at addr.
|
|
static struct mp*
|
|
mpsearch1(uint64 a, int len)
|
|
{
|
|
uchar *e, *p, *addr;
|
|
|
|
addr = P2V(a);
|
|
e = addr+len;
|
|
for(p = addr; p < e; p += sizeof(struct mp))
|
|
if(memcmp(p, "_MP_", 4) == 0 && sum(p, sizeof(struct mp)) == 0)
|
|
return (struct mp*)p;
|
|
return 0;
|
|
}
|
|
|
|
// Search for the MP Floating Pointer Structure, which according to the
|
|
// spec is in one of the following three locations:
|
|
// 1) in the first KB of the EBDA;
|
|
// 2) in the last KB of system base memory;
|
|
// 3) in the BIOS ROM between 0xE0000 and 0xFFFFF.
|
|
static struct mp*
|
|
mpsearch(void)
|
|
{
|
|
uchar *bda;
|
|
uint p;
|
|
struct mp *mp;
|
|
|
|
bda = (uchar *) P2V(0x400);
|
|
if((p = ((bda[0x0F]<<8)| bda[0x0E]) << 4)){
|
|
if((mp = mpsearch1(p, 1024)))
|
|
return mp;
|
|
} else {
|
|
p = ((bda[0x14]<<8)|bda[0x13])*1024;
|
|
if((mp = mpsearch1(p-1024, 1024)))
|
|
return mp;
|
|
}
|
|
return mpsearch1(0xF0000, 0x10000);
|
|
}
|
|
|
|
// Search for an MP configuration table. For now,
|
|
// don't accept the default configurations (physaddr == 0).
|
|
// Check for correct signature, calculate the checksum and,
|
|
// if correct, check the version.
|
|
// To do: check extended table checksum.
|
|
static struct mpconf*
|
|
mpconfig(struct mp **pmp)
|
|
{
|
|
struct mpconf *conf;
|
|
struct mp *mp;
|
|
|
|
if((mp = mpsearch()) == 0 || mp->physaddr == 0)
|
|
return 0;
|
|
conf = (struct mpconf*) P2V((uint64) mp->physaddr);
|
|
if(memcmp(conf, "PCMP", 4) != 0)
|
|
return 0;
|
|
if(conf->version != 1 && conf->version != 4)
|
|
return 0;
|
|
if(sum((uchar*)conf, conf->length) != 0)
|
|
return 0;
|
|
*pmp = mp;
|
|
return conf;
|
|
}
|
|
|
|
void
|
|
mpinit(void)
|
|
{
|
|
uchar *p, *e;
|
|
int ismp;
|
|
struct mp *mp;
|
|
struct mpconf *conf;
|
|
struct mpproc *proc;
|
|
struct mpioapic *ioapic;
|
|
|
|
if((conf = mpconfig(&mp)) == 0)
|
|
panic("Expect to run on an SMP");
|
|
ismp = 1;
|
|
lapic = P2V((uint64)conf->lapicaddr_p);
|
|
for(p=(uchar*)(conf+1), e=(uchar*)conf+conf->length; p<e; ){
|
|
switch(*p){
|
|
case MPPROC:
|
|
proc = (struct mpproc*)p;
|
|
if(ncpu < NCPU) {
|
|
cpus[ncpu].apicid = proc->apicid; // apicid may differ from ncpu
|
|
ncpu++;
|
|
}
|
|
p += sizeof(struct mpproc);
|
|
continue;
|
|
case MPIOAPIC:
|
|
ioapic = (struct mpioapic*)p;
|
|
ioapicid = ioapic->apicno;
|
|
p += sizeof(struct mpioapic);
|
|
continue;
|
|
case MPBUS:
|
|
case MPIOINTR:
|
|
case MPLINTR:
|
|
p += 8;
|
|
continue;
|
|
default:
|
|
ismp = 0;
|
|
break;
|
|
}
|
|
}
|
|
if(!ismp)
|
|
panic("Didn't find a suitable machine");
|
|
|
|
if(mp->imcrp){
|
|
// Bochs doesn't support IMCR, so this doesn't run on Bochs.
|
|
// But it would on real hardware.
|
|
outb(0x22, 0x70); // Select IMCR
|
|
outb(0x23, inb(0x23) | 1); // Mask external interrupts.
|
|
}
|
|
}
|