xv6-riscv-kernel/sysfile.c

456 lines
7.4 KiB
C
Raw Normal View History

//
// File-system system calls.
// Mostly argument checking, since we don't trust
// user code, and calls into file.c and fs.c.
//
#include "types.h"
#include "riscv.h"
2007-08-28 01:26:33 +02:00
#include "defs.h"
#include "param.h"
2007-08-28 01:26:33 +02:00
#include "stat.h"
#include "proc.h"
#include "fs.h"
2016-09-12 02:59:57 +02:00
#include "spinlock.h"
#include "sleeplock.h"
2006-09-06 20:40:28 +02:00
#include "file.h"
#include "fcntl.h"
2006-09-07 16:13:26 +02:00
// Fetch the nth word-sized system call argument as a file descriptor
// and return both the descriptor and the corresponding struct file.
static int
2007-08-28 01:53:17 +02:00
argfd(int n, int *pfd, struct file **pf)
{
2006-09-07 16:13:26 +02:00
int fd;
struct file *f;
2007-08-28 01:53:17 +02:00
if(argint(n, &fd) < 0)
2006-09-07 16:13:26 +02:00
return -1;
if(fd < 0 || fd >= NOFILE || (f=myproc()->ofile[fd]) == 0)
2006-09-07 16:13:26 +02:00
return -1;
if(pfd)
*pfd = fd;
if(pf)
*pf = f;
return 0;
2006-09-07 16:13:26 +02:00
}
2006-09-07 16:13:26 +02:00
// Allocate a file descriptor for the given file.
// Takes over file reference from caller on success.
static int
fdalloc(struct file *f)
{
int fd;
2019-05-31 15:45:59 +02:00
struct proc *p = myproc();
2007-08-09 19:32:40 +02:00
2006-09-07 16:13:26 +02:00
for(fd = 0; fd < NOFILE; fd++){
2019-05-31 15:45:59 +02:00
if(p->ofile[fd] == 0){
p->ofile[fd] = f;
2006-09-07 16:13:26 +02:00
return fd;
}
}
return -1;
}
2009-07-12 04:26:01 +02:00
int
sys_dup(void)
{
struct file *f;
int fd;
2015-09-27 05:10:25 +02:00
2009-07-12 04:26:01 +02:00
if(argfd(0, 0, &f) < 0)
return -1;
if((fd=fdalloc(f)) < 0)
return -1;
filedup(f);
return fd;
}
int
sys_read(void)
{
struct file *f;
int n;
char *p;
if(argfd(0, 0, &f) < 0 || argint(2, &n) < 0 || argptr(1, &p, n) < 0)
return -1;
return fileread(f, p, n);
2006-09-07 16:13:26 +02:00
}
int
sys_write(void)
{
struct file *f;
int n;
char *p;
if(argfd(0, 0, &f) < 0 || argint(2, &n) < 0 || argptr(1, &p, n) < 0)
2006-09-07 16:13:26 +02:00
return -1;
return filewrite(f, p, n);
}
int
sys_close(void)
{
int fd;
2006-09-07 16:13:26 +02:00
struct file *f;
2015-09-27 05:10:25 +02:00
2006-09-07 16:13:26 +02:00
if(argfd(0, &fd, &f) < 0)
return -1;
myproc()->ofile[fd] = 0;
2006-09-07 16:13:26 +02:00
fileclose(f);
return 0;
}
2007-08-25 00:17:54 +02:00
int
sys_fstat(void)
{
struct file *f;
struct stat *st;
2015-09-27 05:10:25 +02:00
2007-08-25 00:17:54 +02:00
if(argfd(0, 0, &f) < 0 || argptr(1, (void*)&st, sizeof(*st)) < 0)
return -1;
return filestat(f, st);
}
// Create the path new as a link to the same inode as old.
int
sys_link(void)
{
char name[DIRSIZ], *new, *old;
struct inode *dp, *ip;
if(argstr(0, &old) < 0 || argstr(1, &new) < 0)
return -1;
2014-08-27 23:15:30 +02:00
begin_op();
if((ip = namei(old)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
ilock(ip);
if(ip->type == T_DIR){
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
ip->nlink++;
iupdate(ip);
iunlock(ip);
if((dp = nameiparent(new, name)) == 0)
2009-05-31 04:07:51 +02:00
goto bad;
ilock(dp);
2009-05-31 04:07:51 +02:00
if(dp->dev != ip->dev || dirlink(dp, name, ip->inum) < 0){
iunlockput(dp);
goto bad;
2009-05-31 04:07:51 +02:00
}
iunlockput(dp);
iput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return 0;
bad:
ilock(ip);
ip->nlink--;
iupdate(ip);
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
// Is the directory dp empty except for "." and ".." ?
static int
isdirempty(struct inode *dp)
{
int off;
struct dirent de;
for(off=2*sizeof(de); off<dp->size; off+=sizeof(de)){
if(readi(dp, (char*)&de, off, sizeof(de)) != sizeof(de))
panic("isdirempty: readi");
if(de.inum != 0)
return 0;
}
return 1;
}
2007-08-25 00:17:54 +02:00
//PAGEBREAK!
int
sys_unlink(void)
{
struct inode *ip, *dp;
struct dirent de;
char name[DIRSIZ], *path;
uint off;
if(argstr(0, &path) < 0)
return -1;
2014-08-27 23:15:30 +02:00
begin_op();
if((dp = nameiparent(path, name)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
ilock(dp);
// Cannot unlink "." or "..".
if(namecmp(name, ".") == 0 || namecmp(name, "..") == 0)
goto bad;
if((ip = dirlookup(dp, name, &off)) == 0)
goto bad;
ilock(ip);
if(ip->nlink < 1)
panic("unlink: nlink < 1");
if(ip->type == T_DIR && !isdirempty(ip)){
iunlockput(ip);
goto bad;
}
memset(&de, 0, sizeof(de));
if(writei(dp, (char*)&de, off, sizeof(de)) != sizeof(de))
panic("unlink: writei");
if(ip->type == T_DIR){
dp->nlink--;
iupdate(dp);
}
iunlockput(dp);
ip->nlink--;
iupdate(ip);
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return 0;
bad:
iunlockput(dp);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
static struct inode*
2009-05-31 04:07:51 +02:00
create(char *path, short type, short major, short minor)
{
uint off;
struct inode *ip, *dp;
char name[DIRSIZ];
if((dp = nameiparent(path, name)) == 0)
return 0;
ilock(dp);
2009-05-31 04:07:51 +02:00
if((ip = dirlookup(dp, name, &off)) != 0){
iunlockput(dp);
ilock(ip);
2009-07-12 04:26:01 +02:00
if(type == T_FILE && ip->type == T_FILE)
return ip;
iunlockput(ip);
return 0;
}
2009-07-12 04:26:01 +02:00
if((ip = ialloc(dp->dev, type)) == 0)
panic("create: ialloc");
ilock(ip);
ip->major = major;
ip->minor = minor;
2007-08-27 18:06:15 +02:00
ip->nlink = 1;
iupdate(ip);
if(type == T_DIR){ // Create . and .. entries.
dp->nlink++; // for ".."
iupdate(dp);
// No ip->nlink++ for ".": avoid cyclic ref count.
if(dirlink(ip, ".", ip->inum) < 0 || dirlink(ip, "..", dp->inum) < 0)
2007-08-27 16:39:50 +02:00
panic("create dots");
}
2009-05-31 04:07:51 +02:00
if(dirlink(dp, name, ip->inum) < 0)
panic("create: dirlink");
iunlockput(dp);
return ip;
}
int
sys_open(void)
{
char *path;
int fd, omode;
2006-09-07 16:13:26 +02:00
struct file *f;
struct inode *ip;
2006-09-07 16:13:26 +02:00
if(argstr(0, &path) < 0 || argint(1, &omode) < 0)
return -1;
2014-08-27 23:15:30 +02:00
begin_op();
if(omode & O_CREATE){
ip = create(path, T_FILE, 0, 0);
if(ip == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
2007-08-28 20:37:41 +02:00
} else {
if((ip = namei(path)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
ilock(ip);
2009-05-31 04:07:51 +02:00
if(ip->type == T_DIR && omode != O_RDONLY){
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
}
if((f = filealloc()) == 0 || (fd = fdalloc(f)) < 0){
if(f)
fileclose(f);
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
iunlock(ip);
2014-08-27 23:15:30 +02:00
end_op();
f->type = FD_INODE;
f->ip = ip;
f->off = 0;
2007-08-27 16:39:50 +02:00
f->readable = !(omode & O_WRONLY);
f->writable = (omode & O_WRONLY) || (omode & O_RDWR);
2006-09-07 16:13:26 +02:00
return fd;
}
2009-07-12 04:26:01 +02:00
int
sys_mkdir(void)
{
char *path;
struct inode *ip;
2014-08-27 23:15:30 +02:00
begin_op();
if(argstr(0, &path) < 0 || (ip = create(path, T_DIR, 0, 0)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
2009-07-12 04:26:01 +02:00
return -1;
}
2009-07-12 04:26:01 +02:00
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
2009-07-12 04:26:01 +02:00
return 0;
}
int
sys_mknod(void)
{
struct inode *ip;
2006-09-07 16:13:26 +02:00
char *path;
2007-08-24 22:59:43 +02:00
int major, minor;
2015-09-27 05:10:25 +02:00
2014-08-27 23:15:30 +02:00
begin_op();
2015-09-27 05:10:25 +02:00
if((argstr(0, &path)) < 0 ||
argint(1, &major) < 0 ||
argint(2, &minor) < 0 ||
(ip = create(path, T_DEV, major, minor)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
2006-09-07 16:13:26 +02:00
return 0;
}
int
sys_chdir(void)
{
2006-09-07 16:13:26 +02:00
char *path;
struct inode *ip;
2019-05-31 15:45:59 +02:00
struct proc *p = myproc();
2014-08-27 23:15:30 +02:00
begin_op();
if(argstr(0, &path) < 0 || (ip = namei(path)) == 0){
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
ilock(ip);
2007-08-28 20:32:08 +02:00
if(ip->type != T_DIR){
iunlockput(ip);
2014-08-27 23:15:30 +02:00
end_op();
return -1;
}
iunlock(ip);
2019-05-31 15:45:59 +02:00
iput(p->cwd);
2014-08-27 23:15:30 +02:00
end_op();
2019-05-31 15:45:59 +02:00
p->cwd = ip;
return 0;
}
int
sys_exec(void)
{
char *path, *argv[MAXARG];
int i;
Checkpoint port of xv6 to x86-64. Passed usertests on 2 processors a few times. The x86-64 doesn't just add two levels to page tables to support 64 bit addresses, but is a different processor. For example, calling conventions, system calls, and segmentation are different from 32-bit x86. Segmentation is basically gone, but gs/fs in combination with MSRs can be used to hold a per-core pointer. In general, x86-64 is more straightforward than 32-bit x86. The port uses code from sv6 and the xv6 "rsc-amd64" branch. A summary of the changes is as follows: - Booting: switch to grub instead of xv6's bootloader (pass -kernel to qemu), because xv6's boot loader doesn't understand 64bit ELF files. And, we don't care anymore about booting. - Makefile: use -m64 instead of -m32 flag for gcc, delete boot loader, xv6.img, bochs, and memfs. For now dont' use -O2, since usertests with -O2 is bigger than MAXFILE! - Update gdb.tmpl to be for i386 or x86-64 - Console/printf: use stdarg.h and treat 64-bit addresses different from ints (32-bit) - Update elfhdr to be 64 bit - entry.S/entryother.S: add code to switch to 64-bit mode: build a simple page table in 32-bit mode before switching to 64-bit mode, share code for entering boot processor and APs, and tweak boot gdt. The boot gdt is the gdt that the kernel proper also uses. (In 64-bit mode, the gdt/segmentation and task state mostly disappear.) - exec.c: fix passing argv (64-bit now instead of 32-bit). - initcode.c: use syscall instead of int. - kernel.ld: load kernel very high, in top terabyte. 64 bits is a lot of address space! - proc.c: initial return is through new syscall path instead of trapret. - proc.h: update struct cpu to have some scratch space since syscall saves less state than int, update struct context to reflect x86-64 calling conventions. - swtch: simplify for x86-64 calling conventions. - syscall: add fetcharg to handle x86-64 calling convetions (6 arguments are passed through registers), and fetchaddr to read a 64-bit value from user space. - sysfile: update to handle pointers from user space (e.g., sys_exec), which are 64 bits. - trap.c: no special trap vector for sys calls, because x86-64 has a different plan for system calls. - trapasm: one plan for syscalls and one plan for traps (interrupt and exceptions). On x86-64, the kernel is responsible for switching user/kernel stacks. To do, xv6 keeps some scratch space in the cpu structure, and uses MSR GS_KERN_BASE to point to the core's cpu structure (using swapgs). - types.h: add uint64, and change pde_t to uint64 - usertests: exit() when fork fails, which helped in tracking down one of the bugs in the switch from 32-bit to 64-bit - vectors: update to make them 64 bits - vm.c: use bootgdt in kernel too, program MSRs for syscalls and core-local state (for swapgs), walk 4 levels in walkpgdir, add DEVSPACETOP, use task segment to set kernel stack for interrupts (but simpler than in 32-bit mode), add an extra argument to freevm (size of user part of address space) to avoid checking all entries till KERNBASE (there are MANY TB before the top 1TB). - x86: update trapframe to have 64-bit entries, which is what the processor pushes on syscalls and traps. simplify lgdt and lidt, using struct desctr, which needs the gcc directives packed and aligned. TODO: - use int32 instead of int? - simplify curproc(). xv6 has per-cpu state again, but this time it must have it. - avoid repetition in walkpgdir - fix validateint() in usertests.c - fix bugs (e.g., observed one a case of entering kernel with invalid gs or proc
2018-09-23 14:24:42 +02:00
uint64 uargv, uarg;
2006-09-07 16:13:26 +02:00
printf("sys_exec\n");
Checkpoint port of xv6 to x86-64. Passed usertests on 2 processors a few times. The x86-64 doesn't just add two levels to page tables to support 64 bit addresses, but is a different processor. For example, calling conventions, system calls, and segmentation are different from 32-bit x86. Segmentation is basically gone, but gs/fs in combination with MSRs can be used to hold a per-core pointer. In general, x86-64 is more straightforward than 32-bit x86. The port uses code from sv6 and the xv6 "rsc-amd64" branch. A summary of the changes is as follows: - Booting: switch to grub instead of xv6's bootloader (pass -kernel to qemu), because xv6's boot loader doesn't understand 64bit ELF files. And, we don't care anymore about booting. - Makefile: use -m64 instead of -m32 flag for gcc, delete boot loader, xv6.img, bochs, and memfs. For now dont' use -O2, since usertests with -O2 is bigger than MAXFILE! - Update gdb.tmpl to be for i386 or x86-64 - Console/printf: use stdarg.h and treat 64-bit addresses different from ints (32-bit) - Update elfhdr to be 64 bit - entry.S/entryother.S: add code to switch to 64-bit mode: build a simple page table in 32-bit mode before switching to 64-bit mode, share code for entering boot processor and APs, and tweak boot gdt. The boot gdt is the gdt that the kernel proper also uses. (In 64-bit mode, the gdt/segmentation and task state mostly disappear.) - exec.c: fix passing argv (64-bit now instead of 32-bit). - initcode.c: use syscall instead of int. - kernel.ld: load kernel very high, in top terabyte. 64 bits is a lot of address space! - proc.c: initial return is through new syscall path instead of trapret. - proc.h: update struct cpu to have some scratch space since syscall saves less state than int, update struct context to reflect x86-64 calling conventions. - swtch: simplify for x86-64 calling conventions. - syscall: add fetcharg to handle x86-64 calling convetions (6 arguments are passed through registers), and fetchaddr to read a 64-bit value from user space. - sysfile: update to handle pointers from user space (e.g., sys_exec), which are 64 bits. - trap.c: no special trap vector for sys calls, because x86-64 has a different plan for system calls. - trapasm: one plan for syscalls and one plan for traps (interrupt and exceptions). On x86-64, the kernel is responsible for switching user/kernel stacks. To do, xv6 keeps some scratch space in the cpu structure, and uses MSR GS_KERN_BASE to point to the core's cpu structure (using swapgs). - types.h: add uint64, and change pde_t to uint64 - usertests: exit() when fork fails, which helped in tracking down one of the bugs in the switch from 32-bit to 64-bit - vectors: update to make them 64 bits - vm.c: use bootgdt in kernel too, program MSRs for syscalls and core-local state (for swapgs), walk 4 levels in walkpgdir, add DEVSPACETOP, use task segment to set kernel stack for interrupts (but simpler than in 32-bit mode), add an extra argument to freevm (size of user part of address space) to avoid checking all entries till KERNBASE (there are MANY TB before the top 1TB). - x86: update trapframe to have 64-bit entries, which is what the processor pushes on syscalls and traps. simplify lgdt and lidt, using struct desctr, which needs the gcc directives packed and aligned. TODO: - use int32 instead of int? - simplify curproc(). xv6 has per-cpu state again, but this time it must have it. - avoid repetition in walkpgdir - fix validateint() in usertests.c - fix bugs (e.g., observed one a case of entering kernel with invalid gs or proc
2018-09-23 14:24:42 +02:00
if(argstr(0, &path) < 0 || argaddr(1, &uargv) < 0){
printf("error 1\n");
return -1;
}
memset(argv, 0, sizeof(argv));
for(i=0;; i++){
if(i >= NELEM(argv)){
printf("error 2\n");
return -1;
}
if(fetchaddr(uargv+sizeof(uint64)*i, (uint64*)&uarg) < 0){
printf("error 3\n");
return -1;
}
if(uarg == 0){
argv[i] = 0;
break;
}
if(fetchstr(uarg, &argv[i]) < 0){
printf("error 4\n");
return -1;
}
}
printf("calling exec\n");
return exec(path, argv);
}
int
sys_pipe(void)
{
int *fd;
struct file *rf, *wf;
int fd0, fd1;
if(argptr(0, (void*)&fd, 2*sizeof(fd[0])) < 0)
return -1;
2007-08-28 06:22:35 +02:00
if(pipealloc(&rf, &wf) < 0)
return -1;
fd0 = -1;
if((fd0 = fdalloc(rf)) < 0 || (fd1 = fdalloc(wf)) < 0){
if(fd0 >= 0)
myproc()->ofile[fd0] = 0;
fileclose(rf);
fileclose(wf);
return -1;
}
fd[0] = fd0;
fd[1] = fd1;
return 0;
}