#include #include #include #include #include #include #include #include #include #include #define SYSCALL_RETURN(val) return regs_savereturn(&process_current->regs, val) _Noreturn void _syscall_exit(int ret) { process_kill(process_current, ret); process_switch_any(); } int _syscall_await(void) { bool has_children = false; process_transition(process_current, PS_WAITS4CHILDDEATH); // find any already dead children for (struct process *iter = process_current->child; iter; iter = iter->sibling) { if (iter->state == PS_DEAD && !iter->noreap) SYSCALL_RETURN(process_try2collect(iter)); if (iter->state != PS_DEADER) has_children = true; } if (!has_children) { process_transition(process_current, PS_RUNNING); SYSCALL_RETURN(~0); // TODO errno } else { SYSCALL_RETURN(-1); } } int _syscall_fork(int flags) { struct process *child = process_fork(process_current, flags); regs_savereturn(&child->regs, 0); SYSCALL_RETURN(1); } handle_t _syscall_open(const char __user *path, int len) { struct vfs_mount *mount; char *path_buf = NULL; if (PATH_MAX < len) SYSCALL_RETURN(-1); if (process_find_handle(process_current, 0) < 0) SYSCALL_RETURN(-1); path_buf = virt_cpy2kmalloc(process_current->pages, path, len); if (!path_buf) goto fail; len = path_simplify(path_buf, path_buf, len); if (len < 0) goto fail; mount = vfs_mount_resolve(process_current->mount, path_buf, len); if (!mount) goto fail; if (mount->prefix_len > 0) { // strip prefix len -= mount->prefix_len; // i can't just adjust path_buf, because it needs to be passed to free() // later on memcpy(path_buf, path_buf + mount->prefix_len, len); } vfsreq_create((struct vfs_request) { .type = VFSOP_OPEN, .input = { .kern = true, .buf_kern = path_buf, .len = len, }, .caller = process_current, .backend = mount->backend, }); return -1; // dummy fail: kfree(path_buf); SYSCALL_RETURN(-1); } int _syscall_mount(handle_t hid, const char __user *path, int len) { struct vfs_mount *mount = NULL; struct vfs_backend *backend = NULL; char *path_buf = NULL; if (PATH_MAX < len) SYSCALL_RETURN(-1); // copy the path to the kernel to simplify it path_buf = virt_cpy2kmalloc(process_current->pages, path, len); if (!path_buf) goto fail; len = path_simplify(path_buf, path_buf, len); if (len < 0) goto fail; // remove trailing slash // mounting something under `/this` and `/this/` should be equalivent if (path_buf[len - 1] == '/') { if (len == 0) goto fail; len--; } if (hid >= 0) { // mounting a real backend? struct handle *handle = process_handle_get(process_current, hid, HANDLE_FS_FRONT); if (!handle) goto fail; backend = handle->fs.backend; backend->refcount++; } // otherwise backend == NULL // append to mount list // TODO move to kernel/vfs/mount.c mount = kmalloc(sizeof *mount); mount->prev = process_current->mount; mount->prefix = path_buf; mount->prefix_owned = true; mount->prefix_len = len; mount->backend = backend; mount->refs = 1; process_current->mount = mount; kmalloc_sanity(mount); kmalloc_sanity(mount->prefix); SYSCALL_RETURN(0); fail: kfree(path_buf); kfree(mount); SYSCALL_RETURN(-1); } int _syscall_read(handle_t handle_num, void __user *buf, size_t len, int offset) { struct handle *handle = process_handle_get(process_current, handle_num, HANDLE_FILE); if (!handle) SYSCALL_RETURN(-1); vfsreq_create((struct vfs_request) { .type = VFSOP_READ, .output = { .buf = (userptr_t) buf, .len = len, }, .id = handle->file.id, .offset = offset, .caller = process_current, .backend = handle->file.backend, }); return -1; // dummy } int _syscall_write(handle_t handle_num, const void __user *buf, size_t len, int offset) { struct handle *handle = process_handle_get(process_current, handle_num, HANDLE_FILE); if (!handle) SYSCALL_RETURN(-1); vfsreq_create((struct vfs_request) { .type = VFSOP_WRITE, .input = { .buf = (userptr_t) buf, .len = len, }, .id = handle->file.id, .offset = offset, .caller = process_current, .backend = handle->file.backend, }); return -1; // dummy } int _syscall_close(handle_t hid) { if (hid < 0 || hid >= HANDLE_MAX) return -1; struct handle **h = &process_current->handles[hid]; if (!*h) SYSCALL_RETURN(-1); handle_close(*h); *h = NULL; SYSCALL_RETURN(0); } handle_t _syscall_fs_fork2(void) { struct vfs_backend *backend; struct process *child; handle_t front; front = process_find_handle(process_current, 1); if (front < 0) SYSCALL_RETURN(-1); process_current->handles[front] = handle_init(HANDLE_FS_FRONT); backend = kmalloc(sizeof *backend); backend->heap = true; backend->is_user = true; backend->potential_handlers = 1; backend->refcount = 2; // child + handle backend->user.handler = NULL; backend->queue = NULL; child = process_fork(process_current, 0); if (child->controlled) vfs_backend_refdown(child->controlled); child->controlled = backend; regs_savereturn(&child->regs, 0); process_current->handles[front]->fs.backend = backend; SYSCALL_RETURN(front); } int _syscall_fs_wait(char __user *buf, int max_len, struct fs_wait_response __user *res) { struct vfs_backend *backend = process_current->controlled; if (!backend) SYSCALL_RETURN(-1); process_transition(process_current, PS_WAITS4REQUEST); assert(!backend->user.handler); // TODO allow multiple processes to wait on the same backend backend->user.handler = process_current; /* checking the validity of those pointers here would make * vfs_backend_accept simpler. TODO? */ process_current->awaited_req.buf = buf; process_current->awaited_req.max_len = max_len; process_current->awaited_req.res = res; vfs_backend_tryaccept(backend); // sets return value return -1; // dummy } int _syscall_fs_respond(char __user *buf, int ret) { struct vfs_request *req = process_current->handled_req; if (!req) SYSCALL_RETURN(-1); if (req->output.len > 0 && ret > 0) { // if this vfsop outputs data and ret is positive, it's the length of the buffer // TODO document ret = min(ret, capped_cast32(req->output.len)); if (!virt_cpy(req->caller->pages, req->output.buf, process_current->pages, buf, ret)) { // how should this error even be handled? TODO } } process_current->handled_req = NULL; vfsreq_finish(req, ret); SYSCALL_RETURN(0); } int _syscall_memflag(void __user *addr, size_t len, int flags) { userptr_t goal = addr + len; struct pagedir *pages = process_current->pages; if (flags != MEMFLAG_PRESENT) panic_unimplemented(); // TODO addr = (userptr_t)((int __force)addr & ~PAGE_MASK); // align to page boundary for (; addr < goal; addr += PAGE_SIZE) { if (pagedir_virt2phys(pages, addr, false, false)) { // allocated page, currently a no-op // if you'll be changing this - remember to check if the pages are owned by the kernel! } else { // allocate the new pages pagedir_map(pages, addr, page_alloc(1), true, true); } } SYSCALL_RETURN(-1); } int _syscall(int num, int a, int b, int c, int d) { switch (num) { case _SYSCALL_EXIT: _syscall_exit(a); case _SYSCALL_AWAIT: return _syscall_await(); case _SYSCALL_FORK: return _syscall_fork(a); case _SYSCALL_OPEN: return _syscall_open((userptr_t)a, b); case _SYSCALL_MOUNT: return _syscall_mount(a, (userptr_t)b, c); case _SYSCALL_READ: return _syscall_read(a, (userptr_t)b, c, d); case _SYSCALL_WRITE: return _syscall_write(a, (userptr_t)b, c, d); case _SYSCALL_CLOSE: return _syscall_close(a); case _SYSCALL_FS_FORK2: return _syscall_fs_fork2(); case _SYSCALL_FS_WAIT: return _syscall_fs_wait((userptr_t)a, b, (userptr_t)c); case _SYSCALL_FS_RESPOND: return _syscall_fs_respond((userptr_t)a, b); case _SYSCALL_MEMFLAG: return _syscall_memflag((userptr_t)a, b, c); default: kprintf("unknown syscall "); panic_unimplemented(); // TODO fail gracefully } }