/* * Copyright (C) 2008 Bahadir Balban */ #include #include #include #include #include #include #include #include #include #include #include INC_ARCH(bootdesc.h) #include struct page *page_init(struct page *page) { /* Reset page */ memset(page, 0, sizeof(*page)); page->refcnt = -1; spin_lock_init(&page->lock); INIT_LIST_HEAD(&page->list); return page; } struct page *find_page(struct vm_object *obj, unsigned long pfn) { struct page *p; list_for_each_entry(p, &obj->page_cache, list) if (p->offset == pfn) return p; return 0; } /* * Deletes all pages in a page cache, assumes pages are from the * page allocator, and page structs are from the page_array, which * is the default situation. */ int default_release_pages(struct vm_object *vm_obj) { struct page *p, *n; list_for_each_entry_safe(p, n, &vm_obj->page_cache, list) { list_del(&p->list); BUG_ON(p->refcnt); /* Return page back to allocator */ free_page((void *)page_to_phys(p)); /* Free the page structure */ kfree(p); /* Reduce object page count */ BUG_ON(--vm_obj->npages < 0); } return 0; } struct page *file_page_in(struct vm_object *vm_obj, unsigned long page_offset) { struct vm_file *f = vm_object_to_file(vm_obj); struct page *page; void *vaddr, *paddr; int err; /* Check first if the file has such a page at all */ if (__pfn(page_align_up(f->length) <= page_offset)) { printf("%s: %s: Trying to look up page %d, but file length " "is %d bytes.\n", __TASKNAME__, __FUNCTION__, page_offset, f->length); BUG(); } /* The page is not resident in page cache. */ if (!(page = find_page(vm_obj, page_offset))) { /* Allocate a new page */ paddr = alloc_page(1); vaddr = phys_to_virt(paddr); page = phys_to_page(paddr); /* Map the page to vfs task */ l4_map(paddr, vaddr, 1, MAP_USR_RW_FLAGS, VFS_TID); /* Syscall to vfs to read into the page. */ if ((err = vfs_read(vm_file_to_vnum(f), page_offset, 1, vaddr)) < 0) goto out_err; /* Unmap it from vfs */ l4_unmap(vaddr, 1, VFS_TID); /* Update vm object details */ vm_obj->npages++; /* Update page details */ page_init(page); page->refcnt++; page->owner = vm_obj; page->offset = page_offset; page->virtual = 0; /* Add the page to owner's list of in-memory pages */ BUG_ON(!list_empty(&page->list)); insert_page_olist(page, vm_obj); } return page; out_err: l4_unmap(vaddr, 1, VFS_TID); free_page(paddr); return PTR_ERR(err); } /* * All non-mmapable char devices are handled by this. * VFS calls those devices to read their pages */ struct vm_pager file_pager = { .ops = { .page_in = file_page_in, .release_pages = default_release_pages, }, }; /* A proposal for shadow vma container, could be part of vm_file->priv_data */ struct vm_swap_node { struct vm_file *swap_file; struct task_ids task_ids; struct address_pool *pool; }; /* * This should save swap_node/page information either in the pte or in a global * list of swap descriptors, and then write the page into the possibly one and * only swap file. */ struct page *swap_page_in(struct vm_object *vm_obj, unsigned long file_offset) { struct page *p; /* No swapping yet, so the page is either here or not here. */ if (!(p = find_page(vm_obj, file_offset))) return PTR_ERR(-EINVAL); else return p; } struct vm_pager swap_pager = { .ops = { .page_in = swap_page_in, .release_pages = default_release_pages, }, }; /* * Just releases the page structures since the actual pages are * already in memory as read-only. */ int bootfile_release_pages(struct vm_object *vm_obj) { struct page *p, *n; list_for_each_entry_safe(p, n, &vm_obj->page_cache, list) { list_del(&p->list); BUG_ON(p->refcnt); /* Free the page structure */ kfree(p); /* Reduce object page count */ BUG_ON(--vm_obj->npages < 0); } return 0; } /* Returns the page with given offset in this vm_object */ struct page *bootfile_page_in(struct vm_object *vm_obj, unsigned long offset) { struct vm_file *boot_file = vm_object_to_file(vm_obj); struct svc_image *img = boot_file->priv_data; struct page *page; /* Check first if the file has such a page at all */ if (__pfn(page_align_up(boot_file->length) <= offset)) { printf("%s: %s: Trying to look up page %d, but file length " "is %d bytes.\n", __TASKNAME__, __FUNCTION__, offset, boot_file->length); BUG(); } /* The page is not resident in page cache. */ if (!(page = find_page(vm_obj, offset))) { page = phys_to_page(img->phys_start + __pfn_to_addr(offset)); /* Update page */ page_init(page); page->refcnt++; page->owner = vm_obj; page->offset = offset; /* Update object */ vm_obj->npages++; /* Add the page to owner's list of in-memory pages */ BUG_ON(!list_empty(&page->list)); insert_page_olist(page, vm_obj); } return page; } struct vm_pager bootfile_pager = { .ops = { .page_in = bootfile_page_in, .release_pages = bootfile_release_pages, }, }; /* From bare boot images, create mappable device files */ int init_boot_files(struct initdata *initdata) { struct bootdesc *bd = initdata->bootdesc; struct vm_file *boot_file; struct svc_image *img; INIT_LIST_HEAD(&initdata->boot_file_list); for (int i = 0; i < bd->total_images; i++) { img = &bd->images[i]; boot_file = vm_file_create(); boot_file->priv_data = img; boot_file->length = img->phys_end - img->phys_start; boot_file->type = VM_FILE_BOOTFILE; /* Initialise the vm object */ boot_file->vm_obj.flags = VM_OBJ_FILE; boot_file->vm_obj.pager = &bootfile_pager; /* Add the object to global vm_object list */ list_add(&boot_file->vm_obj.list, &vm_object_list); /* Add the file to initdata's bootfile list */ list_add_tail(&boot_file->list, &initdata->boot_file_list); } return 0; } /* Returns the page with given offset in this vm_object */ struct page *devzero_page_in(struct vm_object *vm_obj, unsigned long page_offset) { struct vm_file *devzero = vm_object_to_file(vm_obj); struct page *zpage = devzero->priv_data; BUG_ON(!(devzero->type & VM_FILE_DEVZERO)); /* Update zero page struct. */ spin_lock(&zpage->lock); BUG_ON(zpage->refcnt < 0); zpage->refcnt++; spin_unlock(&zpage->lock); return zpage; } struct vm_pager devzero_pager = { .ops = { .page_in = devzero_page_in, }, }; struct vm_file *get_devzero(void) { struct vm_file *f; list_for_each_entry(f, &vm_file_list, list) if (f->type == VM_FILE_DEVZERO) return f; return 0; } int init_devzero(void) { void *zphys, *zvirt; struct page *zpage; struct vm_file *devzero; /* Allocate and initialise the zero page */ zphys = alloc_page(1); zpage = phys_to_page(zphys); zvirt = l4_map_helper(zphys, 1); memset(zvirt, 0, PAGE_SIZE); l4_unmap_helper(zvirt, 1); /* Allocate and initialise devzero file */ devzero = vm_file_create(); devzero->type = VM_FILE_DEVZERO; devzero->priv_data = zpage; devzero->length = page_align(~0UL); /* So we dont wraparound to 0! */ devzero->vm_obj.npages = __pfn(devzero->length); devzero->vm_obj.pager = &devzero_pager; devzero->vm_obj.flags = VM_OBJ_FILE; /* Initialise zpage */ zpage->refcnt++; zpage->owner = &devzero->vm_obj; list_add(&devzero->vm_obj.list, &vm_object_list); list_add(&devzero->list, &vm_file_list); return 0; }