Initial commit

2026-04-06 03:59:07 +02:00 · 2008-01-13 13:53:52 +00:00
commit e2b791a3d8
789 changed files with 95825 additions and 0 deletions
--- a/tasks/mm0/src/mmap.c
+++ b/tasks/mm0/src/mmap.c
@@ -0,0 +1,489 @@
+/*
+ * mmap/munmap and friends.
+ *
+ * Copyright (C) 2007 Bahadir Balban
+ */
+#include <vm_area.h>
+#include <kmalloc/kmalloc.h>
+#include INC_API(errno.h)
+#include <posix/sys/types.h>
+#include <task.h>
+#include <mmap.h>
+#include <l4lib/arch/syscalls.h>
+
+static struct vm_file devzero;
+
+/* Swap related bookkeeping.
+static struct vm_file shm_swap_file;
+static struct id_pool *swap_file_offset_pool;
+*/
+
+/* mmap system call implementation */
+int sys_mmap(l4id_t sender, void *start, size_t length, int prot,
+	     int flags, int fd, off_t offset)
+{
+	return 0;
+}
+
+/* TODO: This is to be implemented when fs0 is ready. */
+int do_msync(void *addr, unsigned long size, unsigned int flags, struct tcb *task)
+{
+	// unsigned long npages = __pfn(size);
+	struct vm_area *vma = find_vma((unsigned long)addr,
+				       &task->vm_area_list);
+	if (!vma)
+		return -EINVAL;
+
+	/* Must check if this is a shadow copy or not */
+	if (vma->flags & VMA_COW) {
+		;	/* ... Fill this in. ... */
+	}
+
+	/* TODO:
+	 * Flush the vma's pages back to their file. Perhaps add a dirty bit
+	 * to the vma so that this can be completely avoided for clean vmas?
+	 * For anon pages this is the swap file. For real file-backed pages
+	 * its the real file. However, this can't be fully implemented yet since
+	 * we don't have FS0 yet.
+	 */
+	return 0;
+}
+
+/*
+ * This releases a physical page struct from its owner and
+ * frees the page back to the page allocator.
+ */
+int page_release(struct page *page)
+{
+	spin_lock(&page->lock);
+	page->count--;
+	BUG_ON(page->count < -1);
+	if (page->count == -1) {
+		/* Unlink the page from its owner's list */
+		list_del_init(&page->list);
+
+		/* Zero out the fields */
+		page->owner = 0;
+		page->flags = 0;
+		page->f_offset = 0;
+		page->virtual = 0;
+
+		/*
+		 * No refs to page left, and since every physical memory page
+		 * comes from the page allocator, we return it back.
+		 */
+		free_page((void *)page_to_phys(page));
+	}
+	spin_unlock(&page->lock);
+	return 0;
+}
+
+/*
+ * Freeing and unmapping of vma pages:
+ *
+ * For a vma that is about to be split, shrunk or destroyed, this function
+ * finds out about the physical pages in memory that represent the vma,
+ * reduces their refcount, and if they're unused, frees them back to the
+ * physical page allocator, and finally unmaps those corresponding virtual
+ * addresses from the unmapper task's address space. This sequence is
+ * somewhat a rewinding of the actions that the page fault handler takes
+ * when the vma was faulted by the process.
+ */
+int vma_release_pages(struct vm_area *vma, struct tcb *task,
+		      unsigned long pfn_start, unsigned long pfn_end)
+{
+	unsigned long f_start, f_end;
+	struct page *page, *n;
+
+	/* Assume vma->pfn_start is lower than or equal to pfn_start */
+	BUG_ON(vma->pfn_start > pfn_start);
+
+	/* Assume vma->pfn_end is higher or equal to pfn_end */
+	BUG_ON(vma->pfn_end < pfn_end);
+
+	/* Find the file offsets of the range to be freed. */
+	f_start = vma->f_offset + pfn_start - vma->pfn_start;
+	f_end = vma->f_offset + vma->pfn_end - pfn_end;
+
+	list_for_each_entry_safe(page, n, &vma->owner->page_cache_list, list) {
+		if (page->f_offset >= f_start && page->f_offset <= f_end) {
+			l4_unmap((void *)virtual(page), 1, task->tid);
+			page_release(page);
+		}
+	}
+	return 0;
+}
+int vma_unmap(struct vm_area **orig, struct vm_area **new,
+	      unsigned long, unsigned long, struct tcb *);
+/*
+ * This is called by every vma modifier function in vma_unmap(). This in turn
+ * calls vma_unmap recursively to modify the shadow vmas, the same way the
+ * actual vmas get modified. Only COW vmas would need to do this recursion
+ * and the max level of recursion is one, since only one level of shadows exist.
+ */
+int vma_unmap_shadows(struct vm_area *vma, struct tcb *task, unsigned long pfn_start,
+		      unsigned long pfn_end)
+{
+	struct vm_area *shadow, *n;
+
+	/* Now do all shadows */
+	list_for_each_entry_safe(shadow, n, &vma->shadow_list,
+				 shadow_list) {
+		BUG_ON(!(vma->flags & VMA_COW));
+		if (shadow->pfn_start >= pfn_start &&
+		    shadow->pfn_end <= pfn_end) {
+			struct vm_area *split_shadow;
+			/* This may result in shrink/destroy/split of the shadow */
+			vma_unmap(&shadow, &split_shadow, pfn_start, pfn_end, task);
+			if (shadow && split_shadow)
+				list_add_tail(&split_shadow->list,
+					      &shadow->list);
+			/* FIXME: Is this all to be done here??? Find what to do here. */
+			BUG();
+		}
+	}
+	return 0;
+}
+
+struct vm_area *vma_new(unsigned long pfn_start, unsigned long npages,
+			unsigned int flags,  unsigned long f_offset,
+			struct vm_file *owner)
+{
+	struct vm_area *vma;
+
+	/* Initialise new area */
+	if (!(vma = kzalloc(sizeof(struct vm_area))))
+		return 0;
+
+	vma->pfn_start = pfn_start;
+	vma->pfn_end = pfn_start + npages;
+	vma->flags = flags;
+	vma->f_offset = f_offset;
+	vma->owner = owner;
+	INIT_LIST_HEAD(&vma->list);
+	INIT_LIST_HEAD(&vma->shadow_list);
+
+	return vma;
+}
+
+/* TODO: vma_destroy/shrink/split should also handle swap file modification */
+
+/* Frees and unlinks a vma from its list. TODO: Add list locking */
+int vma_destroy(struct vm_area *vma, struct tcb *task)
+{
+	struct vm_area *shadow, *n;
+
+	/* Release the vma pages */
+	vma_release_pages(vma, task, vma->pfn_start, vma->pfn_end);
+
+	/* Free all shadows, if any. */
+	list_for_each_entry_safe(shadow, n, &vma->shadow_list, list) {
+		/* Release all shadow pages */
+		vma_release_pages(shadow, task, shadow->pfn_start, shadow->pfn_end);
+		list_del(&shadow->list);
+		kfree(shadow);
+	}
+
+	/* Unlink and free the vma itself */
+	list_del(&vma->list);
+	if (kfree(vma) < 0)
+		BUG();
+
+	return 0;
+}
+
+/* This splits a vma, splitter region must be in the *middle* of original vma */
+struct vm_area *vma_split(struct vm_area *vma, struct tcb *task,
+			  unsigned long pfn_start, unsigned long pfn_end)
+{
+	struct vm_area *new, *shadow, *n;
+
+	/* Allocate an uninitialised vma first */
+	if (!(new = vma_new(0, 0, 0, 0, 0)))
+		return 0;
+
+
+	/*
+	 * Some sanity checks to show that splitter range does end up
+	 * producing two smaller vmas.
+	 */
+	BUG_ON(vma->pfn_start >= pfn_start || vma->pfn_end <= pfn_end);
+
+	/* Release the pages before modifying the original vma */
+	vma_release_pages(vma, task, pfn_start, pfn_end);
+
+	new->pfn_end = vma->pfn_end;
+	new->pfn_start = pfn_end;
+	new->f_offset = vma->f_offset + new->pfn_start - vma->pfn_start;
+	vma->pfn_end = pfn_start;
+
+	new->flags = vma->flags;
+	new->owner = vma->owner;
+
+	/* Modify the shadows accordingly first. They may
+	 * split/shrink or get completely destroyed or stay still. */
+	vma_unmap_shadows(vma, task, pfn_start, pfn_end);
+
+	/*
+	 * Now split the modified shadows list into two vmas:
+	 * If the file was COW and its vma had split, vma_new would have
+	 * a valid value and as such the shadows must be separated into
+	 * the two new vmas according to which one they belong to.
+	 */
+	list_for_each_entry_safe(shadow, n, &vma->shadow_list,
+				 shadow_list) {
+		BUG_ON(!(vma->flags & VMA_COW));
+		BUG_ON(!(new->flags & VMA_COW));
+		if (shadow->pfn_start >= new->pfn_start &&
+		    shadow->pfn_end <= new->pfn_end) {
+			list_del_init(&shadow->list);
+			list_add(&shadow->list, &new->shadow_list);
+		} else
+			BUG_ON(!(shadow->pfn_start >= vma->pfn_start &&
+			       shadow->pfn_end <= vma->pfn_end));
+	}
+
+	return new;
+}
+
+/*
+ * For written anonymous regions swapfile segments are allocated dynamically.
+ * when vma regions are modified these allocations must be re-adjusted.
+ * This call handles this adjustment as well as the vma.
+ */
+int vma_swapfile_realloc(struct vm_area *vma, unsigned long pfn_start,
+			 unsigned long pfn_end)
+{
+	/* TODO: Reslot in swapfile */
+	BUG();
+	return 0;
+}
+
+
+
+/* This shrinks the vma from *one* end only, either start or end */
+int vma_shrink(struct vm_area *vma, struct tcb *task, unsigned long pfn_start,
+	       unsigned long pfn_end)
+{
+	unsigned long diff;
+
+	BUG_ON(pfn_start >= pfn_end);
+
+	/* FIXME: Shadows are currently buggy - TBD */
+	if (!list_empty(&vma->shadow_list)) {
+		BUG();
+		vma_swapfile_realloc(vma, pfn_start, pfn_end);
+		return 0;
+	}
+
+	/* Release the pages before modifying the original vma */
+	vma_release_pages(vma, task, pfn_start, pfn_end);
+
+	/* Shrink from the beginning */
+	if (pfn_start > vma->pfn_start) {
+		diff = pfn_start - vma->pfn_start;
+		vma->f_offset += diff;
+		vma->pfn_start = pfn_start;
+
+	/* Shrink from the end */
+	} else if (pfn_end < vma->pfn_end) {
+		diff = vma->pfn_end - pfn_end;
+		vma->pfn_end = pfn_end;
+	} else
+		BUG();
+
+	return vma_unmap_shadows(vma, task, pfn_start, pfn_end);
+}
+
+/*
+ * Unmaps the given region from a vma. Depending on the region and vma range,
+ * this may result in either shrinking, splitting or destruction of the vma.
+ */
+int vma_unmap(struct vm_area **actual, struct vm_area **split,
+	      unsigned long pfn_start, unsigned long pfn_end, struct tcb *task)
+{
+	struct vm_area *vma = *actual;
+	struct vm_area *vma_new = 0;
+
+	/* Split needed? */
+	if (vma->pfn_start < pfn_start && vma->pfn_end > pfn_end) {
+		if (!(vma_new = vma_split(vma, task, pfn_start, pfn_end)))
+			return -ENOMEM;
+		list_add_tail(&vma_new->list, &vma->list);
+
+	/* Shrink needed? */
+	} else if (((vma->pfn_start == pfn_start) && (vma->pfn_end > pfn_end))
+	    	   || ((vma->pfn_start < pfn_start) && (vma->pfn_end == pfn_end)))
+		vma_shrink(vma, task, pfn_start, pfn_end);
+
+	/* Destroy needed? */
+	else if ((vma->pfn_start >= pfn_start) && (vma->pfn_end <= pfn_end)) {
+		/* NOTE: VMA can't be referred after this point. */
+		vma_destroy(vma, task);
+		vma = 0;
+	} else
+		BUG();
+
+	/* Update actual pointers */
+	*actual = vma;
+	*split = vma_new;
+
+	return 0;
+}
+
+/* Unmaps given address range from its vma. Releases those pages in that vma. */
+int do_munmap(void *vaddr, unsigned long size, struct tcb *task)
+{
+	unsigned long npages = __pfn(size);
+	unsigned long pfn_start = __pfn(vaddr);
+	unsigned long pfn_end = pfn_start + npages;
+	struct vm_area *vma, *vma_new = 0;
+	int err;
+
+	/* Check if any such vma exists */
+	if (!(vma = find_vma((unsigned long)vaddr, &task->vm_area_list)))
+		return -EINVAL;
+
+	/*
+	 * If end of the range is outside of the vma that has the start
+	 * address, we ignore the rest and assume end is the end of that vma.
+	 * TODO: Find out how posix handles this.
+	 */
+	if (pfn_end > vma->pfn_end) {
+		printf("%s: %s: Warning, unmap end 0x%x beyond vma range. "
+		       "Ignoring.\n", __TASKNAME__, __FUNCTION__,
+		       __pfn_to_addr(pfn_end));
+		pfn_end = vma->pfn_end;
+	}
+	if ((err = vma_unmap(&vma, &vma_new, pfn_start, pfn_end, task)) < 0)
+		return err;
+#if 0
+mod_phys_pages:
+
+	/* The stage where the actual pages are unmapped from the page tables */
+pgtable_unmap:
+
+	/* TODO:
+	 * - Find out if the vma is cow, and contains shadow vmas.
+	 * - Remove and free shadow vmas or the real vma, or shrink them if applicable.
+	 * - Free the swap file segment for the vma if vma is private (cow).
+	 * - Reduce refcount for the in-memory pages.
+	 * - If refcount is zero (they could be shared!), either add pages to some page
+	 *   cache, or simpler the better, free the actual pages back to the page allocator.
+	 * - l4_unmap() the corresponding virtual region from the page tables.
+	 */
+#endif
+	return 0;
+}
+
+static struct vm_area *
+is_vma_mergeable(unsigned long pfn_start, unsigned long pfn_end,
+		 unsigned int flags, struct vm_area *vma)
+{
+	/* TODO:
+	 * The swap implementation is too simple for now. The vmas on swap
+	 * are stored non-sequentially, and adjacent vmas don't imply adjacent
+	 * file position on swap. So at the moment merging swappable vmas
+	 * doesn't make sense. But this is going to change in the future.
+	 */
+	if (vma->flags & VMA_COW) {
+		BUG();
+		/* FIXME: XXX: Think about this! */
+	}
+
+	/* Check for vma adjacency */
+	if ((vma->pfn_start == pfn_end) && (vma->flags == flags))
+		return vma;
+	if ((vma->pfn_end == pfn_start) && (vma->flags == flags))
+		return vma;
+
+	return 0;
+}
+
+/*
+ * Finds an unmapped virtual memory area for the given parameters. If it
+ * overlaps with an existing vma, it returns -1, if it is adjacent to an
+ * existing vma and the flags match, it returns the adjacent vma. Otherwise it
+ * returns 0.
+ */
+int find_unmapped_area(struct vm_area **existing, struct vm_file *file,
+		       unsigned long pfn_start, unsigned long npages,
+		       unsigned int flags, struct list_head *vm_area_head)
+{
+	struct vm_area *vma;
+	unsigned long pfn_end = pfn_start + npages;
+	*existing = 0;
+
+	list_for_each_entry(vma, vm_area_head, list) {
+		/* Check overlap */
+		if ((vma->pfn_start <= pfn_start) &&
+		    (pfn_start < vma->pfn_end)) {
+			printf("%s: VMAs overlap.\n", __FUNCTION__);
+			return -1;	/* Overlap */
+		} if ((vma->pfn_start < pfn_end) &&
+		    (pfn_end < vma->pfn_end)) {
+			printf("%s: VMAs overlap.\n", __FUNCTION__);
+			return -1;	/* Overlap */
+		}
+		if (is_vma_mergeable(pfn_start, pfn_end, flags, vma)) {
+			*existing = vma;
+			return 0;
+		}
+	}
+	return 0;
+}
+
+/*
+ * Maps the given file with given flags at the given page offset to the given
+ * task's address space at the specified virtual memory address and length.
+ *
+ * The actual paging in/out of the file from/into memory pages is handled by
+ * the file's pager upon page faults.
+ */
+int do_mmap(struct vm_file *mapfile, unsigned long f_offset, struct tcb *t,
+	    unsigned long map_address, unsigned int flags, unsigned int pages)
+{
+	struct vm_area *vma;
+	unsigned long pfn_start = __pfn(map_address);
+
+	if (!mapfile) {
+	       if (flags & VMA_ANON) {
+			mapfile = &devzero;
+			f_offset = 0;
+	       } else
+			BUG();
+	} else if (pages > (__pfn(page_align_up(mapfile->length)) - f_offset)) {
+		printf("%s: Trying to map %d pages from page %d, "
+		       "but file length is %d\n", __FUNCTION__, pages,
+		       f_offset, __pfn(page_align_up(mapfile->length)));
+		return -EINVAL;
+	}
+
+	printf("%s: Mapping 0x%x - 0x%x\n", __FUNCTION__, map_address,
+	       map_address + pages * PAGE_SIZE);
+
+	/* See if it overlaps or is mergeable to an existing vma. */
+	if (find_unmapped_area(&vma, mapfile, pfn_start, pages, flags,
+			       &t->vm_area_list) < 0)
+		return -EINVAL;	/* Indicates overlap. */
+
+	/* Mergeable vma returned? */
+	if (vma) {
+		if (vma->pfn_end == pfn_start)
+			vma->pfn_end = pfn_start + pages;
+		else {
+			vma->f_offset -= vma->pfn_start - pfn_start;
+
+			/* Check if adjusted yields the original */
+			BUG_ON(vma->f_offset != f_offset);
+			vma->pfn_start = pfn_start;
+		}
+	} else { /* Initialise new area */
+		if (!(vma = vma_new(pfn_start, pages, flags, f_offset,
+				    mapfile)))
+			return -ENOMEM;
+		list_add(&vma->list, &t->vm_area_list);
+	}
+	return 0;
+}
+