| author | Owain Ainsworth <oga@cvs.openbsd.org> | 2009-06-02 23:00:20 +0000 |
|---|---|---|
| committer | Owain Ainsworth <oga@cvs.openbsd.org> | 2009-06-02 23:00:20 +0000 |
| commit | 6e1481035fcdd30fd7cc0e2650ad2e51cabb8d9d (patch) | |
| tree | c0a17586063eb7ab1d1f02beb45592aa9705ab6c /sys/uvm/uvm_page.c | |
| parent | a35c336f9ebdea1410b999c9869e68c40354c1e3 (diff) | |
Instead of the global hash table with the terrible hash function and a
global lock, switch the uvm object pages to being kept in a per-object
RB_TREE. Right now this is approximately the same speed, but cleaner.
When biglock usage is reduced, this will improve concurrency by removing
contention on the global hash lock.
ok beck@ art@. Thanks to jasper for the speed testing.
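For readers who want to see the `<sys/tree.h>` pattern the diff below adopts, here is a minimal, self-contained userspace sketch. It is an illustration only, not the kernel code: `struct page`, `page_tree`, `page_cmp`, and the 4 KB offsets are hypothetical stand-ins for `vm_page`, `uobj_pgs`, and `uvm_pagecmp`, and it assumes `<sys/tree.h>` as shipped on the BSDs (available through libbsd elsewhere).

```c
#include <sys/tree.h>
#include <stdio.h>
#include <stdlib.h>

/* Illustrative stand-in for vm_page: keyed by its offset in the object. */
struct page {
	RB_ENTRY(page)	entry;		/* tree linkage, like fq.queues.tree */
	unsigned long	offset;		/* lookup key, like pg->offset */
};

/* Same -1/0/1 comparison idiom as uvm_pagecmp() in the diff below. */
static int
page_cmp(struct page *a, struct page *b)
{
	return (a->offset < b->offset ? -1 : a->offset > b->offset);
}

/* One tree per object replaces the single global hash + hashlock. */
RB_HEAD(page_tree, page);
RB_PROTOTYPE(page_tree, page, entry, page_cmp)
RB_GENERATE(page_tree, page, entry, page_cmp)

int
main(void)
{
	struct page_tree memt = RB_INITIALIZER(&memt);	/* like uobj->memt */
	struct page *pg, key;
	unsigned long i;

	/* Insert pages keyed by offset, as uvm_pageinsert() now does. */
	for (i = 0; i < 4; i++) {
		if ((pg = calloc(1, sizeof(*pg))) == NULL)
			return (1);
		pg->offset = i * 4096;
		RB_INSERT(page_tree, &memt, pg);
	}

	/*
	 * Look up with a dummy element on the stack that has only its
	 * key field filled in; uvm_pagelookup() uses the same trick.
	 */
	key.offset = 2 * 4096;
	pg = RB_FIND(page_tree, &memt, &key);
	printf("offset %#lx: %s\n", key.offset, pg ? "found" : "missing");
	return (0);
}
```

Note that the comparison function returns strictly -1, 0, or 1 (`a->offset > b->offset` evaluates to 0 when the offsets are equal), which is all RB_FIND needs; lookup becomes O(log n) within one object instead of a hash-bucket scan under a global mutex.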
Diffstat (limited to 'sys/uvm/uvm_page.c')
-rw-r--r--  sys/uvm/uvm_page.c | 162

1 file changed, 17 insertions, 145 deletions
diff --git a/sys/uvm/uvm_page.c b/sys/uvm/uvm_page.c
index 47e7c91582f..76ba5b1fe45 100644
--- a/sys/uvm/uvm_page.c
+++ b/sys/uvm/uvm_page.c
@@ -1,4 +1,4 @@
-/*	$OpenBSD: uvm_page.c,v 1.83 2009/06/02 19:49:08 ariane Exp $	*/
+/*	$OpenBSD: uvm_page.c,v 1.84 2009/06/02 23:00:19 oga Exp $	*/
 /*	$NetBSD: uvm_page.c,v 1.44 2000/11/27 08:40:04 chs Exp $	*/
 
 /*
@@ -118,14 +118,6 @@ static vaddr_t virtual_space_start;
 static vaddr_t virtual_space_end;
 
 /*
- * we use a hash table with only one bucket during bootup. we will
- * later rehash (resize) the hash table once the allocator is ready.
- * we static allocate the one bootstrap bucket below...
- */
-
-static struct pglist uvm_bootbucket;
-
-/*
  * History
  */
 UVMHIST_DECL(pghist);
@@ -142,7 +134,7 @@ static void uvm_pageremove(struct vm_page *);
  */
 
 /*
- * uvm_pageinsert: insert a page in the object and the hash table
+ * uvm_pageinsert: insert a page in the object
  *
  * => caller must lock object
  * => caller must lock page queues
@@ -153,23 +145,17 @@ static void uvm_pageremove(struct vm_page *);
 __inline static void
 uvm_pageinsert(struct vm_page *pg)
 {
-	struct pglist *buck;
 	UVMHIST_FUNC("uvm_pageinsert"); UVMHIST_CALLED(pghist);
 
 	KASSERT((pg->pg_flags & PG_TABLED) == 0);
-	mtx_enter(&uvm.hashlock);
-	buck = &uvm.page_hash[uvm_pagehash(pg->uobject,pg->offset)];
-	TAILQ_INSERT_TAIL(buck, pg, fq.queues.hashq);	/* put in hash */
-	mtx_leave(&uvm.hashlock);
 
-	TAILQ_INSERT_TAIL(&pg->uobject->memq, pg,
-	    fq.queues.listq);	/* put in object */
+	RB_INSERT(uobj_pgs, &pg->uobject->memt, pg);
 	atomic_setbits_int(&pg->pg_flags, PG_TABLED);
 	pg->uobject->uo_npages++;
 }
 
 /*
- * uvm_page_remove: remove page from object and hash
+ * uvm_page_remove: remove page from object
  *
  * => caller must lock object
  * => caller must lock page queues
@@ -178,23 +164,11 @@ uvm_pageinsert(struct vm_page *pg)
 static __inline void
 uvm_pageremove(struct vm_page *pg)
 {
-	struct pglist *buck;
 	UVMHIST_FUNC("uvm_pageremove"); UVMHIST_CALLED(pghist);
 
 	KASSERT(pg->pg_flags & PG_TABLED);
-	mtx_enter(&uvm.hashlock);
-	buck = &uvm.page_hash[uvm_pagehash(pg->uobject,pg->offset)];
-	TAILQ_REMOVE(buck, pg, fq.queues.hashq);
-	mtx_leave(&uvm.hashlock);
 
-#ifdef UBC
-	if (pg->uobject->pgops == &uvm_vnodeops) {
-		uvm_pgcnt_vnode--;
-	}
-#endif
-
-	/* object should be locked */
-	TAILQ_REMOVE(&pg->uobject->memq, pg, fq.queues.listq);
+	RB_REMOVE(uobj_pgs, &pg->uobject->memt, pg);
 
 	atomic_clearbits_int(&pg->pg_flags, PG_TABLED|PQ_AOBJ);
 	pg->uobject->uo_npages--;
@@ -202,6 +176,14 @@ uvm_pageremove(struct vm_page *pg)
 	pg->pg_version++;
 }
 
+int
+uvm_pagecmp(struct vm_page *a, struct vm_page *b)
+{
+	return (a->offset < b->offset ? -1 : a->offset > b->offset);
+}
+
+RB_GENERATE(uobj_pgs, vm_page, fq.queues.tree, uvm_pagecmp);
+
 /*
  * uvm_page_init: init the page system. called from uvm_init().
  *
@@ -234,18 +216,6 @@ uvm_page_init(vaddr_t *kvm_startp, vaddr_t *kvm_endp)
 	mtx_init(&uvm.fpageqlock, IPL_VM);
 	uvm_pmr_init();
 
-	/*
-	 * init the <obj,offset> => <page> hash table.  for now
-	 * we just have one bucket (the bootstrap bucket).  later on we
-	 * will allocate new buckets as we dynamically resize the hash table.
-	 */
-
-	uvm.page_nhash = 1;			/* 1 bucket */
-	uvm.page_hashmask = 0;			/* mask for hash function */
-	uvm.page_hash = &uvm_bootbucket;	/* install bootstrap bucket */
-	TAILQ_INIT(uvm.page_hash);		/* init hash table */
-	mtx_init(&uvm.hashlock, IPL_VM);	/* init hash table lock */
-
 	/*
 	 * allocate vm_page structures.
 	 */
@@ -743,97 +713,9 @@ uvm_page_physload(paddr_t start, paddr_t end, paddr_t avail_start,
 	 * done!
 	 */
-	if (!preload)
-		uvm_page_rehash();
-
-	return;
-}
-
-/*
- * uvm_page_rehash: reallocate hash table based on number of free pages.
- */
-
-void
-uvm_page_rehash(void)
-{
-	int freepages, lcv, bucketcount, oldcount;
-	struct pglist *newbuckets, *oldbuckets;
-	struct vm_page *pg;
-	size_t newsize, oldsize;
-
-	/*
-	 * compute number of pages that can go in the free pool
-	 */
-
-	freepages = 0;
-	for (lcv = 0 ; lcv < vm_nphysseg ; lcv++)
-		freepages +=
-		    (vm_physmem[lcv].avail_end - vm_physmem[lcv].avail_start);
-
-	/*
-	 * compute number of buckets needed for this number of pages
-	 */
-
-	bucketcount = 1;
-	while (bucketcount < freepages)
-		bucketcount = bucketcount * 2;
-
-	/*
-	 * compute the size of the current table and new table.
-	 */
-
-	oldbuckets = uvm.page_hash;
-	oldcount = uvm.page_nhash;
-	oldsize = round_page(sizeof(struct pglist) * oldcount);
-	newsize = round_page(sizeof(struct pglist) * bucketcount);
-
-	/*
-	 * allocate the new buckets
-	 */
-
-	newbuckets = (struct pglist *) uvm_km_alloc(kernel_map, newsize);
-	if (newbuckets == NULL) {
-		printf("uvm_page_physrehash: WARNING: could not grow page "
-		    "hash table\n");
-		return;
-	}
-	for (lcv = 0 ; lcv < bucketcount ; lcv++)
-		TAILQ_INIT(&newbuckets[lcv]);
-
-	/*
-	 * now replace the old buckets with the new ones and rehash everything
-	 */
-
-	mtx_enter(&uvm.hashlock);
-	uvm.page_hash = newbuckets;
-	uvm.page_nhash = bucketcount;
-	uvm.page_hashmask = bucketcount - 1;	/* power of 2 */
-
-	/* ... and rehash */
-	for (lcv = 0 ; lcv < oldcount ; lcv++) {
-		while ((pg = TAILQ_FIRST(&oldbuckets[lcv])) != NULL) {
-			TAILQ_REMOVE(&oldbuckets[lcv], pg, fq.queues.hashq);
-			TAILQ_INSERT_TAIL(
-			    &uvm.page_hash[uvm_pagehash(pg->uobject, pg->offset)],
-			    pg, fq.queues.hashq);
-		}
-	}
-	mtx_leave(&uvm.hashlock);
-
-	/*
-	 * free old bucket array if is not the boot-time table
-	 */
-
-	if (oldbuckets != &uvm_bootbucket)
-		uvm_km_free(kernel_map, (vaddr_t) oldbuckets, oldsize);
-
-	/*
-	 * done
-	 */
-
 	return;
 }
-
 #ifdef DDB /* XXXCDC: TMP TMP TMP DEBUG DEBUG DEBUG */
 
 void uvm_page_physdump(void); /* SHUT UP GCC */

@@ -859,7 +741,6 @@ uvm_page_physdump(void)
 	case VM_PSTRAT_BIGFIRST: printf("BIGFIRST\n"); break;
 	default: printf("<<UNKNOWN>>!!!!\n");
 	}
-	printf("number of buckets = %d\n", uvm.page_nhash);
 }
 #endif

@@ -1002,7 +883,7 @@ uvm_pagerealloc(struct vm_page *pg, struct uvm_object *newobj, voff_t newoff)
 /*
  * uvm_pagefree: free page
  *
- * => erase page's identity (i.e. remove from hash/object)
+ * => erase page's identity (i.e. remove from object)
  * => put page on free list
  * => caller must lock owning object (either anon or uvm_object)
 * => caller must lock page queues
@@ -1400,19 +1281,10 @@ PHYS_TO_VM_PAGE(paddr_t pa)
 struct vm_page *
 uvm_pagelookup(struct uvm_object *obj, voff_t off)
 {
-	struct vm_page *pg;
-	struct pglist *buck;
-
-	mtx_enter(&uvm.hashlock);
-	buck = &uvm.page_hash[uvm_pagehash(obj,off)];
+	struct vm_page find;
 
-	TAILQ_FOREACH(pg, buck, fq.queues.hashq) {
-		if (pg->uobject == obj && pg->offset == off) {
-			break;
-		}
-	}
-	mtx_leave(&uvm.hashlock);
-	return(pg);
+	find.offset = off;
+	return (RB_FIND(uobj_pgs, &obj->memt, &find));
 }
 
 /*