author		David Gwynne <dlg@cvs.openbsd.org>	2016-11-02 01:20:51 +0000
committer	David Gwynne <dlg@cvs.openbsd.org>	2016-11-02 01:20:51 +0000
commit		b19b3325d78a93eae4cf0265baaa6d4e72277a6e (patch)
tree		f637f80d74ab5e50b4376fdf8710c55f7152dcb4	/sys/kern/subr_pool.c
parent		ca449bdf3cb10151cb206d94772339a4578284b5 (diff)
add per cpu caches for free pool items.
this is modelled on what's described in the "Magazines and Vmem: Extending the Slab Allocator to Many CPUs and Arbitrary Resources" paper by Jeff Bonwick and Jonathan Adams.

the main semantic borrowed from the paper is the use of two lists of free pool items on each cpu, and only moving one of the lists in and out of a global depot of free lists to mitigate a cpu thrashing against that global depot.

unlike slabs, pools do not maintain or cache constructed items, which allows us to use the items themselves to build the free list rather than having to allocate arrays to point at constructed pool items.

the per cpu caches are built on top of the cpumem api.

this has been kicked a bit by hrvoje popovski and simon mages (thank you). i'm putting it in now so it is easier to work on and test.

ok jmatthew@
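for illustration only (not part of the commit): a minimal single-threaded userland sketch of the two-list idea described above. freed items carry the list linkage themselves, the active list fills up to a fixed number of entries, and when it is full the previous list is retired (here simply freed, standing in for handing it to the global depot) and the active list takes its place. all names in this sketch (free_item, cpu_cache, cache_get, cache_put, CACHE_ITEMS) are invented for the example.

	/*
	 * illustrative sketch only, not from the commit: one cpu's pair of
	 * free lists, modelled in userland.
	 */
	#include <stdio.h>
	#include <stdlib.h>

	#define CACHE_ITEMS 8			/* mirrors pr_cache_items above */

	struct free_item {			/* overlaid on a freed item */
		struct free_item *next;
		unsigned long nitems;		/* list length, stored at the head */
	};

	struct cpu_cache {
		struct free_item *actv;		/* list being filled/drained */
		unsigned long nactv;
		struct free_item *prev;		/* last full list, kept around */
	};

	static void
	cache_put(struct cpu_cache *cc, void *v)
	{
		struct free_item *fi = v;
		struct free_item *n;

		if (cc->nactv >= CACHE_ITEMS) {
			/* active list is full; retire prev (a stand-in for the
			 * global depot) and demote actv to prev */
			while (cc->prev != NULL) {
				n = cc->prev->next;
				free(cc->prev);
				cc->prev = n;
			}
			cc->prev = cc->actv;
			cc->actv = NULL;
			cc->nactv = 0;
		}

		fi->next = cc->actv;
		fi->nitems = ++cc->nactv;	/* head always knows the length */
		cc->actv = fi;
	}

	static void *
	cache_get(struct cpu_cache *cc)
	{
		struct free_item *fi;

		if (cc->actv != NULL)
			fi = cc->actv;
		else if (cc->prev != NULL) {
			fi = cc->prev;		/* fall back to the previous list */
			cc->prev = NULL;
		} else
			return (NULL);		/* would go to the pool proper */

		cc->actv = fi->next;
		cc->nactv = fi->nitems - 1;
		return (fi);
	}

	int
	main(void)
	{
		struct cpu_cache cc = { NULL, 0, NULL };
		void *v;
		int i;

		for (i = 0; i < 20; i++)
			cache_put(&cc, malloc(64));
		while ((v = cache_get(&cc)) != NULL)
			free(v);
		printf("cache drained\n");
		return (0);
	}

the kernel code in the diff below does the same thing per cpu via the cpumem api, protects the shared depot with pr_cache_mtx, and bumps pc_gen around each operation so pool_cache_info() can read the counters without taking that mutex.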
Diffstat (limited to 'sys/kern/subr_pool.c')
-rw-r--r--	sys/kern/subr_pool.c	317
1 files changed, 316 insertions, 1 deletions
diff --git a/sys/kern/subr_pool.c b/sys/kern/subr_pool.c
index 95197120db1..546589f69ce 100644
--- a/sys/kern/subr_pool.c
+++ b/sys/kern/subr_pool.c
@@ -1,4 +1,4 @@
-/* $OpenBSD: subr_pool.c,v 1.198 2016/09/15 02:00:16 dlg Exp $ */
+/* $OpenBSD: subr_pool.c,v 1.199 2016/11/02 01:20:50 dlg Exp $ */
/* $NetBSD: subr_pool.c,v 1.61 2001/09/26 07:14:56 chs Exp $ */
/*-
@@ -42,6 +42,7 @@
#include <sys/sysctl.h>
#include <sys/task.h>
#include <sys/timeout.h>
+#include <sys/percpu.h>
#include <uvm/uvm_extern.h>
@@ -96,6 +97,33 @@ struct pool_item {
};
#define POOL_IMAGIC(ph, pi) ((u_long)(pi) ^ (ph)->ph_magic)
+#ifdef MULTIPROCESSOR
+struct pool_list {
+ struct pool_list *pl_next; /* next in list */
+ unsigned long pl_cookie;
+ struct pool_list *pl_nextl; /* next list */
+ unsigned long pl_nitems; /* items in list */
+};
+
+struct pool_cache {
+ struct pool_list *pc_actv;
+ unsigned long pc_nactv; /* cache pc_actv nitems */
+ struct pool_list *pc_prev;
+
+ uint64_t pc_gen; /* generation number */
+ uint64_t pc_gets;
+ uint64_t pc_puts;
+ uint64_t pc_fails;
+
+ int pc_nout;
+};
+
+void *pool_cache_get(struct pool *);
+void pool_cache_put(struct pool *, void *);
+void pool_cache_destroy(struct pool *);
+#endif
+void pool_cache_info(struct pool *, struct kinfo_pool *);
+
#ifdef POOL_DEBUG
int pool_debug = 1;
#else
@@ -355,6 +383,11 @@ pool_destroy(struct pool *pp)
struct pool_item_header *ph;
struct pool *prev, *iter;
+#ifdef MULTIPROCESSOR
+ if (pp->pr_cache != NULL)
+ pool_cache_destroy(pp);
+#endif
+
#ifdef DIAGNOSTIC
if (pp->pr_nout != 0)
panic("%s: pool busy: still out: %u", __func__, pp->pr_nout);
@@ -421,6 +454,14 @@ pool_get(struct pool *pp, int flags)
void *v = NULL;
int slowdown = 0;
+#ifdef MULTIPROCESSOR
+ if (pp->pr_cache != NULL) {
+ v = pool_cache_get(pp);
+ if (v != NULL)
+ goto good;
+ }
+#endif
+
KASSERT(flags & (PR_WAITOK | PR_NOWAIT));
mtx_enter(&pp->pr_mtx);
@@ -453,6 +494,9 @@ pool_get(struct pool *pp, int flags)
v = mem.v;
}
+#ifdef MULTIPROCESSOR
+good:
+#endif
if (ISSET(flags, PR_ZERO))
memset(v, 0, pp->pr_size);
@@ -631,6 +675,13 @@ pool_put(struct pool *pp, void *v)
panic("%s: NULL item", __func__);
#endif
+#ifdef MULTIPROCESSOR
+ if (pp->pr_cache != NULL && TAILQ_EMPTY(&pp->pr_requests)) {
+ pool_cache_put(pp, v);
+ return;
+ }
+#endif
+
mtx_enter(&pp->pr_mtx);
splassert(pp->pr_ipl);
@@ -1333,6 +1384,8 @@ sysctl_dopool(int *name, u_int namelen, char *oldp, size_t *oldlenp)
pi.pr_nidle = pp->pr_nidle;
mtx_leave(&pp->pr_mtx);
+ pool_cache_info(pp, &pi);
+
rv = sysctl_rdstruct(oldp, oldlenp, NULL, &pi, sizeof(pi));
break;
}
@@ -1499,3 +1552,265 @@ pool_multi_free_ni(struct pool *pp, void *v)
km_free(v, pp->pr_pgsize, &kv, pp->pr_crange);
KERNEL_UNLOCK();
}
+
+#ifdef MULTIPROCESSOR
+
+struct pool pool_caches; /* per cpu cache entries */
+
+void
+pool_cache_init(struct pool *pp)
+{
+ struct cpumem *cm;
+ struct pool_cache *pc;
+ struct cpumem_iter i;
+
+ if (pool_caches.pr_size == 0) {
+ pool_init(&pool_caches, sizeof(struct pool_cache), 64,
+ IPL_NONE, PR_WAITOK, "plcache", NULL);
+ }
+
+ KASSERT(pp->pr_size >= sizeof(*pc));
+
+ cm = cpumem_get(&pool_caches);
+
+ mtx_init(&pp->pr_cache_mtx, pp->pr_ipl);
+ pp->pr_cache_list = NULL;
+ pp->pr_cache_nlist = 0;
+ pp->pr_cache_items = 8;
+ pp->pr_cache_contention = 0;
+
+ CPUMEM_FOREACH(pc, &i, cm) {
+ pc->pc_actv = NULL;
+ pc->pc_nactv = 0;
+ pc->pc_prev = NULL;
+
+ pc->pc_gets = 0;
+ pc->pc_puts = 0;
+ pc->pc_fails = 0;
+ pc->pc_nout = 0;
+ }
+
+ pp->pr_cache = cm;
+}
+
+static inline void
+pool_list_enter(struct pool *pp)
+{
+ if (mtx_enter_try(&pp->pr_cache_mtx) == 0) {
+ mtx_enter(&pp->pr_cache_mtx);
+ pp->pr_cache_contention++;
+ }
+}
+
+static inline void
+pool_list_leave(struct pool *pp)
+{
+ mtx_leave(&pp->pr_cache_mtx);
+}
+
+static inline struct pool_list *
+pool_list_alloc(struct pool *pp, struct pool_cache *pc)
+{
+ struct pool_list *pl;
+
+ pool_list_enter(pp);
+ pl = pp->pr_cache_list;
+ if (pl != NULL) {
+ pp->pr_cache_list = pl->pl_nextl;
+ pp->pr_cache_nlist--;
+ }
+
+ pp->pr_cache_nout += pc->pc_nout;
+ pc->pc_nout = 0;
+ pool_list_leave(pp);
+
+ return (pl);
+}
+
+static inline void
+pool_list_free(struct pool *pp, struct pool_cache *pc, struct pool_list *pl)
+{
+ pool_list_enter(pp);
+ pl->pl_nextl = pp->pr_cache_list;
+ pp->pr_cache_list = pl;
+ pp->pr_cache_nlist++;
+
+ pp->pr_cache_nout += pc->pc_nout;
+ pc->pc_nout = 0;
+ pool_list_leave(pp);
+}
+
+static inline struct pool_cache *
+pool_cache_enter(struct pool *pp, int *s)
+{
+ struct pool_cache *pc;
+
+ pc = cpumem_enter(pp->pr_cache);
+ *s = splraise(pp->pr_ipl);
+ pc->pc_gen++;
+
+ return (pc);
+}
+
+static inline void
+pool_cache_leave(struct pool *pp, struct pool_cache *pc, int s)
+{
+ pc->pc_gen++;
+ splx(s);
+ cpumem_leave(pp->pr_cache, pc);
+}
+
+void *
+pool_cache_get(struct pool *pp)
+{
+ struct pool_cache *pc;
+ struct pool_list *pl;
+ int s;
+
+ pc = pool_cache_enter(pp, &s);
+
+ if (pc->pc_actv != NULL) {
+ pl = pc->pc_actv;
+ } else if (pc->pc_prev != NULL) {
+ pl = pc->pc_prev;
+ pc->pc_prev = NULL;
+ } else if ((pl = pool_list_alloc(pp, pc)) == NULL) {
+ pc->pc_fails++;
+ goto done;
+ }
+
+ pc->pc_actv = pl->pl_next;
+ pc->pc_nactv = pl->pl_nitems - 1;
+ pc->pc_gets++;
+ pc->pc_nout++;
+done:
+ pool_cache_leave(pp, pc, s);
+
+ return (pl);
+}
+
+void
+pool_cache_put(struct pool *pp, void *v)
+{
+ struct pool_cache *pc;
+ struct pool_list *pl = v;
+ unsigned long cache_items = pp->pr_cache_items;
+ unsigned long nitems;
+ int s;
+
+ pc = pool_cache_enter(pp, &s);
+
+ nitems = pc->pc_nactv;
+ if (nitems >= cache_items) {
+ if (pc->pc_prev != NULL)
+ pool_list_free(pp, pc, pc->pc_prev);
+
+ pc->pc_prev = pc->pc_actv;
+
+ pc->pc_actv = NULL;
+ pc->pc_nactv = 0;
+ nitems = 0;
+ }
+
+ pl->pl_next = pc->pc_actv;
+ pl->pl_nitems = ++nitems;
+
+ pc->pc_actv = pl;
+ pc->pc_nactv = nitems;
+
+ pc->pc_puts++;
+ pc->pc_nout--;
+
+ pool_cache_leave(pp, pc, s);
+}
+
+struct pool_list *
+pool_list_put(struct pool *pp, struct pool_list *pl)
+{
+ struct pool_list *rpl, *npl;
+
+ if (pl == NULL)
+ return (NULL);
+
+ rpl = (struct pool_list *)pl->pl_next;
+
+ do {
+ npl = pl->pl_next;
+ pool_put(pp, pl);
+ pl = npl;
+ } while (pl != NULL);
+
+ return (rpl);
+}
+
+void
+pool_cache_destroy(struct pool *pp)
+{
+ struct pool_cache *pc;
+ struct pool_list *pl;
+ struct cpumem_iter i;
+ struct cpumem *cm;
+
+ cm = pp->pr_cache;
+ pp->pr_cache = NULL; /* make pool_put avoid the cache */
+
+ CPUMEM_FOREACH(pc, &i, cm) {
+ pool_list_put(pp, pc->pc_actv);
+ pool_list_put(pp, pc->pc_prev);
+ }
+
+ cpumem_put(&pool_caches, cm);
+
+ pl = pp->pr_cache_list;
+ while (pl != NULL)
+ pl = pool_list_put(pp, pl);
+}
+
+void
+pool_cache_info(struct pool *pp, struct kinfo_pool *pi)
+{
+ struct pool_cache *pc;
+ struct cpumem_iter i;
+
+ if (pp->pr_cache == NULL)
+ return;
+
+ /* loop through the caches twice to collect stats */
+
+ /* once without the mtx so we can yield while reading nget/nput */
+ CPUMEM_FOREACH(pc, &i, pp->pr_cache) {
+ uint64_t gen, nget, nput;
+
+ do {
+ while ((gen = pc->pc_gen) & 1)
+ yield();
+
+ nget = pc->pc_gets;
+ nput = pc->pc_puts;
+ } while (gen != pc->pc_gen);
+
+ pi->pr_nget += nget;
+ pi->pr_nput += nput;
+ }
+
+ /* and once with the mtx so we can get consistent nout values */
+ mtx_enter(&pp->pr_cache_mtx);
+ CPUMEM_FOREACH(pc, &i, pp->pr_cache)
+ pi->pr_nout += pc->pc_nout;
+
+ pi->pr_nout += pp->pr_cache_nout;
+ mtx_leave(&pp->pr_cache_mtx);
+}
+#else /* MULTIPROCESSOR */
+void
+pool_cache_init(struct pool *pp)
+{
+ /* nop */
+}
+
+void
+pool_cache_info(struct pool *pp, struct kinfo_pool *pi)
+{
+ /* nop */
+}
+#endif /* MULTIPROCESSOR */
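
for context, a hypothetical consumer of the interface added above. the subsystem, item type, pool name, ipl and wait flags here (struct example, examplepl, "example", IPL_NET, PR_NOWAIT) are all invented; only pool_init(), pool_cache_init(), pool_get() and pool_put() come from the code in this commit, and pool_init()'s argument order follows the pool_caches call in pool_cache_init() above. a kernel subsystem initialises its pool as before and opts in to the per-cpu free lists with pool_cache_init(); pool_get() and pool_put() then transparently prefer the local cpu's lists.

	/* hypothetical consumer, sketched against the interface added above */
	#include <sys/param.h>
	#include <sys/pool.h>

	struct example {			/* invented item type; large enough
						 * to hold the free list linkage */
		int e_id;
		char e_data[124];
	};

	struct pool examplepl;			/* invented pool */

	void
	example_init(void)
	{
		pool_init(&examplepl, sizeof(struct example), 0, IPL_NET,
		    PR_WAITOK, "example", NULL);
		pool_cache_init(&examplepl);	/* enable the per-cpu free lists */
	}

	struct example *
	example_get(void)
	{
		/* served from this cpu's cache when it has free items */
		return (pool_get(&examplepl, PR_NOWAIT | PR_ZERO));
	}

	void
	example_put(struct example *ex)
	{
		/* goes back onto this cpu's active list when caching is on */
		pool_put(&examplepl, ex);
	}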