bpf: Add percpu allocation support to bpf_mem_alloc.

author Alexei Starovoitov <ast@kernel.org>

Fri, 2 Sep 2022 21:10:52 +0000 (14:10 -0700)

committer Daniel Borkmann <daniel@iogearbox.net>

Mon, 5 Sep 2022 13:33:06 +0000 (15:33 +0200)
author Alexei Starovoitov <ast@kernel.org>
Fri, 2 Sep 2022 21:10:52 +0000 (14:10 -0700)
committer Daniel Borkmann <daniel@iogearbox.net>
Mon, 5 Sep 2022 13:33:06 +0000 (15:33 +0200)
diff --git a/include/linux/bpf_mem_alloc.h b/include/linux/bpf_mem_alloc.h

index 8047330..653ed15 100644 (file)
--- a/include/linux/bpf_mem_alloc.h
+++ b/include/linux/bpf_mem_alloc.h
@@ -12,7 +12,7 @@ struct bpf_mem_alloc {
         struct bpf_mem_cache __percpu *cache;
  };
  
         struct bpf_mem_cache __percpu *cache;
  };
  
-int bpf_mem_alloc_init(struct bpf_mem_alloc *ma, int size);
+int bpf_mem_alloc_init(struct bpf_mem_alloc *ma, int size, bool percpu);
  void bpf_mem_alloc_destroy(struct bpf_mem_alloc *ma);
  
  /* kmalloc/kfree equivalent: */
  void bpf_mem_alloc_destroy(struct bpf_mem_alloc *ma);
  
  /* kmalloc/kfree equivalent: */
diff --git a/kernel/bpf/hashtab.c b/kernel/bpf/hashtab.c

index 0d888a9..70b02ff 100644 (file)
--- a/kernel/bpf/hashtab.c
+++ b/kernel/bpf/hashtab.c
@@ -607,7 +607,7 @@ static struct bpf_map *htab_map_alloc(union bpf_attr *attr)
                                 goto free_prealloc;
                 }
         } else {
                                 goto free_prealloc;
                 }
         } else {
-               err = bpf_mem_alloc_init(&htab->ma, htab->elem_size);
+               err = bpf_mem_alloc_init(&htab->ma, htab->elem_size, false);
                 if (err)
                         goto free_map_locked;
         }
                 if (err)
                         goto free_map_locked;
         }
diff --git a/kernel/bpf/memalloc.c b/kernel/bpf/memalloc.c

index 5d8648a..f7b0778 100644 (file)
--- a/kernel/bpf/memalloc.c
+++ b/kernel/bpf/memalloc.c
@@ -101,6 +101,7 @@ struct bpf_mem_cache {
         /* count of objects in free_llist */
         int free_cnt;
         int low_watermark, high_watermark, batch;
         /* count of objects in free_llist */
         int free_cnt;
         int low_watermark, high_watermark, batch;
+       bool percpu;
  
         struct rcu_head rcu;
         struct llist_head free_by_rcu;
  
         struct rcu_head rcu;
         struct llist_head free_by_rcu;
@@ -133,6 +134,19 @@ static void *__alloc(struct bpf_mem_cache *c, int node)
          */
         gfp_t flags = GFP_NOWAIT | __GFP_NOWARN | __GFP_ACCOUNT;
  
          */
         gfp_t flags = GFP_NOWAIT | __GFP_NOWARN | __GFP_ACCOUNT;
  
+       if (c->percpu) {
+               void **obj = kmem_cache_alloc_node(c->kmem_cache, flags, node);
+               void *pptr = __alloc_percpu_gfp(c->unit_size, 8, flags);
+
+               if (!obj || !pptr) {
+                       free_percpu(pptr);
+                       kfree(obj);
+                       return NULL;
+               }
+               obj[1] = pptr;
+               return obj;
+       }
+
         if (c->kmem_cache)
                 return kmem_cache_alloc_node(c->kmem_cache, flags, node);
  
         if (c->kmem_cache)
                 return kmem_cache_alloc_node(c->kmem_cache, flags, node);
  
@@ -193,6 +207,12 @@ static void alloc_bulk(struct bpf_mem_cache *c, int cnt, int node)
  
  static void free_one(struct bpf_mem_cache *c, void *obj)
  {
  
  static void free_one(struct bpf_mem_cache *c, void *obj)
  {
+       if (c->percpu) {
+               free_percpu(((void **)obj)[1]);
+               kmem_cache_free(c->kmem_cache, obj);
+               return;
+       }
+
         if (c->kmem_cache)
                 kmem_cache_free(c->kmem_cache, obj);
         else
         if (c->kmem_cache)
                 kmem_cache_free(c->kmem_cache, obj);
         else
@@ -332,21 +352,30 @@ static void prefill_mem_cache(struct bpf_mem_cache *c, int cpu)
   * kmalloc/kfree. Max allocation size is 4096 in this case.
   * This is bpf_dynptr and bpf_kptr use case.
   */
   * kmalloc/kfree. Max allocation size is 4096 in this case.
   * This is bpf_dynptr and bpf_kptr use case.
   */
-int bpf_mem_alloc_init(struct bpf_mem_alloc *ma, int size)
+int bpf_mem_alloc_init(struct bpf_mem_alloc *ma, int size, bool percpu)
  {
         static u16 sizes[NUM_CACHES] = {96, 192, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096};
         struct bpf_mem_caches *cc, __percpu *pcc;
         struct bpf_mem_cache *c, __percpu *pc;
  {
         static u16 sizes[NUM_CACHES] = {96, 192, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096};
         struct bpf_mem_caches *cc, __percpu *pcc;
         struct bpf_mem_cache *c, __percpu *pc;
-       struct kmem_cache *kmem_cache;
+       struct kmem_cache *kmem_cache = NULL;
         struct obj_cgroup *objcg = NULL;
         char buf[32];
         struct obj_cgroup *objcg = NULL;
         char buf[32];
-       int cpu, i;
+       int cpu, i, unit_size;
  
         if (size) {
                 pc = __alloc_percpu_gfp(sizeof(*pc), 8, GFP_KERNEL);
                 if (!pc)
                         return -ENOMEM;
  
         if (size) {
                 pc = __alloc_percpu_gfp(sizeof(*pc), 8, GFP_KERNEL);
                 if (!pc)
                         return -ENOMEM;
-               size += LLIST_NODE_SZ; /* room for llist_node */
+
+               if (percpu) {
+                       unit_size = size;
+                       /* room for llist_node and per-cpu pointer */
+                       size = LLIST_NODE_SZ + sizeof(void *);
+               } else {
+                       size += LLIST_NODE_SZ; /* room for llist_node */
+                       unit_size = size;
+               }
+
                 snprintf(buf, sizeof(buf), "bpf-%u", size);
                 kmem_cache = kmem_cache_create(buf, size, 8, 0, NULL);
                 if (!kmem_cache) {
                 snprintf(buf, sizeof(buf), "bpf-%u", size);
                 kmem_cache = kmem_cache_create(buf, size, 8, 0, NULL);
                 if (!kmem_cache) {
@@ -359,14 +388,19 @@ int bpf_mem_alloc_init(struct bpf_mem_alloc *ma, int size)
                 for_each_possible_cpu(cpu) {
                         c = per_cpu_ptr(pc, cpu);
                         c->kmem_cache = kmem_cache;
                 for_each_possible_cpu(cpu) {
                         c = per_cpu_ptr(pc, cpu);
                         c->kmem_cache = kmem_cache;
-                       c->unit_size = size;
+                       c->unit_size = unit_size;
                         c->objcg = objcg;
                         c->objcg = objcg;
+                       c->percpu = percpu;
                         prefill_mem_cache(c, cpu);
                 }
                 ma->cache = pc;
                 return 0;
         }
  
                         prefill_mem_cache(c, cpu);
                 }
                 ma->cache = pc;
                 return 0;
         }
  
+       /* size == 0 && percpu is an invalid combination */
+       if (WARN_ON_ONCE(percpu))
+               return -EINVAL;
+
         pcc = __alloc_percpu_gfp(sizeof(*cc), 8, GFP_KERNEL);
         if (!pcc)
                 return -ENOMEM;
         pcc = __alloc_percpu_gfp(sizeof(*cc), 8, GFP_KERNEL);
         if (!pcc)
                 return -ENOMEM;
author	Alexei Starovoitov <ast@kernel.org>
	Fri, 2 Sep 2022 21:10:52 +0000 (14:10 -0700)
committer	Daniel Borkmann <daniel@iogearbox.net>
	Mon, 5 Sep 2022 13:33:06 +0000 (15:33 +0200)
include/linux/bpf_mem_alloc.h		patch \| blob \| history
kernel/bpf/hashtab.c		patch \| blob \| history
kernel/bpf/memalloc.c		patch \| blob \| history