bpf: Switch bpf_map ref counter to atomic64_t so bpf_map_inc() never fails

author Andrii Nakryiko <andriin@fb.com>
Sun, 17 Nov 2019 17:28:02 +0000 (09:28 -0800)

committer Daniel Borkmann <daniel@iogearbox.net>
Mon, 18 Nov 2019 10:41:59 +0000 (11:41 +0100)

diff --git a/drivers/net/ethernet/netronome/nfp/bpf/offload.c b/drivers/net/ethernet/netronome/nfp/bpf/offload.c

index 88fab6a..06927ba 100644 (file)
--- a/drivers/net/ethernet/netronome/nfp/bpf/offload.c
+++ b/drivers/net/ethernet/netronome/nfp/bpf/offload.c
@@ -46,9 +46,7 @@ nfp_map_ptr_record(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog,
         /* Grab a single ref to the map for our record.  The prog destroy ndo
          * happens after free_used_maps().
          */
-       map = bpf_map_inc(map, false);
-       if (IS_ERR(map))
-               return PTR_ERR(map);
+       bpf_map_inc(map);
  
         record = kmalloc(sizeof(*record), GFP_KERNEL);
         if (!record) {
diff --git a/include/linux/bpf.h b/include/linux/bpf.h

index 5b81cde..34a3444 100644 (file)
--- a/include/linux/bpf.h
+++ b/include/linux/bpf.h
@@ -103,8 +103,8 @@ struct bpf_map {
         /* The 3rd and 4th cacheline with misc members to avoid false sharing
          * particularly with refcounting.
          */
-       atomic_t refcnt ____cacheline_aligned;
-       atomic_t usercnt;
+       atomic64_t refcnt ____cacheline_aligned;
+       atomic64_t usercnt;
         struct work_struct work;
         char name[BPF_OBJ_NAME_LEN];
  };
@@ -783,9 +783,9 @@ void bpf_map_free_id(struct bpf_map *map, bool do_idr_lock);
  
  struct bpf_map *bpf_map_get_with_uref(u32 ufd);
  struct bpf_map *__bpf_map_get(struct fd f);
-struct bpf_map * __must_check bpf_map_inc(struct bpf_map *map, bool uref);
-struct bpf_map * __must_check bpf_map_inc_not_zero(struct bpf_map *map,
-                                                  bool uref);
+void bpf_map_inc(struct bpf_map *map);
+void bpf_map_inc_with_uref(struct bpf_map *map);
+struct bpf_map * __must_check bpf_map_inc_not_zero(struct bpf_map *map);
  void bpf_map_put_with_uref(struct bpf_map *map);
  void bpf_map_put(struct bpf_map *map);
  int bpf_map_charge_memlock(struct bpf_map *map, u32 pages);
diff --git a/kernel/bpf/inode.c b/kernel/bpf/inode.c

index a70f720..2f17f24 100644 (file)
--- a/kernel/bpf/inode.c
+++ b/kernel/bpf/inode.c
@@ -34,7 +34,7 @@ static void *bpf_any_get(void *raw, enum bpf_type type)
                 raw = bpf_prog_inc(raw);
                 break;
         case BPF_TYPE_MAP:
-               raw = bpf_map_inc(raw, true);
+               bpf_map_inc_with_uref(raw);
                 break;
         default:
                 WARN_ON_ONCE(1);
diff --git a/kernel/bpf/map_in_map.c b/kernel/bpf/map_in_map.c

index fab4fb1..4cbe987 100644 (file)
--- a/kernel/bpf/map_in_map.c
+++ b/kernel/bpf/map_in_map.c
@@ -98,7 +98,7 @@ void *bpf_map_fd_get_ptr(struct bpf_map *map,
                 return inner_map;
  
         if (bpf_map_meta_equal(map->inner_map_meta, inner_map))
-               inner_map = bpf_map_inc(inner_map, false);
+               bpf_map_inc(inner_map);
         else
                 inner_map = ERR_PTR(-EINVAL);
  
diff --git a/kernel/bpf/syscall.c b/kernel/bpf/syscall.c

index c88c815..2003075 100644 (file)
--- a/kernel/bpf/syscall.c
+++ b/kernel/bpf/syscall.c
@@ -311,7 +311,7 @@ static void bpf_map_free_deferred(struct work_struct *work)
  
  static void bpf_map_put_uref(struct bpf_map *map)
  {
-       if (atomic_dec_and_test(&map->usercnt)) {
+       if (atomic64_dec_and_test(&map->usercnt)) {
                 if (map->ops->map_release_uref)
                         map->ops->map_release_uref(map);
         }
@@ -322,7 +322,7 @@ static void bpf_map_put_uref(struct bpf_map *map)
   */
  static void __bpf_map_put(struct bpf_map *map, bool do_idr_lock)
  {
-       if (atomic_dec_and_test(&map->refcnt)) {
+       if (atomic64_dec_and_test(&map->refcnt)) {
                 /* bpf_map_free_id() must be called first */
                 bpf_map_free_id(map, do_idr_lock);
                 btf_put(map->btf);
@@ -575,8 +575,8 @@ static int map_create(union bpf_attr *attr)
         if (err)
                 goto free_map;
  
-       atomic_set(&map->refcnt, 1);
-       atomic_set(&map->usercnt, 1);
+       atomic64_set(&map->refcnt, 1);
+       atomic64_set(&map->usercnt, 1);
  
         if (attr->btf_key_type_id || attr->btf_value_type_id) {
                 struct btf *btf;
@@ -653,21 +653,19 @@ struct bpf_map *__bpf_map_get(struct fd f)
         return f.file->private_data;
  }
  
-/* prog's and map's refcnt limit */
-#define BPF_MAX_REFCNT 32768
-
-struct bpf_map *bpf_map_inc(struct bpf_map *map, bool uref)
+void bpf_map_inc(struct bpf_map *map)
  {
-       if (atomic_inc_return(&map->refcnt) > BPF_MAX_REFCNT) {
-               atomic_dec(&map->refcnt);
-               return ERR_PTR(-EBUSY);
-       }
-       if (uref)
-               atomic_inc(&map->usercnt);
-       return map;
+       atomic64_inc(&map->refcnt);
  }
  EXPORT_SYMBOL_GPL(bpf_map_inc);
  
+void bpf_map_inc_with_uref(struct bpf_map *map)
+{
+       atomic64_inc(&map->refcnt);
+       atomic64_inc(&map->usercnt);
+}
+EXPORT_SYMBOL_GPL(bpf_map_inc_with_uref);
+
  struct bpf_map *bpf_map_get_with_uref(u32 ufd)
  {
         struct fd f = fdget(ufd);
@@ -677,38 +675,30 @@ struct bpf_map *bpf_map_get_with_uref(u32 ufd)
         if (IS_ERR(map))
                 return map;
  
-       map = bpf_map_inc(map, true);
+       bpf_map_inc_with_uref(map);
         fdput(f);
  
         return map;
  }
  
  /* map_idr_lock should have been held */
-static struct bpf_map *__bpf_map_inc_not_zero(struct bpf_map *map,
-                                             bool uref)
+static struct bpf_map *__bpf_map_inc_not_zero(struct bpf_map *map, bool uref)
  {
         int refold;
  
-       refold = atomic_fetch_add_unless(&map->refcnt, 1, 0);
-
-       if (refold >= BPF_MAX_REFCNT) {
-               __bpf_map_put(map, false);
-               return ERR_PTR(-EBUSY);
-       }
-
+       refold = atomic64_fetch_add_unless(&map->refcnt, 1, 0);
         if (!refold)
                 return ERR_PTR(-ENOENT);
-
         if (uref)
-               atomic_inc(&map->usercnt);
+               atomic64_inc(&map->usercnt);
  
         return map;
  }
  
-struct bpf_map *bpf_map_inc_not_zero(struct bpf_map *map, bool uref)
+struct bpf_map *bpf_map_inc_not_zero(struct bpf_map *map)
  {
         spin_lock_bh(&map_idr_lock);
-       map = __bpf_map_inc_not_zero(map, uref);
+       map = __bpf_map_inc_not_zero(map, false);
         spin_unlock_bh(&map_idr_lock);
  
         return map;
@@ -1455,6 +1445,9 @@ static struct bpf_prog *____bpf_prog_get(struct fd f)
         return f.file->private_data;
  }
  
+/* prog's refcnt limit */
+#define BPF_MAX_REFCNT 32768
+
  struct bpf_prog *bpf_prog_add(struct bpf_prog *prog, int i)
  {
         if (atomic_add_return(i, &prog->aux->refcnt) > BPF_MAX_REFCNT) {
diff --git a/kernel/bpf/verifier.c b/kernel/bpf/verifier.c

index e9dc95a..9f59f7a 100644 (file)
--- a/kernel/bpf/verifier.c
+++ b/kernel/bpf/verifier.c
@@ -8179,11 +8179,7 @@ static int replace_map_fd_with_map_ptr(struct bpf_verifier_env *env)
                          * will be used by the valid program until it's unloaded
                          * and all maps are released in free_used_maps()
                          */
-                       map = bpf_map_inc(map, false);
-                       if (IS_ERR(map)) {
-                               fdput(f);
-                               return PTR_ERR(map);
-                       }
+                       bpf_map_inc(map);
  
                         aux->map_index = env->used_map_cnt;
                         env->used_maps[env->used_map_cnt++] = map;
diff --git a/kernel/bpf/xskmap.c b/kernel/bpf/xskmap.c

index da16c30..90c4fce 100644 (file)
--- a/kernel/bpf/xskmap.c
+++ b/kernel/bpf/xskmap.c
@@ -11,10 +11,8 @@
  
  int xsk_map_inc(struct xsk_map *map)
  {
-       struct bpf_map *m = &map->map;
-
-       m = bpf_map_inc(m, false);
-       return PTR_ERR_OR_ZERO(m);
+       bpf_map_inc(&map->map);
+       return 0;
  }
  
  void xsk_map_put(struct xsk_map *map)
diff --git a/net/core/bpf_sk_storage.c b/net/core/bpf_sk_storage.c

index da5639a..458be6b 100644 (file)
--- a/net/core/bpf_sk_storage.c
+++ b/net/core/bpf_sk_storage.c
@@ -798,7 +798,7 @@ int bpf_sk_storage_clone(const struct sock *sk, struct sock *newsk)
                  * Try to grab map refcnt to make sure that it's still
                  * alive and prevent concurrent removal.
                  */
-               map = bpf_map_inc_not_zero(&smap->map, false);
+               map = bpf_map_inc_not_zero(&smap->map);
                 if (IS_ERR(map))
                         continue;
author	Andrii Nakryiko <andriin@fb.com>
	Sun, 17 Nov 2019 17:28:02 +0000 (09:28 -0800)
committer	Daniel Borkmann <daniel@iogearbox.net>
	Mon, 18 Nov 2019 10:41:59 +0000 (11:41 +0100)
drivers/net/ethernet/netronome/nfp/bpf/offload.c		patch | blob | history
include/linux/bpf.h		patch | blob | history
kernel/bpf/inode.c		patch | blob | history
kernel/bpf/map_in_map.c		patch | blob | history
kernel/bpf/syscall.c		patch | blob | history
kernel/bpf/verifier.c		patch | blob | history
kernel/bpf/xskmap.c		patch | blob | history
net/core/bpf_sk_storage.c		patch | blob | history