net: Generate reuseport group ID on group creation

author Jakub Sitnicki <jakub@cloudflare.com>

Tue, 18 Feb 2020 17:10:21 +0000 (17:10 +0000)

committer Daniel Borkmann <daniel@iogearbox.net>

Fri, 21 Feb 2020 21:29:45 +0000 (22:29 +0100)
author Jakub Sitnicki <jakub@cloudflare.com>
Tue, 18 Feb 2020 17:10:21 +0000 (17:10 +0000)
committer Daniel Borkmann <daniel@iogearbox.net>
Fri, 21 Feb 2020 21:29:45 +0000 (22:29 +0100)
diff --git a/include/net/sock_reuseport.h b/include/net/sock_reuseport.h

index 43f4a81..3ecaa15 100644 (file)
--- a/include/net/sock_reuseport.h
+++ b/include/net/sock_reuseport.h
@@ -55,6 +55,4 @@ static inline bool reuseport_has_conns(struct sock *sk, bool set)
         return ret;
  }
  
-int reuseport_get_id(struct sock_reuseport *reuse);
-
  #endif  /* _SOCK_REUSEPORT_H */
diff --git a/kernel/bpf/reuseport_array.c b/kernel/bpf/reuseport_array.c

index 50c083b..01badd3 100644 (file)
--- a/kernel/bpf/reuseport_array.c
+++ b/kernel/bpf/reuseport_array.c
@@ -305,11 +305,6 @@ int bpf_fd_reuseport_array_update_elem(struct bpf_map *map, void *key,
         if (err)
                 goto put_file_unlock;
  
-       /* Ensure reuse->reuseport_id is set */
-       err = reuseport_get_id(reuse);
-       if (err < 0)
-               goto put_file_unlock;
-
         WRITE_ONCE(nsk->sk_user_data, &array->ptrs[index]);
         rcu_assign_pointer(array->ptrs[index], nsk);
         free_osk = osk;
diff --git a/net/core/filter.c b/net/core/filter.c

index 77d2f47..925b23d 100644 (file)
--- a/net/core/filter.c
+++ b/net/core/filter.c
@@ -8641,18 +8641,8 @@ BPF_CALL_4(sk_select_reuseport, struct sk_reuseport_kern *, reuse_kern,
         }
  
         if (unlikely(reuse->reuseport_id != reuse_kern->reuseport_id)) {
-               struct sock *sk;
-
-               if (unlikely(!reuse_kern->reuseport_id))
-                       /* There is a small race between adding the
-                        * sk to the map and setting the
-                        * reuse_kern->reuseport_id.
-                        * Treat it as the sk has not been added to
-                        * the bpf map yet.
-                        */
-                       return -ENOENT;
+               struct sock *sk = reuse_kern->sk;
  
-               sk = reuse_kern->sk;
                 if (sk->sk_protocol != selected_sk->sk_protocol)
                         return -EPROTOTYPE;
                 else if (sk->sk_family != selected_sk->sk_family)
diff --git a/net/core/sock_reuseport.c b/net/core/sock_reuseport.c

index 91e9f22..adcb3ae 100644 (file)
--- a/net/core/sock_reuseport.c
+++ b/net/core/sock_reuseport.c
@@ -16,27 +16,8 @@
  
  DEFINE_SPINLOCK(reuseport_lock);
  
-#define REUSEPORT_MIN_ID 1
  static DEFINE_IDA(reuseport_ida);
  
-int reuseport_get_id(struct sock_reuseport *reuse)
-{
-       int id;
-
-       if (reuse->reuseport_id)
-               return reuse->reuseport_id;
-
-       id = ida_simple_get(&reuseport_ida, REUSEPORT_MIN_ID, 0,
-                           /* Called under reuseport_lock */
-                           GFP_ATOMIC);
-       if (id < 0)
-               return id;
-
-       reuse->reuseport_id = id;
-
-       return reuse->reuseport_id;
-}
-
  static struct sock_reuseport *__reuseport_alloc(unsigned int max_socks)
  {
         unsigned int size = sizeof(struct sock_reuseport) +
@@ -55,6 +36,7 @@ static struct sock_reuseport *__reuseport_alloc(unsigned int max_socks)
  int reuseport_alloc(struct sock *sk, bool bind_inany)
  {
         struct sock_reuseport *reuse;
+       int id, ret = 0;
  
         /* bh lock used since this function call may precede hlist lock in
          * soft irq of receive path or setsockopt from process context
@@ -78,10 +60,18 @@ int reuseport_alloc(struct sock *sk, bool bind_inany)
  
         reuse = __reuseport_alloc(INIT_SOCKS);
         if (!reuse) {
-               spin_unlock_bh(&reuseport_lock);
-               return -ENOMEM;
+               ret = -ENOMEM;
+               goto out;
         }
  
+       id = ida_alloc(&reuseport_ida, GFP_ATOMIC);
+       if (id < 0) {
+               kfree(reuse);
+               ret = id;
+               goto out;
+       }
+
+       reuse->reuseport_id = id;
         reuse->socks[0] = sk;
         reuse->num_socks = 1;
         reuse->bind_inany = bind_inany;
@@ -90,7 +80,7 @@ int reuseport_alloc(struct sock *sk, bool bind_inany)
  out:
         spin_unlock_bh(&reuseport_lock);
  
-       return 0;
+       return ret;
  }
  EXPORT_SYMBOL(reuseport_alloc);
  
@@ -134,8 +124,7 @@ static void reuseport_free_rcu(struct rcu_head *head)
  
         reuse = container_of(head, struct sock_reuseport, rcu);
         sk_reuseport_prog_free(rcu_dereference_protected(reuse->prog, 1));
-       if (reuse->reuseport_id)
-               ida_simple_remove(&reuseport_ida, reuse->reuseport_id);
+       ida_free(&reuseport_ida, reuse->reuseport_id);
         kfree(reuse);
  }
  
@@ -199,12 +188,15 @@ void reuseport_detach_sock(struct sock *sk)
         reuse = rcu_dereference_protected(sk->sk_reuseport_cb,
                                           lockdep_is_held(&reuseport_lock));
  
-       /* At least one of the sk in this reuseport group is added to
-        * a bpf map.  Notify the bpf side.  The bpf map logic will
-        * remove the sk if it is indeed added to a bpf map.
+       /* Notify the bpf side. The sk may be added to a sockarray
+        * map. If so, sockarray logic will remove it from the map.
+        *
+        * Other bpf map types that work with reuseport, like sockmap,
+        * don't need an explicit callback from here. They override sk
+        * unhash/close ops to remove the sk from the map before we
+        * get to this point.
          */
-       if (reuse->reuseport_id)
-               bpf_sk_reuseport_detach(sk);
+       bpf_sk_reuseport_detach(sk);
  
         rcu_assign_pointer(sk->sk_reuseport_cb, NULL);
author	Jakub Sitnicki <jakub@cloudflare.com>
	Tue, 18 Feb 2020 17:10:21 +0000 (17:10 +0000)
committer	Daniel Borkmann <daniel@iogearbox.net>
	Fri, 21 Feb 2020 21:29:45 +0000 (22:29 +0100)
include/net/sock_reuseport.h		patch | blob | history
kernel/bpf/reuseport_array.c		patch | blob | history
net/core/filter.c		patch | blob | history
net/core/sock_reuseport.c		patch | blob | history