freezer,sched: Rewrite core freezer logic

author Peter Zijlstra <peterz@infradead.org>

Mon, 22 Aug 2022 11:18:22 +0000 (13:18 +0200)

committer Peter Zijlstra <peterz@infradead.org>

Wed, 7 Sep 2022 19:53:50 +0000 (21:53 +0200)
author Peter Zijlstra <peterz@infradead.org>
Mon, 22 Aug 2022 11:18:22 +0000 (13:18 +0200)
committer Peter Zijlstra <peterz@infradead.org>
Wed, 7 Sep 2022 19:53:50 +0000 (21:53 +0200)
diff --git a/drivers/android/binder.c b/drivers/android/binder.c

index c964d7c8c3841386225d317ca34a8118c7a8a880..50197ef4b787a6f8768a13ec1246a1cdde065d95 100644 (file)
--- a/drivers/android/binder.c
+++ b/drivers/android/binder.c
@@ -4247,10 +4247,9 @@ static int binder_wait_for_work(struct binder_thread *thread,
         struct binder_proc *proc = thread->proc;
         int ret = 0;
  
-       freezer_do_not_count();
         binder_inner_proc_lock(proc);
         for (;;) {
-               prepare_to_wait(&thread->wait, &wait, TASK_INTERRUPTIBLE);
+               prepare_to_wait(&thread->wait, &wait, TASK_INTERRUPTIBLE|TASK_FREEZABLE);
                 if (binder_has_work_ilocked(thread, do_proc_work))
                         break;
                 if (do_proc_work)
@@ -4267,7 +4266,6 @@ static int binder_wait_for_work(struct binder_thread *thread,
         }
         finish_wait(&thread->wait, &wait);
         binder_inner_proc_unlock(proc);
-       freezer_count();
  
         return ret;
  }
diff --git a/drivers/media/pci/pt3/pt3.c b/drivers/media/pci/pt3/pt3.c

index 0d51bdf01f4327d81183f9e8445a689364e9047c..f6deac85962e4add5b4a3990314dc6ef3e2b59d9 100644 (file)
--- a/drivers/media/pci/pt3/pt3.c
+++ b/drivers/media/pci/pt3/pt3.c
@@ -445,8 +445,8 @@ static int pt3_fetch_thread(void *data)
                 pt3_proc_dma(adap);
  
                 delay = ktime_set(0, PT3_FETCH_DELAY * NSEC_PER_MSEC);
-               set_current_state(TASK_UNINTERRUPTIBLE);
-               freezable_schedule_hrtimeout_range(&delay,
+               set_current_state(TASK_UNINTERRUPTIBLE|TASK_FREEZABLE);
+               schedule_hrtimeout_range(&delay,
                                         PT3_FETCH_DELAY_DELTA * NSEC_PER_MSEC,
                                         HRTIMER_MODE_REL);
         }
diff --git a/fs/cifs/inode.c b/fs/cifs/inode.c

index eeeaba3dec0536b0fa79199333fc380181dd4bff..54e6bfc6a5a6423317bebd42a86d15a0df1d3364 100644 (file)
--- a/fs/cifs/inode.c
+++ b/fs/cifs/inode.c
@@ -2326,7 +2326,7 @@ cifs_invalidate_mapping(struct inode *inode)
  static int
  cifs_wait_bit_killable(struct wait_bit_key *key, int mode)
  {
-       freezable_schedule_unsafe();
+       schedule();
         if (signal_pending_state(mode, current))
                 return -ERESTARTSYS;
         return 0;
@@ -2344,7 +2344,7 @@ cifs_revalidate_mapping(struct inode *inode)
                 return 0;
  
         rc = wait_on_bit_lock_action(flags, CIFS_INO_LOCK, cifs_wait_bit_killable,
-                                    TASK_KILLABLE);
+                                    TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
         if (rc)
                 return rc;
  
diff --git a/fs/cifs/transport.c b/fs/cifs/transport.c

index de7aeced7e16bbe952dd3f9aeb16385bcf40de8d..eda09fba1550afb63bfd11f7669dc811b5d30679 100644 (file)
--- a/fs/cifs/transport.c
+++ b/fs/cifs/transport.c
@@ -757,8 +757,9 @@ wait_for_response(struct TCP_Server_Info *server, struct mid_q_entry *midQ)
  {
         int error;
  
-       error = wait_event_freezekillable_unsafe(server->response_q,
-                                   midQ->mid_state != MID_REQUEST_SUBMITTED);
+       error = wait_event_state(server->response_q,
+                                midQ->mid_state != MID_REQUEST_SUBMITTED,
+                                (TASK_KILLABLE|TASK_FREEZABLE_UNSAFE));
         if (error < 0)
                 return -ERESTARTSYS;
  
diff --git a/fs/coredump.c b/fs/coredump.c

index 3d9054c49a119360bcea5e3562bee4d0ed054fcb..9ce59f212a4a0975a51f51efd32ea26187ddb400 100644 (file)
--- a/fs/coredump.c
+++ b/fs/coredump.c
@@ -402,9 +402,8 @@ static int coredump_wait(int exit_code, struct core_state *core_state)
         if (core_waiters > 0) {
                 struct core_thread *ptr;
  
-               freezer_do_not_count();
-               wait_for_completion(&core_state->startup);
-               freezer_count();
+               wait_for_completion_state(&core_state->startup,
+                                         TASK_UNINTERRUPTIBLE|TASK_FREEZABLE);
                 /*
                  * Wait for all the threads to become inactive, so that
                  * all the thread context (extended register state, like
diff --git a/fs/nfs/file.c b/fs/nfs/file.c

index d2bcd4834c0e6857713aae58c3910d800594dd64..e8301a3727380dbf49ae321696eb989068e3ade2 100644 (file)
--- a/fs/nfs/file.c
+++ b/fs/nfs/file.c
@@ -570,7 +570,8 @@ static vm_fault_t nfs_vm_page_mkwrite(struct vm_fault *vmf)
         }
  
         wait_on_bit_action(&NFS_I(inode)->flags, NFS_INO_INVALIDATING,
-                       nfs_wait_bit_killable, TASK_KILLABLE);
+                          nfs_wait_bit_killable,
+                          TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
  
         lock_page(page);
         mapping = page_file_mapping(page);
diff --git a/fs/nfs/inode.c b/fs/nfs/inode.c

index b4e46b0ffa2dc04d268827312286af190fef1ab3..a6058f5787a5962df5c94c3b30ab45f9328883e8 100644 (file)
--- a/fs/nfs/inode.c
+++ b/fs/nfs/inode.c
@@ -72,18 +72,13 @@ nfs_fattr_to_ino_t(struct nfs_fattr *fattr)
         return nfs_fileid_to_ino_t(fattr->fileid);
  }
  
-static int nfs_wait_killable(int mode)
+int nfs_wait_bit_killable(struct wait_bit_key *key, int mode)
  {
-       freezable_schedule_unsafe();
+       schedule();
         if (signal_pending_state(mode, current))
                 return -ERESTARTSYS;
         return 0;
  }
-
-int nfs_wait_bit_killable(struct wait_bit_key *key, int mode)
-{
-       return nfs_wait_killable(mode);
-}
  EXPORT_SYMBOL_GPL(nfs_wait_bit_killable);
  
  /**
@@ -1331,7 +1326,8 @@ int nfs_clear_invalid_mapping(struct address_space *mapping)
          */
         for (;;) {
                 ret = wait_on_bit_action(bitlock, NFS_INO_INVALIDATING,
-                                        nfs_wait_bit_killable, TASK_KILLABLE);
+                                        nfs_wait_bit_killable,
+                                        TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
                 if (ret)
                         goto out;
                 spin_lock(&inode->i_lock);
diff --git a/fs/nfs/nfs3proc.c b/fs/nfs/nfs3proc.c

index 1597eef40d54f6f7005d9326e154323b7f104fd3..2e7579626cf01dfa66ce8b980357b9b59e0c0db6 100644 (file)
--- a/fs/nfs/nfs3proc.c
+++ b/fs/nfs/nfs3proc.c
@@ -36,7 +36,8 @@ nfs3_rpc_wrapper(struct rpc_clnt *clnt, struct rpc_message *msg, int flags)
                 res = rpc_call_sync(clnt, msg, flags);
                 if (res != -EJUKEBOX)
                         break;
-               freezable_schedule_timeout_killable_unsafe(NFS_JUKEBOX_RETRY_TIME);
+               __set_current_state(TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
+               schedule_timeout(NFS_JUKEBOX_RETRY_TIME);
                 res = -ERESTARTSYS;
         } while (!fatal_signal_pending(current));
         return res;
diff --git a/fs/nfs/nfs4proc.c b/fs/nfs/nfs4proc.c

index 3ed14a2a84a4450ab8d4f75fe5b05e204c6bc19f..4553803538e5f91618eb85405926ba0662de5f98 100644 (file)
--- a/fs/nfs/nfs4proc.c
+++ b/fs/nfs/nfs4proc.c
@@ -416,8 +416,8 @@ static int nfs4_delay_killable(long *timeout)
  {
         might_sleep();
  
-       freezable_schedule_timeout_killable_unsafe(
-               nfs4_update_delay(timeout));
+       __set_current_state(TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
+       schedule_timeout(nfs4_update_delay(timeout));
         if (!__fatal_signal_pending(current))
                 return 0;
         return -EINTR;
@@ -427,7 +427,8 @@ static int nfs4_delay_interruptible(long *timeout)
  {
         might_sleep();
  
-       freezable_schedule_timeout_interruptible_unsafe(nfs4_update_delay(timeout));
+       __set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE_UNSAFE);
+       schedule_timeout(nfs4_update_delay(timeout));
         if (!signal_pending(current))
                 return 0;
         return __fatal_signal_pending(current) ? -EINTR :-ERESTARTSYS;
@@ -7406,7 +7407,8 @@ nfs4_retry_setlk_simple(struct nfs4_state *state, int cmd,
                 status = nfs4_proc_setlk(state, cmd, request);
                 if ((status != -EAGAIN) || IS_SETLK(cmd))
                         break;
-               freezable_schedule_timeout_interruptible(timeout);
+               __set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
+               schedule_timeout(timeout);
                 timeout *= 2;
                 timeout = min_t(unsigned long, NFS4_LOCK_MAXTIMEOUT, timeout);
                 status = -ERESTARTSYS;
@@ -7474,10 +7476,8 @@ nfs4_retry_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
                         break;
  
                 status = -ERESTARTSYS;
-               freezer_do_not_count();
-               wait_woken(&waiter.wait, TASK_INTERRUPTIBLE,
+               wait_woken(&waiter.wait, TASK_INTERRUPTIBLE|TASK_FREEZABLE,
                            NFS4_LOCK_MAXTIMEOUT);
-               freezer_count();
         } while (!signalled());
  
         remove_wait_queue(q, &waiter.wait);
diff --git a/fs/nfs/nfs4state.c b/fs/nfs/nfs4state.c

index 9bab3e9c702a47153703c7f7ae62176fed75fe6f..7e185f7eb2608c818be6e2ae91bdac426b25d868 100644 (file)
--- a/fs/nfs/nfs4state.c
+++ b/fs/nfs/nfs4state.c
@@ -1314,7 +1314,8 @@ int nfs4_wait_clnt_recover(struct nfs_client *clp)
  
         refcount_inc(&clp->cl_count);
         res = wait_on_bit_action(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING,
-                                nfs_wait_bit_killable, TASK_KILLABLE);
+                                nfs_wait_bit_killable,
+                                TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
         if (res)
                 goto out;
         if (clp->cl_cons_state < 0)
diff --git a/fs/nfs/pnfs.c b/fs/nfs/pnfs.c

index 41a9b6b58fb9fa15c9f162fa8dfa267a1c16e049..70706db317f380821d77fd49eb78a3d0010c90dd 100644 (file)
--- a/fs/nfs/pnfs.c
+++ b/fs/nfs/pnfs.c
@@ -1908,7 +1908,7 @@ static int pnfs_prepare_to_retry_layoutget(struct pnfs_layout_hdr *lo)
         pnfs_layoutcommit_inode(lo->plh_inode, false);
         return wait_on_bit_action(&lo->plh_flags, NFS_LAYOUT_RETURN,
                                    nfs_wait_bit_killable,
-                                  TASK_KILLABLE);
+                                  TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
  }
  
  static void nfs_layoutget_begin(struct pnfs_layout_hdr *lo)
@@ -3193,7 +3193,7 @@ pnfs_layoutcommit_inode(struct inode *inode, bool sync)
                 status = wait_on_bit_lock_action(&nfsi->flags,
                                 NFS_INO_LAYOUTCOMMITTING,
                                 nfs_wait_bit_killable,
-                               TASK_KILLABLE);
+                               TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
                 if (status)
                         goto out;
         }
diff --git a/fs/xfs/xfs_trans_ail.c b/fs/xfs/xfs_trans_ail.c

index d3a97a028560651828a5e73b75f8d3585a5a96eb..16fbf2a1144c17603921cea2af838e2b1c9bdf5b 100644 (file)
--- a/fs/xfs/xfs_trans_ail.c
+++ b/fs/xfs/xfs_trans_ail.c
@@ -602,9 +602,9 @@ xfsaild(
  
         while (1) {
                 if (tout && tout <= 20)
-                       set_current_state(TASK_KILLABLE);
+                       set_current_state(TASK_KILLABLE|TASK_FREEZABLE);
                 else
-                       set_current_state(TASK_INTERRUPTIBLE);
+                       set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
  
                 /*
                  * Check kthread_should_stop() after we set the task state to
@@ -653,14 +653,14 @@ xfsaild(
                     ailp->ail_target == ailp->ail_target_prev &&
                     list_empty(&ailp->ail_buf_list)) {
                         spin_unlock(&ailp->ail_lock);
-                       freezable_schedule();
+                       schedule();
                         tout = 0;
                         continue;
                 }
                 spin_unlock(&ailp->ail_lock);
  
                 if (tout)
-                       freezable_schedule_timeout(msecs_to_jiffies(tout));
+                       schedule_timeout(msecs_to_jiffies(tout));
  
                 __set_current_state(TASK_RUNNING);
  
diff --git a/include/linux/freezer.h b/include/linux/freezer.h

index 0621c5f86c397e62d549051c19d97b4dff626748..b303472255be4e0886584863e1a462345fcc9fec 100644 (file)
--- a/include/linux/freezer.h
+++ b/include/linux/freezer.h
@@ -8,9 +8,11 @@
  #include <linux/sched.h>
  #include <linux/wait.h>
  #include <linux/atomic.h>
+#include <linux/jump_label.h>
  
  #ifdef CONFIG_FREEZER
-extern atomic_t system_freezing_cnt;   /* nr of freezing conds in effect */
+DECLARE_STATIC_KEY_FALSE(freezer_active);
+
  extern bool pm_freezing;               /* PM freezing in effect */
  extern bool pm_nosig_freezing;         /* PM nosig freezing in effect */
  
@@ -22,10 +24,7 @@ extern unsigned int freeze_timeout_msecs;
  /*
   * Check if a process has been frozen
   */
-static inline bool frozen(struct task_struct *p)
-{
-       return p->flags & PF_FROZEN;
-}
+extern bool frozen(struct task_struct *p);
  
  extern bool freezing_slow_path(struct task_struct *p);
  
@@ -34,9 +33,10 @@ extern bool freezing_slow_path(struct task_struct *p);
   */
  static inline bool freezing(struct task_struct *p)
  {
-       if (likely(!atomic_read(&system_freezing_cnt)))
-               return false;
-       return freezing_slow_path(p);
+       if (static_branch_unlikely(&freezer_active))
+               return freezing_slow_path(p);
+
+       return false;
  }
  
  /* Takes and releases task alloc lock using task_lock() */
@@ -48,23 +48,14 @@ extern int freeze_kernel_threads(void);
  extern void thaw_processes(void);
  extern void thaw_kernel_threads(void);
  
-/*
- * DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION
- * If try_to_freeze causes a lockdep warning it means the caller may deadlock
- */
-static inline bool try_to_freeze_unsafe(void)
+static inline bool try_to_freeze(void)
  {
         might_sleep();
         if (likely(!freezing(current)))
                 return false;
-       return __refrigerator(false);
-}
-
-static inline bool try_to_freeze(void)
-{
         if (!(current->flags & PF_NOFREEZE))
                 debug_check_no_locks_held();
-       return try_to_freeze_unsafe();
+       return __refrigerator(false);
  }
  
  extern bool freeze_task(struct task_struct *p);
@@ -79,195 +70,6 @@ static inline bool cgroup_freezing(struct task_struct *task)
  }
  #endif /* !CONFIG_CGROUP_FREEZER */
  
-/*
- * The PF_FREEZER_SKIP flag should be set by a vfork parent right before it
- * calls wait_for_completion(&vfork) and reset right after it returns from this
- * function.  Next, the parent should call try_to_freeze() to freeze itself
- * appropriately in case the child has exited before the freezing of tasks is
- * complete.  However, we don't want kernel threads to be frozen in unexpected
- * places, so we allow them to block freeze_processes() instead or to set
- * PF_NOFREEZE if needed. Fortunately, in the ____call_usermodehelper() case the
- * parent won't really block freeze_processes(), since ____call_usermodehelper()
- * (the child) does a little before exec/exit and it can't be frozen before
- * waking up the parent.
- */
-
-
-/**
- * freezer_do_not_count - tell freezer to ignore %current
- *
- * Tell freezers to ignore the current task when determining whether the
- * target frozen state is reached.  IOW, the current task will be
- * considered frozen enough by freezers.
- *
- * The caller shouldn't do anything which isn't allowed for a frozen task
- * until freezer_cont() is called.  Usually, freezer[_do_not]_count() pair
- * wrap a scheduling operation and nothing much else.
- */
-static inline void freezer_do_not_count(void)
-{
-       current->flags |= PF_FREEZER_SKIP;
-}
-
-/**
- * freezer_count - tell freezer to stop ignoring %current
- *
- * Undo freezer_do_not_count().  It tells freezers that %current should be
- * considered again and tries to freeze if freezing condition is already in
- * effect.
- */
-static inline void freezer_count(void)
-{
-       current->flags &= ~PF_FREEZER_SKIP;
-       /*
-        * If freezing is in progress, the following paired with smp_mb()
-        * in freezer_should_skip() ensures that either we see %true
-        * freezing() or freezer_should_skip() sees !PF_FREEZER_SKIP.
-        */
-       smp_mb();
-       try_to_freeze();
-}
-
-/* DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION */
-static inline void freezer_count_unsafe(void)
-{
-       current->flags &= ~PF_FREEZER_SKIP;
-       smp_mb();
-       try_to_freeze_unsafe();
-}
-
-/**
- * freezer_should_skip - whether to skip a task when determining frozen
- *                      state is reached
- * @p: task in quesion
- *
- * This function is used by freezers after establishing %true freezing() to
- * test whether a task should be skipped when determining the target frozen
- * state is reached.  IOW, if this function returns %true, @p is considered
- * frozen enough.
- */
-static inline bool freezer_should_skip(struct task_struct *p)
-{
-       /*
-        * The following smp_mb() paired with the one in freezer_count()
-        * ensures that either freezer_count() sees %true freezing() or we
-        * see cleared %PF_FREEZER_SKIP and return %false.  This makes it
-        * impossible for a task to slip frozen state testing after
-        * clearing %PF_FREEZER_SKIP.
-        */
-       smp_mb();
-       return p->flags & PF_FREEZER_SKIP;
-}
-
-/*
- * These functions are intended to be used whenever you want allow a sleeping
- * task to be frozen. Note that neither return any clear indication of
- * whether a freeze event happened while in this function.
- */
-
-/* Like schedule(), but should not block the freezer. */
-static inline void freezable_schedule(void)
-{
-       freezer_do_not_count();
-       schedule();
-       freezer_count();
-}
-
-/* DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION */
-static inline void freezable_schedule_unsafe(void)
-{
-       freezer_do_not_count();
-       schedule();
-       freezer_count_unsafe();
-}
-
-/*
- * Like schedule_timeout(), but should not block the freezer.  Do not
- * call this with locks held.
- */
-static inline long freezable_schedule_timeout(long timeout)
-{
-       long __retval;
-       freezer_do_not_count();
-       __retval = schedule_timeout(timeout);
-       freezer_count();
-       return __retval;
-}
-
-/*
- * Like schedule_timeout_interruptible(), but should not block the freezer.  Do not
- * call this with locks held.
- */
-static inline long freezable_schedule_timeout_interruptible(long timeout)
-{
-       long __retval;
-       freezer_do_not_count();
-       __retval = schedule_timeout_interruptible(timeout);
-       freezer_count();
-       return __retval;
-}
-
-/* DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION */
-static inline long freezable_schedule_timeout_interruptible_unsafe(long timeout)
-{
-       long __retval;
-
-       freezer_do_not_count();
-       __retval = schedule_timeout_interruptible(timeout);
-       freezer_count_unsafe();
-       return __retval;
-}
-
-/* Like schedule_timeout_killable(), but should not block the freezer. */
-static inline long freezable_schedule_timeout_killable(long timeout)
-{
-       long __retval;
-       freezer_do_not_count();
-       __retval = schedule_timeout_killable(timeout);
-       freezer_count();
-       return __retval;
-}
-
-/* DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION */
-static inline long freezable_schedule_timeout_killable_unsafe(long timeout)
-{
-       long __retval;
-       freezer_do_not_count();
-       __retval = schedule_timeout_killable(timeout);
-       freezer_count_unsafe();
-       return __retval;
-}
-
-/*
- * Like schedule_hrtimeout_range(), but should not block the freezer.  Do not
- * call this with locks held.
- */
-static inline int freezable_schedule_hrtimeout_range(ktime_t *expires,
-               u64 delta, const enum hrtimer_mode mode)
-{
-       int __retval;
-       freezer_do_not_count();
-       __retval = schedule_hrtimeout_range(expires, delta, mode);
-       freezer_count();
-       return __retval;
-}
-
-/*
- * Freezer-friendly wrappers around wait_event_interruptible(),
- * wait_event_killable() and wait_event_interruptible_timeout(), originally
- * defined in <linux/wait.h>
- */
-
-/* DO NOT ADD ANY NEW CALLERS OF THIS FUNCTION */
-#define wait_event_freezekillable_unsafe(wq, condition)                        \
-({                                                                     \
-       int __retval;                                                   \
-       freezer_do_not_count();                                         \
-       __retval = wait_event_killable(wq, (condition));                \
-       freezer_count_unsafe();                                         \
-       __retval;                                                       \
-})
-
  #else /* !CONFIG_FREEZER */
  static inline bool frozen(struct task_struct *p) { return false; }
  static inline bool freezing(struct task_struct *p) { return false; }
@@ -281,35 +83,8 @@ static inline void thaw_kernel_threads(void) {}
  
  static inline bool try_to_freeze(void) { return false; }
  
-static inline void freezer_do_not_count(void) {}
-static inline void freezer_count(void) {}
-static inline int freezer_should_skip(struct task_struct *p) { return 0; }
  static inline void set_freezable(void) {}
  
-#define freezable_schedule()  schedule()
-
-#define freezable_schedule_unsafe()  schedule()
-
-#define freezable_schedule_timeout(timeout)  schedule_timeout(timeout)
-
-#define freezable_schedule_timeout_interruptible(timeout)              \
-       schedule_timeout_interruptible(timeout)
-
-#define freezable_schedule_timeout_interruptible_unsafe(timeout)       \
-       schedule_timeout_interruptible(timeout)
-
-#define freezable_schedule_timeout_killable(timeout)                   \
-       schedule_timeout_killable(timeout)
-
-#define freezable_schedule_timeout_killable_unsafe(timeout)            \
-       schedule_timeout_killable(timeout)
-
-#define freezable_schedule_hrtimeout_range(expires, delta, mode)       \
-       schedule_hrtimeout_range(expires, delta, mode)
-
-#define wait_event_freezekillable_unsafe(wq, condition)                        \
-               wait_event_killable(wq, condition)
-
  #endif /* !CONFIG_FREEZER */
  
  #endif /* FREEZER_H_INCLUDED */
diff --git a/include/linux/sched.h b/include/linux/sched.h

index 9fc23a2d98132033e1844ed2f9425e3e14bc8a85..4c91efd6df821c0a411b29741a961ddfb30c324c 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -97,12 +97,19 @@ struct task_group;
  #define TASK_WAKING                    0x00000200
  #define TASK_NOLOAD                    0x00000400
  #define TASK_NEW                       0x00000800
-/* RT specific auxilliary flag to mark RT lock waiters */
  #define TASK_RTLOCK_WAIT               0x00001000
-#define TASK_STATE_MAX                 0x00002000
+#define TASK_FREEZABLE                 0x00002000
+#define __TASK_FREEZABLE_UNSAFE               (0x00004000 * IS_ENABLED(CONFIG_LOCKDEP))
+#define TASK_FROZEN                    0x00008000
+#define TASK_STATE_MAX                 0x00010000
  
  #define TASK_ANY                       (TASK_STATE_MAX-1)
  
+/*
+ * DO NOT ADD ANY NEW USERS !
+ */
+#define TASK_FREEZABLE_UNSAFE          (TASK_FREEZABLE | __TASK_FREEZABLE_UNSAFE)
+
  /* Convenience macros for the sake of set_current_state: */
  #define TASK_KILLABLE                  (TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
  #define TASK_STOPPED                   (TASK_WAKEKILL | __TASK_STOPPED)
@@ -1716,7 +1723,6 @@ extern struct pid *cad_pid;
  #define PF_NPROC_EXCEEDED      0x00001000      /* set_user() noticed that RLIMIT_NPROC was exceeded */
  #define PF_USED_MATH           0x00002000      /* If unset the fpu must be initialized before use */
  #define PF_NOFREEZE            0x00008000      /* This thread should not be frozen */
-#define PF_FROZEN              0x00010000      /* Frozen for system suspend */
  #define PF_KSWAPD              0x00020000      /* I am kswapd */
  #define PF_MEMALLOC_NOFS       0x00040000      /* All allocation requests will inherit GFP_NOFS */
  #define PF_MEMALLOC_NOIO       0x00080000      /* All allocation requests will inherit GFP_NOIO */
@@ -1727,7 +1733,6 @@ extern struct pid *cad_pid;
  #define PF_NO_SETAFFINITY      0x04000000      /* Userland is not allowed to meddle with cpus_mask */
  #define PF_MCE_EARLY           0x08000000      /* Early kill for mce process policy */
  #define PF_MEMALLOC_PIN                0x10000000      /* Allocation context constrained to zones which allow long term pinning. */
-#define PF_FREEZER_SKIP                0x40000000      /* Freezer should not count it as freezable */
  #define PF_SUSPEND_TASK                0x80000000      /* This thread called freeze_processes() and should not be frozen */
  
  /*
diff --git a/include/linux/sunrpc/sched.h b/include/linux/sunrpc/sched.h

index acc62647317c6a9346461963841f6f924258466f..baeca2f564dced06ce1fbdd4cffdabc5bacd2894 100644 (file)
--- a/include/linux/sunrpc/sched.h
+++ b/include/linux/sunrpc/sched.h
@@ -252,7 +252,7 @@ int         rpc_malloc(struct rpc_task *);
  void           rpc_free(struct rpc_task *);
  int            rpciod_up(void);
  void           rpciod_down(void);
-int            __rpc_wait_for_completion_task(struct rpc_task *task, wait_bit_action_f *);
+int            rpc_wait_for_completion_task(struct rpc_task *task);
  #if IS_ENABLED(CONFIG_SUNRPC_DEBUG)
  struct net;
  void           rpc_show_tasks(struct net *);
@@ -264,11 +264,6 @@ extern struct workqueue_struct *xprtiod_workqueue;
  void           rpc_prepare_task(struct rpc_task *task);
  gfp_t          rpc_task_gfp_mask(void);
  
-static inline int rpc_wait_for_completion_task(struct rpc_task *task)
-{
-       return __rpc_wait_for_completion_task(task, NULL);
-}
-
  #if IS_ENABLED(CONFIG_SUNRPC_DEBUG) || IS_ENABLED(CONFIG_TRACEPOINTS)
  static inline const char * rpc_qname(const struct rpc_wait_queue *q)
  {
diff --git a/include/linux/wait.h b/include/linux/wait.h

index b926eb9f3e266d98bba8da25ac4f3f1dca12b9c6..14ad8a0e9fac6f6f506535412fef61b1147b614d 100644 (file)
--- a/include/linux/wait.h
+++ b/include/linux/wait.h
@@ -361,8 +361,8 @@ do {                                                                                \
  } while (0)
  
  #define __wait_event_freezable(wq_head, condition)                             \
-       ___wait_event(wq_head, condition, TASK_INTERRUPTIBLE, 0, 0,             \
-                           freezable_schedule())
+       ___wait_event(wq_head, condition, (TASK_INTERRUPTIBLE|TASK_FREEZABLE),  \
+                       0, 0, schedule())
  
  /**
   * wait_event_freezable - sleep (or freeze) until a condition gets true
@@ -420,8 +420,8 @@ do {                                                                                \
  
  #define __wait_event_freezable_timeout(wq_head, condition, timeout)            \
         ___wait_event(wq_head, ___wait_cond_timeout(condition),                 \
-                     TASK_INTERRUPTIBLE, 0, timeout,                           \
-                     __ret = freezable_schedule_timeout(__ret))
+                     (TASK_INTERRUPTIBLE|TASK_FREEZABLE), 0, timeout,          \
+                     __ret = schedule_timeout(__ret))
  
  /*
   * like wait_event_timeout() -- except it uses TASK_INTERRUPTIBLE to avoid
@@ -642,8 +642,8 @@ do {                                                                                \
  
  
  #define __wait_event_freezable_exclusive(wq, condition)                                \
-       ___wait_event(wq, condition, TASK_INTERRUPTIBLE, 1, 0,                  \
-                       freezable_schedule())
+       ___wait_event(wq, condition, (TASK_INTERRUPTIBLE|TASK_FREEZABLE), 1, 0,\
+                       schedule())
  
  #define wait_event_freezable_exclusive(wq, condition)                          \
  ({                                                                             \
diff --git a/kernel/cgroup/legacy_freezer.c b/kernel/cgroup/legacy_freezer.c

index 08236798d17315622d73540d62a89dcbafdc5c77..1b6b21851e9d47daa3456123d604ab4d5e0f3b9c 100644 (file)
--- a/kernel/cgroup/legacy_freezer.c
+++ b/kernel/cgroup/legacy_freezer.c
@@ -113,7 +113,7 @@ static int freezer_css_online(struct cgroup_subsys_state *css)
  
         if (parent && (parent->state & CGROUP_FREEZING)) {
                 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
-               atomic_inc(&system_freezing_cnt);
+               static_branch_inc(&freezer_active);
         }
  
         mutex_unlock(&freezer_mutex);
@@ -134,7 +134,7 @@ static void freezer_css_offline(struct cgroup_subsys_state *css)
         mutex_lock(&freezer_mutex);
  
         if (freezer->state & CGROUP_FREEZING)
-               atomic_dec(&system_freezing_cnt);
+               static_branch_dec(&freezer_active);
  
         freezer->state = 0;
  
@@ -179,6 +179,7 @@ static void freezer_attach(struct cgroup_taskset *tset)
                         __thaw_task(task);
                 } else {
                         freeze_task(task);
+
                         /* clear FROZEN and propagate upwards */
                         while (freezer && (freezer->state & CGROUP_FROZEN)) {
                                 freezer->state &= ~CGROUP_FROZEN;
@@ -271,16 +272,8 @@ static void update_if_frozen(struct cgroup_subsys_state *css)
         css_task_iter_start(css, 0, &it);
  
         while ((task = css_task_iter_next(&it))) {
-               if (freezing(task)) {
-                       /*
-                        * freezer_should_skip() indicates that the task
-                        * should be skipped when determining freezing
-                        * completion.  Consider it frozen in addition to
-                        * the usual frozen condition.
-                        */
-                       if (!frozen(task) && !freezer_should_skip(task))
-                               goto out_iter_end;
-               }
+               if (freezing(task) && !frozen(task))
+                       goto out_iter_end;
         }
  
         freezer->state |= CGROUP_FROZEN;
@@ -357,7 +350,7 @@ static void freezer_apply_state(struct freezer *freezer, bool freeze,
  
         if (freeze) {
                 if (!(freezer->state & CGROUP_FREEZING))
-                       atomic_inc(&system_freezing_cnt);
+                       static_branch_inc(&freezer_active);
                 freezer->state |= state;
                 freeze_cgroup(freezer);
         } else {
@@ -366,9 +359,9 @@ static void freezer_apply_state(struct freezer *freezer, bool freeze,
                 freezer->state &= ~state;
  
                 if (!(freezer->state & CGROUP_FREEZING)) {
-                       if (was_freezing)
-                               atomic_dec(&system_freezing_cnt);
                         freezer->state &= ~CGROUP_FROZEN;
+                       if (was_freezing)
+                               static_branch_dec(&freezer_active);
                         unfreeze_cgroup(freezer);
                 }
         }
diff --git a/kernel/exit.c b/kernel/exit.c

index 84021b24f79e3d1d2dc11fe70bf69cf620c7fc85..ba683f8d292a4a2c816d1d1c24201e979ae03fe1 100644 (file)
--- a/kernel/exit.c
+++ b/kernel/exit.c
@@ -374,10 +374,10 @@ static void coredump_task_exit(struct task_struct *tsk)
                         complete(&core_state->startup);
  
                 for (;;) {
-                       set_current_state(TASK_UNINTERRUPTIBLE);
+                       set_current_state(TASK_UNINTERRUPTIBLE|TASK_FREEZABLE);
                         if (!self.task) /* see coredump_finish() */
                                 break;
-                       freezable_schedule();
+                       schedule();
                 }
                 __set_current_state(TASK_RUNNING);
         }
diff --git a/kernel/fork.c b/kernel/fork.c

index 90c85b17bf698744c12cb165c05396fa55db7c3a..a1de2f5e305d5e55a3e09cc2b2e71f68ab0a3b64 100644 (file)
--- a/kernel/fork.c
+++ b/kernel/fork.c
@@ -1420,13 +1420,12 @@ static void complete_vfork_done(struct task_struct *tsk)
  static int wait_for_vfork_done(struct task_struct *child,
                                 struct completion *vfork)
  {
+       unsigned int state = TASK_UNINTERRUPTIBLE|TASK_KILLABLE|TASK_FREEZABLE;
         int killed;
  
-       freezer_do_not_count();
         cgroup_enter_frozen();
-       killed = wait_for_completion_killable(vfork);
+       killed = wait_for_completion_state(vfork, state);
         cgroup_leave_frozen(false);
-       freezer_count();
  
         if (killed) {
                 task_lock(child);
diff --git a/kernel/freezer.c b/kernel/freezer.c

index 45ab36ffd0e79cf84fe4a47323811e27ae11357d..4fad0e6fca6447d72388e7ea44e90f34924beb03 100644 (file)
--- a/kernel/freezer.c
+++ b/kernel/freezer.c
@@ -13,10 +13,11 @@
  #include <linux/kthread.h>
  
  /* total number of freezing conditions in effect */
-atomic_t system_freezing_cnt = ATOMIC_INIT(0);
-EXPORT_SYMBOL(system_freezing_cnt);
+DEFINE_STATIC_KEY_FALSE(freezer_active);
+EXPORT_SYMBOL(freezer_active);
  
-/* indicate whether PM freezing is in effect, protected by
+/*
+ * indicate whether PM freezing is in effect, protected by
   * system_transition_mutex
   */
  bool pm_freezing;
@@ -29,7 +30,7 @@ static DEFINE_SPINLOCK(freezer_lock);
   * freezing_slow_path - slow path for testing whether a task needs to be frozen
   * @p: task to be tested
   *
- * This function is called by freezing() if system_freezing_cnt isn't zero
+ * This function is called by freezing() if freezer_active isn't zero
   * and tests whether @p needs to enter and stay in frozen state.  Can be
   * called under any context.  The freezers are responsible for ensuring the
   * target tasks see the updated state.
@@ -52,41 +53,40 @@ bool freezing_slow_path(struct task_struct *p)
  }
  EXPORT_SYMBOL(freezing_slow_path);
  
+bool frozen(struct task_struct *p)
+{
+       return READ_ONCE(p->__state) & TASK_FROZEN;
+}
+
  /* Refrigerator is place where frozen processes are stored :-). */
  bool __refrigerator(bool check_kthr_stop)
  {
-       /* Hmm, should we be allowed to suspend when there are realtime
-          processes around? */
+       unsigned int state = get_current_state();
         bool was_frozen = false;
-       unsigned int save = get_current_state();
  
         pr_debug("%s entered refrigerator\n", current->comm);
  
+       WARN_ON_ONCE(state && !(state & TASK_NORMAL));
+
         for (;;) {
-               set_current_state(TASK_UNINTERRUPTIBLE);
+               bool freeze;
+
+               set_current_state(TASK_FROZEN);
  
                 spin_lock_irq(&freezer_lock);
-               current->flags |= PF_FROZEN;
-               if (!freezing(current) ||
-                   (check_kthr_stop && kthread_should_stop()))
-                       current->flags &= ~PF_FROZEN;
+               freeze = freezing(current) && !(check_kthr_stop && kthread_should_stop());
                 spin_unlock_irq(&freezer_lock);
  
-               if (!(current->flags & PF_FROZEN))
+               if (!freeze)
                         break;
+
                 was_frozen = true;
                 schedule();
         }
+       __set_current_state(TASK_RUNNING);
  
         pr_debug("%s left refrigerator\n", current->comm);
  
-       /*
-        * Restore saved task state before returning.  The mb'd version
-        * needs to be used; otherwise, it might silently break
-        * synchronization which depends on ordered task state change.
-        */
-       set_current_state(save);
-
         return was_frozen;
  }
  EXPORT_SYMBOL(__refrigerator);
@@ -101,6 +101,44 @@ static void fake_signal_wake_up(struct task_struct *p)
         }
  }
  
+static int __set_task_frozen(struct task_struct *p, void *arg)
+{
+       unsigned int state = READ_ONCE(p->__state);
+
+       if (p->on_rq)
+               return 0;
+
+       if (p != current && task_curr(p))
+               return 0;
+
+       if (!(state & (TASK_FREEZABLE | __TASK_STOPPED | __TASK_TRACED)))
+               return 0;
+
+       /*
+        * Only TASK_NORMAL can be augmented with TASK_FREEZABLE, since they
+        * can suffer spurious wakeups.
+        */
+       if (state & TASK_FREEZABLE)
+               WARN_ON_ONCE(!(state & TASK_NORMAL));
+
+#ifdef CONFIG_LOCKDEP
+       /*
+        * It's dangerous to freeze with locks held; there be dragons there.
+        */
+       if (!(state & __TASK_FREEZABLE_UNSAFE))
+               WARN_ON_ONCE(debug_locks && p->lockdep_depth);
+#endif
+
+       WRITE_ONCE(p->__state, TASK_FROZEN);
+       return TASK_FROZEN;
+}
+
+static bool __freeze_task(struct task_struct *p)
+{
+       /* TASK_FREEZABLE|TASK_STOPPED|TASK_TRACED -> TASK_FROZEN */
+       return task_call_func(p, __set_task_frozen, NULL);
+}
+
  /**
   * freeze_task - send a freeze request to given task
   * @p: task to send the request to
@@ -116,20 +154,8 @@ bool freeze_task(struct task_struct *p)
  {
         unsigned long flags;
  
-       /*
-        * This check can race with freezer_do_not_count, but worst case that
-        * will result in an extra wakeup being sent to the task.  It does not
-        * race with freezer_count(), the barriers in freezer_count() and
-        * freezer_should_skip() ensure that either freezer_count() sees
-        * freezing == true in try_to_freeze() and freezes, or
-        * freezer_should_skip() sees !PF_FREEZE_SKIP and freezes the task
-        * normally.
-        */
-       if (freezer_should_skip(p))
-               return false;
-
         spin_lock_irqsave(&freezer_lock, flags);
-       if (!freezing(p) || frozen(p)) {
+       if (!freezing(p) || frozen(p) || __freeze_task(p)) {
                 spin_unlock_irqrestore(&freezer_lock, flags);
                 return false;
         }
@@ -137,19 +163,52 @@ bool freeze_task(struct task_struct *p)
         if (!(p->flags & PF_KTHREAD))
                 fake_signal_wake_up(p);
         else
-               wake_up_state(p, TASK_INTERRUPTIBLE);
+               wake_up_state(p, TASK_NORMAL);
  
         spin_unlock_irqrestore(&freezer_lock, flags);
         return true;
  }
  
+/*
+ * The special task states (TASK_STOPPED, TASK_TRACED) keep their canonical
+ * state in p->jobctl. If either of them got a wakeup that was missed because
+ * TASK_FROZEN, then their canonical state reflects that and the below will
+ * refuse to restore the special state and instead issue the wakeup.
+ */
+static int __set_task_special(struct task_struct *p, void *arg)
+{
+       unsigned int state = 0;
+
+       if (p->jobctl & JOBCTL_TRACED)
+               state = TASK_TRACED;
+
+       else if (p->jobctl & JOBCTL_STOPPED)
+               state = TASK_STOPPED;
+
+       if (state)
+               WRITE_ONCE(p->__state, state);
+
+       return state;
+}
+
  void __thaw_task(struct task_struct *p)
  {
-       unsigned long flags;
+       unsigned long flags, flags2;
  
         spin_lock_irqsave(&freezer_lock, flags);
-       if (frozen(p))
-               wake_up_process(p);
+       if (WARN_ON_ONCE(freezing(p)))
+               goto unlock;
+
+       if (lock_task_sighand(p, &flags2)) {
+               /* TASK_FROZEN -> TASK_{STOPPED,TRACED} */
+               bool ret = task_call_func(p, __set_task_special, NULL);
+               unlock_task_sighand(p, &flags2);
+               if (ret)
+                       goto unlock;
+       }
+
+       wake_up_state(p, TASK_FROZEN);
+unlock:
         spin_unlock_irqrestore(&freezer_lock, flags);
  }
  
diff --git a/kernel/futex/waitwake.c b/kernel/futex/waitwake.c

index 4ce0923f1ce39e4226992efa097cd6ce824570e0..ba01b94082033b18e2c07e7f67599862f5f12929 100644 (file)
--- a/kernel/futex/waitwake.c
+++ b/kernel/futex/waitwake.c
@@ -334,7 +334,7 @@ void futex_wait_queue(struct futex_hash_bucket *hb, struct futex_q *q,
          * futex_queue() calls spin_unlock() upon completion, both serializing
          * access to the hash list and forcing another memory barrier.
          */
-       set_current_state(TASK_INTERRUPTIBLE);
+       set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
         futex_queue(q, hb);
  
         /* Arm the timer */
@@ -352,7 +352,7 @@ void futex_wait_queue(struct futex_hash_bucket *hb, struct futex_q *q,
                  * is no timeout, or if it has yet to expire.
                  */
                 if (!timeout || timeout->task)
-                       freezable_schedule();
+                       schedule();
         }
         __set_current_state(TASK_RUNNING);
  }
@@ -430,7 +430,7 @@ retry:
                         return ret;
         }
  
-       set_current_state(TASK_INTERRUPTIBLE);
+       set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
  
         for (i = 0; i < count; i++) {
                 u32 __user *uaddr = (u32 __user *)(unsigned long)vs[i].w.uaddr;
@@ -504,7 +504,7 @@ static void futex_sleep_multiple(struct futex_vector *vs, unsigned int count,
                         return;
         }
  
-       freezable_schedule();
+       schedule();
  }
  
  /**
diff --git a/kernel/hung_task.c b/kernel/hung_task.c

index bb2354f73dedcaf2c2d82ebebca2d5b9b86d2bf0..f1321c03c32af47c20aaf18ed0fc9a89a57e0be5 100644 (file)
--- a/kernel/hung_task.c
+++ b/kernel/hung_task.c
@@ -95,8 +95,8 @@ static void check_hung_task(struct task_struct *t, unsigned long timeout)
          * Ensure the task is not frozen.
          * Also, skip vfork and any other user process that freezer should skip.
          */
-       if (unlikely(t->flags & (PF_FROZEN | PF_FREEZER_SKIP)))
-           return;
+       if (unlikely(READ_ONCE(t->__state) & (TASK_FREEZABLE | TASK_FROZEN)))
+               return;
  
         /*
          * When a freshly created task is scheduled once, changes its state to
diff --git a/kernel/power/main.c b/kernel/power/main.c

index dae3d17919e6f3710d2e7c007ec7a96bfcaa5bb6..31ec4a9b9d7045315ed60c26c8b385be74eed652 100644 (file)
--- a/kernel/power/main.c
+++ b/kernel/power/main.c
@@ -24,7 +24,7 @@
  unsigned int lock_system_sleep(void)
  {
         unsigned int flags = current->flags;
-       current->flags |= PF_FREEZER_SKIP;
+       current->flags |= PF_NOFREEZE;
         mutex_lock(&system_transition_mutex);
         return flags;
  }
@@ -48,8 +48,8 @@ void unlock_system_sleep(unsigned int flags)
          * Which means, if we use try_to_freeze() here, it would make them
          * enter the refrigerator, thus causing hibernation to lockup.
          */
-       if (!(flags & PF_FREEZER_SKIP))
-               current->flags &= ~PF_FREEZER_SKIP;
+       if (!(flags & PF_NOFREEZE))
+               current->flags &= ~PF_NOFREEZE;
         mutex_unlock(&system_transition_mutex);
  }
  EXPORT_SYMBOL_GPL(unlock_system_sleep);
diff --git a/kernel/power/process.c b/kernel/power/process.c

index 3068601e585a8fd5066d5b0bfd4c1c1fb7ddaee0..ddd9988327fe2b107046747a32fbe25caf31697a 100644 (file)
--- a/kernel/power/process.c
+++ b/kernel/power/process.c
@@ -50,8 +50,7 @@ static int try_to_freeze_tasks(bool user_only)
                         if (p == current || !freeze_task(p))
                                 continue;
  
-                       if (!freezer_should_skip(p))
-                               todo++;
+                       todo++;
                 }
                 read_unlock(&tasklist_lock);
  
@@ -96,8 +95,7 @@ static int try_to_freeze_tasks(bool user_only)
                 if (!wakeup || pm_debug_messages_on) {
                         read_lock(&tasklist_lock);
                         for_each_process_thread(g, p) {
-                               if (p != current && !freezer_should_skip(p)
-                                   && freezing(p) && !frozen(p))
+                               if (p != current && freezing(p) && !frozen(p))
                                         sched_show_task(p);
                         }
                         read_unlock(&tasklist_lock);
@@ -129,7 +127,7 @@ int freeze_processes(void)
         current->flags |= PF_SUSPEND_TASK;
  
         if (!pm_freezing)
-               atomic_inc(&system_freezing_cnt);
+               static_branch_inc(&freezer_active);
  
         pm_wakeup_clear(0);
         pr_info("Freezing user space processes ... ");
@@ -190,7 +188,7 @@ void thaw_processes(void)
  
         trace_suspend_resume(TPS("thaw_processes"), 0, true);
         if (pm_freezing)
-               atomic_dec(&system_freezing_cnt);
+               static_branch_dec(&freezer_active);
         pm_freezing = false;
         pm_nosig_freezing = false;
  
diff --git a/kernel/ptrace.c b/kernel/ptrace.c

index 1893d909e45ca6c575efb105ce12f35da7eadbb7..54482193e1edc2c665a8f32f08c4d81300757dbc 100644 (file)
--- a/kernel/ptrace.c
+++ b/kernel/ptrace.c
@@ -269,7 +269,7 @@ static int ptrace_check_attach(struct task_struct *child, bool ignore_state)
         read_unlock(&tasklist_lock);
  
         if (!ret && !ignore_state &&
-           WARN_ON_ONCE(!wait_task_inactive(child, __TASK_TRACED)))
+           WARN_ON_ONCE(!wait_task_inactive(child, __TASK_TRACED|TASK_FROZEN)))
                 ret = -ESRCH;
  
         return ret;
diff --git a/kernel/sched/core.c b/kernel/sched/core.c

index ea26526b45bbf86a573d8b5ab5daaa21ca231289..2b85d1b5fe0c10d0184ca9537e5569c1ac5af558 100644 (file)
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -6428,7 +6428,7 @@ static void __sched notrace __schedule(unsigned int sched_mode)
                         prev->sched_contributes_to_load =
                                 (prev_state & TASK_UNINTERRUPTIBLE) &&
                                 !(prev_state & TASK_NOLOAD) &&
-                               !(prev->flags & PF_FROZEN);
+                               !(prev_state & TASK_FROZEN);
  
                         if (prev->sched_contributes_to_load)
                                 rq->nr_uninterruptible++;
diff --git a/kernel/signal.c b/kernel/signal.c

index 6f86fda5e432aeb32ae5dbca2c4264a2781b3dde..c2e90d6ca0d10368f2cc4c10e2b9e3a722f69967 100644 (file)
--- a/kernel/signal.c
+++ b/kernel/signal.c
@@ -2304,7 +2304,7 @@ static int ptrace_stop(int exit_code, int why, unsigned long message,
         read_unlock(&tasklist_lock);
         cgroup_enter_frozen();
         preempt_enable_no_resched();
-       freezable_schedule();
+       schedule();
         cgroup_leave_frozen(true);
  
         /*
@@ -2473,7 +2473,7 @@ static bool do_signal_stop(int signr)
  
                 /* Now we don't run again until woken by SIGCONT or SIGKILL */
                 cgroup_enter_frozen();
-               freezable_schedule();
+               schedule();
                 return true;
         } else {
                 /*
@@ -2548,11 +2548,11 @@ static void do_freezer_trap(void)
          * immediately (if there is a non-fatal signal pending), and
          * put the task into sleep.
          */
-       __set_current_state(TASK_INTERRUPTIBLE);
+       __set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
         clear_thread_flag(TIF_SIGPENDING);
         spin_unlock_irq(&current->sighand->siglock);
         cgroup_enter_frozen();
-       freezable_schedule();
+       schedule();
  }
  
  static int ptrace_signal(int signr, kernel_siginfo_t *info, enum pid_type type)
@@ -3600,9 +3600,9 @@ static int do_sigtimedwait(const sigset_t *which, kernel_siginfo_t *info,
                 recalc_sigpending();
                 spin_unlock_irq(&tsk->sighand->siglock);
  
-               __set_current_state(TASK_INTERRUPTIBLE);
-               ret = freezable_schedule_hrtimeout_range(to, tsk->timer_slack_ns,
-                                                        HRTIMER_MODE_REL);
+               __set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
+               ret = schedule_hrtimeout_range(to, tsk->timer_slack_ns,
+                                              HRTIMER_MODE_REL);
                 spin_lock_irq(&tsk->sighand->siglock);
                 __set_task_blocked(tsk, &tsk->real_blocked);
                 sigemptyset(&tsk->real_blocked);
diff --git a/kernel/time/hrtimer.c b/kernel/time/hrtimer.c

index 23af5eca11b14c81eaba6e5c49f791806f110c2e..3ae661ab62603c4f6ad6a162e4d3586346ead934 100644 (file)
--- a/kernel/time/hrtimer.c
+++ b/kernel/time/hrtimer.c
@@ -2037,11 +2037,11 @@ static int __sched do_nanosleep(struct hrtimer_sleeper *t, enum hrtimer_mode mod
         struct restart_block *restart;
  
         do {
-               set_current_state(TASK_INTERRUPTIBLE);
+               set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
                 hrtimer_sleeper_start_expires(t, mode);
  
                 if (likely(t->task))
-                       freezable_schedule();
+                       schedule();
  
                 hrtimer_cancel(&t->timer);
                 mode = HRTIMER_MODE_ABS;
diff --git a/kernel/umh.c b/kernel/umh.c

index 8945eaf4c67179827fe7c571047ced851d448fcc..8506315186652dffd12eb395931c270a82463516 100644 (file)
--- a/kernel/umh.c
+++ b/kernel/umh.c
@@ -404,6 +404,7 @@ EXPORT_SYMBOL(call_usermodehelper_setup);
   */
  int call_usermodehelper_exec(struct subprocess_info *sub_info, int wait)
  {
+       unsigned int state = TASK_UNINTERRUPTIBLE;
         DECLARE_COMPLETION_ONSTACK(done);
         int retval = 0;
  
@@ -437,25 +438,22 @@ int call_usermodehelper_exec(struct subprocess_info *sub_info, int wait)
         if (wait == UMH_NO_WAIT)        /* task has freed sub_info */
                 goto unlock;
  
+       if (wait & UMH_KILLABLE)
+               state |= TASK_KILLABLE;
+
         if (wait & UMH_FREEZABLE)
-               freezer_do_not_count();
+               state |= TASK_FREEZABLE;
  
-       if (wait & UMH_KILLABLE) {
-               retval = wait_for_completion_killable(&done);
-               if (!retval)
-                       goto wait_done;
+       retval = wait_for_completion_state(&done, state);
+       if (!retval)
+               goto wait_done;
  
+       if (wait & UMH_KILLABLE) {
                 /* umh_complete() will see NULL and free sub_info */
                 if (xchg(&sub_info->complete, NULL))
                         goto unlock;
-               /* fallthrough, umh_complete() was already called */
         }
  
-       wait_for_completion(&done);
-
-       if (wait & UMH_FREEZABLE)
-               freezer_count();
-
  wait_done:
         retval = sub_info->retval;
  out:
diff --git a/mm/khugepaged.c b/mm/khugepaged.c

index 01f71786d530353c2c9a14adaf068c13cb204f83..77162fb7e90b0aeccaa4bbda0cd298e2485b1d1e 100644 (file)
--- a/mm/khugepaged.c
+++ b/mm/khugepaged.c
@@ -730,8 +730,8 @@ static void khugepaged_alloc_sleep(void)
         DEFINE_WAIT(wait);
  
         add_wait_queue(&khugepaged_wait, &wait);
-       freezable_schedule_timeout_interruptible(
-               msecs_to_jiffies(khugepaged_alloc_sleep_millisecs));
+       __set_current_state(TASK_INTERRUPTIBLE|TASK_FREEZABLE);
+       schedule_timeout(msecs_to_jiffies(khugepaged_alloc_sleep_millisecs));
         remove_wait_queue(&khugepaged_wait, &wait);
  }
  
diff --git a/net/sunrpc/sched.c b/net/sunrpc/sched.c

index 25b9221950ffbfa43f47498c6af563548f2eb54f..46cbf151a50b1af58a00fde1b0cf4bd7bd76d83e 100644 (file)
--- a/net/sunrpc/sched.c
+++ b/net/sunrpc/sched.c
@@ -269,7 +269,7 @@ EXPORT_SYMBOL_GPL(rpc_destroy_wait_queue);
  
  static int rpc_wait_bit_killable(struct wait_bit_key *key, int mode)
  {
-       freezable_schedule_unsafe();
+       schedule();
         if (signal_pending_state(mode, current))
                 return -ERESTARTSYS;
         return 0;
@@ -333,14 +333,12 @@ static int rpc_complete_task(struct rpc_task *task)
   * to enforce taking of the wq->lock and hence avoid races with
   * rpc_complete_task().
   */
-int __rpc_wait_for_completion_task(struct rpc_task *task, wait_bit_action_f *action)
+int rpc_wait_for_completion_task(struct rpc_task *task)
  {
-       if (action == NULL)
-               action = rpc_wait_bit_killable;
         return out_of_line_wait_on_bit(&task->tk_runstate, RPC_TASK_ACTIVE,
-                       action, TASK_KILLABLE);
+                       rpc_wait_bit_killable, TASK_KILLABLE|TASK_FREEZABLE_UNSAFE);
  }
-EXPORT_SYMBOL_GPL(__rpc_wait_for_completion_task);
+EXPORT_SYMBOL_GPL(rpc_wait_for_completion_task);
  
  /*
   * Make an RPC task runnable.
@@ -964,7 +962,7 @@ static void __rpc_execute(struct rpc_task *task)
                 trace_rpc_task_sync_sleep(task, task->tk_action);
                 status = out_of_line_wait_on_bit(&task->tk_runstate,
                                 RPC_TASK_QUEUED, rpc_wait_bit_killable,
-                               TASK_KILLABLE);
+                               TASK_KILLABLE|TASK_FREEZABLE);
                 if (status < 0) {
                         /*
                          * When a sync task receives a signal, it exits with
diff --git a/net/unix/af_unix.c b/net/unix/af_unix.c

index bf338b782fc4c49c0f59fffe7fbf02f4ec9a2229..dda9eb1ab41f05bb9fedff6781281d49f7694589 100644 (file)
--- a/net/unix/af_unix.c
+++ b/net/unix/af_unix.c
@@ -2543,13 +2543,14 @@ static long unix_stream_data_wait(struct sock *sk, long timeo,
                                   struct sk_buff *last, unsigned int last_len,
                                   bool freezable)
  {
+       unsigned int state = TASK_INTERRUPTIBLE | freezable * TASK_FREEZABLE;
         struct sk_buff *tail;
         DEFINE_WAIT(wait);
  
         unix_state_lock(sk);
  
         for (;;) {
-               prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
+               prepare_to_wait(sk_sleep(sk), &wait, state);
  
                 tail = skb_peek_tail(&sk->sk_receive_queue);
                 if (tail != last ||
@@ -2562,10 +2563,7 @@ static long unix_stream_data_wait(struct sock *sk, long timeo,
  
                 sk_set_bit(SOCKWQ_ASYNC_WAITDATA, sk);
                 unix_state_unlock(sk);
-               if (freezable)
-                       timeo = freezable_schedule_timeout(timeo);
-               else
-                       timeo = schedule_timeout(timeo);
+               timeo = schedule_timeout(timeo);
                 unix_state_lock(sk);
  
                 if (sock_flag(sk, SOCK_DEAD))
author	Peter Zijlstra <peterz@infradead.org>
	Mon, 22 Aug 2022 11:18:22 +0000 (13:18 +0200)
committer	Peter Zijlstra <peterz@infradead.org>
	Wed, 7 Sep 2022 19:53:50 +0000 (21:53 +0200)
drivers/android/binder.c		patch \| blob \| history
drivers/media/pci/pt3/pt3.c		patch \| blob \| history
fs/cifs/inode.c		patch \| blob \| history
fs/cifs/transport.c		patch \| blob \| history
fs/coredump.c		patch \| blob \| history
fs/nfs/file.c		patch \| blob \| history
fs/nfs/inode.c		patch \| blob \| history
fs/nfs/nfs3proc.c		patch \| blob \| history
fs/nfs/nfs4proc.c		patch \| blob \| history
fs/nfs/nfs4state.c		patch \| blob \| history
fs/nfs/pnfs.c		patch \| blob \| history
fs/xfs/xfs_trans_ail.c		patch \| blob \| history
include/linux/freezer.h		patch \| blob \| history
include/linux/sched.h		patch \| blob \| history
include/linux/sunrpc/sched.h		patch \| blob \| history
include/linux/wait.h		patch \| blob \| history
kernel/cgroup/legacy_freezer.c		patch \| blob \| history
kernel/exit.c		patch \| blob \| history
kernel/fork.c		patch \| blob \| history
kernel/freezer.c		patch \| blob \| history
kernel/futex/waitwake.c		patch \| blob \| history
kernel/hung_task.c		patch \| blob \| history
kernel/power/main.c		patch \| blob \| history
kernel/power/process.c		patch \| blob \| history
kernel/ptrace.c		patch \| blob \| history
kernel/sched/core.c		patch \| blob \| history
kernel/signal.c		patch \| blob \| history
kernel/time/hrtimer.c		patch \| blob \| history
kernel/umh.c		patch \| blob \| history
mm/khugepaged.c		patch \| blob \| history
net/sunrpc/sched.c		patch \| blob \| history
net/unix/af_unix.c		patch \| blob \| history