gfs2: Fix glock_hash_walk bugs
author: Andreas Gruenbacher <agruenba@redhat.com>
Thu, 7 Oct 2021 13:57:44 +0000 (15:57 +0200)
committer: Andreas Gruenbacher <agruenba@redhat.com>
Mon, 25 Oct 2021 06:42:20 +0000 (08:42 +0200)
So far, glock_hash_walk took a reference on each glock it iterated over, and it
was the examiner's responsibility to drop those references.  Dropping the final
reference to a glock can sleep and the examiners are called in an RCU critical
section with spin locks held, so examiners that didn't need the extra reference
had to drop it asynchronously via gfs2_glock_queue_put or similar.  This wasn't
done correctly in thaw_glock which did call gfs2_glock_put, and not at all in
dump_glock_func.

Change glock_hash_walk to not take glock references at all.  That way, the
examiners that don't need them won't have to bother with slow asynchronous
puts, and the examiners that do need references can take them themselves.

Reported-by: Alexander Aring <aahringo@redhat.com>
Signed-off-by: Andreas Gruenbacher <agruenba@redhat.com>
fs/gfs2/glock.c

index 190d7eb2d0eae1cc0e86efe3742d39cf33660f65..6e3bd5ab91089d47aef765167f184162615b8136 100644 (file)
@@ -2101,10 +2101,10 @@ static void glock_hash_walk(glock_examiner examiner, const struct gfs2_sbd *sdp)
        do {
                rhashtable_walk_start(&iter);
 
-               while ((gl = rhashtable_walk_next(&iter)) && !IS_ERR(gl))
-                       if (gl->gl_name.ln_sbd == sdp &&
-                           lockref_get_not_dead(&gl->gl_lockref))
+               while ((gl = rhashtable_walk_next(&iter)) && !IS_ERR(gl)) {
+                       if (gl->gl_name.ln_sbd == sdp)
                                examiner(gl);
+               }
 
                rhashtable_walk_stop(&iter);
        } while (cond_resched(), gl == ERR_PTR(-EAGAIN));
@@ -2146,7 +2146,6 @@ static void flush_delete_work(struct gfs2_glock *gl)
                                           &gl->gl_delete, 0);
                }
        }
-       gfs2_glock_queue_work(gl, 0);
 }
 
 void gfs2_flush_delete_work(struct gfs2_sbd *sdp)
@@ -2163,10 +2162,10 @@ void gfs2_flush_delete_work(struct gfs2_sbd *sdp)
 
 static void thaw_glock(struct gfs2_glock *gl)
 {
-       if (!test_and_clear_bit(GLF_FROZEN, &gl->gl_flags)) {
-               gfs2_glock_put(gl);
+       if (!test_and_clear_bit(GLF_FROZEN, &gl->gl_flags))
+               return;
+       if (!lockref_get_not_dead(&gl->gl_lockref))
                return;
-       }
        set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
        gfs2_glock_queue_work(gl, 0);
 }
@@ -2182,9 +2181,12 @@ static void clear_glock(struct gfs2_glock *gl)
        gfs2_glock_remove_from_lru(gl);
 
        spin_lock(&gl->gl_lockref.lock);
-       if (gl->gl_state != LM_ST_UNLOCKED)
-               handle_callback(gl, LM_ST_UNLOCKED, 0, false);
-       __gfs2_glock_queue_work(gl, 0);
+       if (!__lockref_is_dead(&gl->gl_lockref)) {
+               gl->gl_lockref.count++;
+               if (gl->gl_state != LM_ST_UNLOCKED)
+                       handle_callback(gl, LM_ST_UNLOCKED, 0, false);
+               __gfs2_glock_queue_work(gl, 0);
+       }
        spin_unlock(&gl->gl_lockref.lock);
 }