; GFX9-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v3
; GFX9-NEXT: global_store_short v1, v0, s[2:3]
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v3
; GFX90A-NEXT: global_store_short v1, v0, s[2:3]
; GFX9-NEXT: v_mad_f32 v1, -v2, v0, v1
; GFX9-NEXT: v_cvt_i32_f32_e32 v2, v2
; GFX9-NEXT: v_cmp_ge_f32_e64 s[2:3], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[2:3], 0
+; GFX9-NEXT: s_and_b64 s[2:3], s[2:3], exec
; GFX9-NEXT: s_cselect_b32 s2, s6, 0
; GFX9-NEXT: v_add_u32_e32 v0, s2, v2
; GFX9-NEXT: v_mul_lo_u32 v0, v0, s5
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s6, 0
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v3
; GFX90A-NEXT: v_mul_lo_u32 v0, v0, s5
; GFX9-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v3
; GFX9-NEXT: global_store_byte v1, v0, s[2:3]
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v3
; GFX90A-NEXT: global_store_byte v1, v0, s[2:3]
; GFX9-NEXT: v_mad_f32 v1, -v2, v0, v1
; GFX9-NEXT: v_cvt_i32_f32_e32 v2, v2
; GFX9-NEXT: v_cmp_ge_f32_e64 s[2:3], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[2:3], 0
+; GFX9-NEXT: s_and_b64 s[2:3], s[2:3], exec
; GFX9-NEXT: s_cselect_b32 s2, s6, 0
; GFX9-NEXT: v_add_u32_e32 v0, s2, v2
; GFX9-NEXT: v_mul_lo_u32 v0, v0, s5
; GFX90A-NEXT: v_mad_f32 v2, -v3, v1, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v1|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s6, 0
; GFX90A-NEXT: v_add_u32_e32 v1, s0, v3
; GFX90A-NEXT: v_mul_lo_u32 v1, v1, s5
; GFX9-NEXT: v_trunc_f32_e32 v3, v3
; GFX9-NEXT: v_mad_f32 v1, -v3, v0, v1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s8, 0
; GFX9-NEXT: s_ashr_i32 s1, s6, 16
; GFX9-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX9-NEXT: v_mad_f32 v1, -v4, v0, v1
; GFX9-NEXT: s_or_b32 s4, s0, 1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: v_cvt_i32_f32_e32 v4, v4
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
; GFX9-NEXT: s_sext_i32_i16 s1, s7
; GFX9-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_trunc_f32_e32 v5, v5
; GFX9-NEXT: v_mad_f32 v1, -v5, v0, v1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: s_ashr_i32 s1, s7, 16
; GFX9-NEXT: v_mad_f32 v5, -v6, v0, v5
; GFX9-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_mov_b32_e32 v5, 0xffff
; GFX9-NEXT: v_add_u32_e32 v0, s0, v6
; GFX90A-NEXT: v_trunc_f32_e32 v3, v3
; GFX90A-NEXT: v_mad_f32 v1, -v3, v0, v1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s8, 0
; GFX90A-NEXT: s_ashr_i32 s1, s6, 16
; GFX90A-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX90A-NEXT: v_mad_f32 v1, -v4, v0, v1
; GFX90A-NEXT: s_or_b32 s4, s0, 1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: v_cvt_i32_f32_e32 v4, v4
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
; GFX90A-NEXT: s_sext_i32_i16 s1, s7
; GFX90A-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_trunc_f32_e32 v5, v5
; GFX90A-NEXT: v_mad_f32 v1, -v5, v0, v1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: s_ashr_i32 s1, s7, 16
; GFX90A-NEXT: v_mad_f32 v5, -v6, v0, v5
; GFX90A-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_mov_b32_e32 v5, 0xffff
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v6
; GFX9-NEXT: v_trunc_f32_e32 v3, v3
; GFX9-NEXT: v_mad_f32 v1, -v3, v0, v1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s8, 0
; GFX9-NEXT: s_ashr_i32 s9, s6, 16
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: v_cvt_i32_f32_e32 v4, v4
; GFX9-NEXT: s_or_b32 s6, s0, 1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s6, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v4
; GFX9-NEXT: s_sext_i32_i16 s0, s7
; GFX9-NEXT: v_mad_f32 v4, -v5, v3, v4
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
; GFX9-NEXT: v_cvt_i32_f32_e32 v5, v5
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s6, 0
; GFX9-NEXT: s_ashr_i32 s6, s7, 16
; GFX9-NEXT: v_cvt_f32_i32_e32 v4, s6
; GFX9-NEXT: v_mad_f32 v5, -v6, v4, v5
; GFX9-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v4|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s9, 0
; GFX9-NEXT: v_add_u32_e32 v4, s0, v6
; GFX9-NEXT: v_mul_lo_u32 v4, v4, s6
; GFX90A-NEXT: v_mad_f32 v1, -v3, v0, v1
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s8, 0
; GFX90A-NEXT: s_ashr_i32 s8, s6, 16
; GFX90A-NEXT: v_cvt_f32_i32_e32 v1, s8
; GFX90A-NEXT: v_mad_f32 v3, -v4, v1, v3
; GFX90A-NEXT: v_cvt_i32_f32_e32 v4, v4
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v1|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s6, 0
; GFX90A-NEXT: v_add_u32_e32 v1, s0, v4
; GFX90A-NEXT: s_sext_i32_i16 s0, s7
; GFX90A-NEXT: v_mad_f32 v1, -v5, v3, v1
; GFX90A-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v3|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: s_ashr_i32 s4, s7, 16
; GFX90A-NEXT: v_cvt_f32_i32_e32 v3, s4
; GFX90A-NEXT: v_mad_f32 v5, -v6, v3, v5
; GFX90A-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v3|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s6, 0
; GFX90A-NEXT: v_add_u32_e32 v3, s0, v6
; GFX90A-NEXT: v_mul_lo_u32 v3, v3, s4
; GFX9-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v3
; GFX9-NEXT: v_and_b32_e32 v0, 7, v0
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v3
; GFX90A-NEXT: v_and_b32_e32 v0, 7, v0
; GFX9-NEXT: v_mad_f32 v1, -v2, v0, v1
; GFX9-NEXT: v_cvt_i32_f32_e32 v2, v2
; GFX9-NEXT: v_cmp_ge_f32_e64 s[2:3], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[2:3], 0
+; GFX9-NEXT: s_and_b64 s[2:3], s[2:3], exec
; GFX9-NEXT: s_cselect_b32 s2, s6, 0
; GFX9-NEXT: v_add_u32_e32 v0, s2, v2
; GFX9-NEXT: v_mul_lo_u32 v0, v0, s5
; GFX90A-NEXT: v_mad_f32 v2, -v3, v1, v2
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v1|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s6, 0
; GFX90A-NEXT: v_add_u32_e32 v1, s0, v3
; GFX90A-NEXT: v_mul_lo_u32 v1, v1, s5
; GFX9-NEXT: v_trunc_f32_e32 v3, v3
; GFX9-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s8, 0
; GFX9-NEXT: s_ashr_i32 s1, s6, 16
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: v_trunc_f32_e32 v4, v4
; GFX9-NEXT: v_mad_f32 v3, -v4, v0, v3
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v0|
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: v_cvt_i32_f32_e32 v4, v4
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
; GFX9-NEXT: s_sext_i32_i16 s1, s7
; GFX9-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_mad_f32 v4, -v5, v0, v4
; GFX9-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v5
; GFX9-NEXT: v_and_b32_e32 v2, 0xffff, v2
; GFX90A-NEXT: v_trunc_f32_e32 v3, v3
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s8, 0
; GFX90A-NEXT: s_ashr_i32 s1, s6, 16
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_trunc_f32_e32 v4, v4
; GFX90A-NEXT: v_mad_f32 v3, -v4, v0, v3
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v0|
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: v_cvt_i32_f32_e32 v4, v4
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
; GFX90A-NEXT: s_sext_i32_i16 s1, s7
; GFX90A-NEXT: v_cvt_f32_i32_e32 v0, s1
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_mad_f32 v4, -v5, v0, v4
; GFX90A-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_add_u32_e32 v0, s0, v5
; GFX90A-NEXT: v_and_b32_e32 v2, 0xffff, v2
; GFX9-NEXT: v_trunc_f32_e32 v2, v2
; GFX9-NEXT: v_mad_f32 v1, -v2, v0, v1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v1|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s10, 0
; GFX9-NEXT: s_ashr_i32 s2, s2, 16
; GFX9-NEXT: v_cvt_i32_f32_e32 v2, v2
; GFX9-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX9-NEXT: s_or_b32 s8, s0, 1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: v_cvt_f32_i32_e32 v2, s3
; GFX9-NEXT: s_cselect_b32 s0, s8, 0
; GFX9-NEXT: v_add_u32_e32 v0, s0, v3
; GFX9-NEXT: v_mad_f32 v3, -v4, v2, v3
; GFX9-NEXT: v_cvt_i32_f32_e32 v4, v4
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v2|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s7, 0
; GFX9-NEXT: v_add_u32_e32 v2, s0, v4
; GFX9-NEXT: v_mul_lo_u32 v2, v2, s3
; GFX90A-NEXT: v_trunc_f32_e32 v3, v3
; GFX90A-NEXT: v_mad_f32 v2, -v3, v0, v2
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v2|, |v0|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s10, 0
; GFX90A-NEXT: s_ashr_i32 s6, s6, 16
; GFX90A-NEXT: v_cvt_i32_f32_e32 v3, v3
; GFX90A-NEXT: v_cvt_i32_f32_e32 v4, v4
; GFX90A-NEXT: s_or_b32 s8, s0, 1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v2|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s8, 0
; GFX90A-NEXT: v_add_u32_e32 v2, s0, v4
; GFX90A-NEXT: v_mul_lo_u32 v2, v2, s6
; GFX90A-NEXT: v_mad_f32 v4, -v5, v3, v4
; GFX90A-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s5, 0
; GFX90A-NEXT: v_add_u32_e32 v3, s0, v5
; GFX90A-NEXT: v_sub_u32_e32 v0, s9, v0
; GFX9-NEXT: v_trunc_f32_e32 v5, v5
; GFX9-NEXT: v_mad_f32 v4, -v5, v3, v4
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX9-NEXT: s_cselect_b32 s0, s5, 0
; GFX9-NEXT: s_bfe_i32 s1, s6, 0xf000f
; GFX9-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v3|
; GFX9-NEXT: v_cvt_f32_i32_e32 v3, v1
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s4, 0
; GFX9-NEXT: v_bfe_i32 v0, v0, 0, 15
; GFX9-NEXT: v_add_u32_e32 v5, s0, v6
; GFX90A-NEXT: v_trunc_f32_e32 v5, v5
; GFX90A-NEXT: v_mad_f32 v4, -v5, v3, v4
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX90A-NEXT: s_cselect_b32 s0, s5, 0
; GFX90A-NEXT: s_bfe_i32 s1, s6, 0xf000f
; GFX90A-NEXT: v_cvt_i32_f32_e32 v6, v6
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v3|
; GFX90A-NEXT: v_cvt_f32_i32_e32 v3, v1
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_bfe_i32 v0, v0, 0, 15
; GFX90A-NEXT: v_add_u32_e32 v5, s0, v6
; GFX9-NEXT: s_bfe_u32 s10, s6, 0xf000f
; GFX9-NEXT: s_or_b32 s11, s0, 1
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v3|, |v2|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s11, 0
; GFX9-NEXT: v_add_u32_e32 v2, s0, v4
; GFX9-NEXT: s_bfe_i32 s0, s10, 0xf0000
; GFX9-NEXT: v_mad_f32 v4, -v5, v3, v4
; GFX9-NEXT: v_cvt_i32_f32_e32 v5, v5
; GFX9-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
-; GFX9-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX9-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX9-NEXT: s_cselect_b32 s0, s5, 0
; GFX9-NEXT: v_bfe_i32 v4, v1, 0, 15
; GFX9-NEXT: v_add_u32_e32 v3, s0, v5
; GFX90A-NEXT: s_bfe_u32 s10, s6, 0xf000f
; GFX90A-NEXT: s_or_b32 s11, s0, 1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v4|, |v3|
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s11, 0
; GFX90A-NEXT: v_add_u32_e32 v3, s0, v5
; GFX90A-NEXT: s_bfe_i32 s0, s10, 0xf0000
; GFX90A-NEXT: s_or_b32 s4, s0, 1
; GFX90A-NEXT: v_cmp_ge_f32_e64 s[0:1], |v5|, |v4|
; GFX90A-NEXT: v_and_b32_e32 v1, s8, v1
-; GFX90A-NEXT: s_cmp_lg_u64 s[0:1], 0
+; GFX90A-NEXT: s_and_b64 s[0:1], s[0:1], exec
; GFX90A-NEXT: s_cselect_b32 s0, s4, 0
; GFX90A-NEXT: v_bfe_i32 v5, v1, 0, 15
; GFX90A-NEXT: v_add_u32_e32 v4, s0, v6