-; RUN: llc -march=mipsel --disable-machine-licm -mcpu=mips32 -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS32-ANY,NO-SEB-SEH,CHECK-EL,NOT-MICROMIPS
-; RUN: llc -march=mipsel --disable-machine-licm -mcpu=mips32r2 -relocation-model=pic -verify-machineinstrs < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS32-ANY,HAS-SEB-SEH,CHECK-EL,NOT-MICROMIPS
-; RUN: llc -march=mipsel --disable-machine-licm -mcpu=mips32r6 -relocation-model=pic -verify-machineinstrs < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS32-ANY,HAS-SEB-SEH,CHECK-EL,MIPSR6
-; RUN: llc -march=mips64el --disable-machine-licm -mcpu=mips4 -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS64-ANY,NO-SEB-SEH,CHECK-EL,NOT-MICROMIPS
-; RUN: llc -march=mips64el --disable-machine-licm -mcpu=mips64 -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS64-ANY,NO-SEB-SEH,CHECK-EL,NOT-MICROMIPS
-; RUN: llc -march=mips64el --disable-machine-licm -mcpu=mips64r2 -relocation-model=pic -verify-machineinstrs < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS64-ANY,HAS-SEB-SEH,CHECK-EL,NOT-MICROMIPS
-; RUN: llc -march=mips64el --disable-machine-licm -mcpu=mips64r6 -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS64-ANY,HAS-SEB-SEH,CHECK-EL,MIPSR6
-; RUN: llc -march=mips64 -O0 -mcpu=mips64r6 -relocation-model=pic -verify-machineinstrs < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL-LABEL,MIPS64-ANY,O0
-; RUN: llc -march=mipsel --disable-machine-licm -mcpu=mips32r2 -mattr=micromips -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS32-ANY,HAS-SEB-SEH,CHECK-EL,MICROMIPS
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu -O0 --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32O0
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu --disable-machine-licm -mcpu=mips32r2 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32R2
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu --disable-machine-licm -mcpu=mips32r6 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32R6
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu -O0 --disable-machine-licm -mcpu=mips32r6 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32R6O0
+; RUN: llc -mtriple=mips64el-unknown-linux-gnu --disable-machine-licm -mcpu=mips4 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS4
+; RUN: llc -mtriple=mips64el-unknown-linux-gnu --disable-machine-licm -mcpu=mips64 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS64
+; RUN: llc -mtriple=mips64el-unknown-linux-gnu --disable-machine-licm -mcpu=mips64r2 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS64R2
+; RUN: llc -mtriple=mips64el-unknown-linux-gnu --disable-machine-licm -mcpu=mips64r6 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS64R6
+; RUN: llc -mtriple=mips64-unknown-linux-gnu -O0 -mcpu=mips64r6 -relocation-model=pic -verify-machineinstrs -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS64R6O0
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu --disable-machine-licm -mcpu=mips32r2 -mattr=micromips -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MM32
+
+; We want to verify the produced code is well formed all optimization levels, the rest of the tests which ensure correctness.
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu -O1 --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | FileCheck %s --check-prefix=O1
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu -O2 --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | FileCheck %s --check-prefix=O2
+; RUN: llc -mtriple=mipsel-unknown-linux-gnu -O3 --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | FileCheck %s --check-prefix=O3
; Keep one big-endian check so that we don't reduce testing, but don't add more
; since endianness doesn't affect the body of the atomic operations.
-; RUN: llc -march=mips --disable-machine-licm -mcpu=mips32 -relocation-model=pic < %s | \
-; RUN: FileCheck %s -check-prefixes=ALL,MIPS32-ANY,NO-SEB-SEH,CHECK-EB,NOT-MICROMIPS
+; RUN: llc -mtriple=mips-unknown-linux-gnu --disable-machine-licm -mcpu=mips32 -relocation-model=pic -verify-machineinstrs < %s | \
+; RUN: FileCheck %s -check-prefix=MIPS32EB
@x = common global i32 0, align 4
define i32 @AtomicLoadAdd32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadAdd32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB0_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: addu $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB0_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadAdd32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB0_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: addu $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB0_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadAdd32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB0_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: addu $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB0_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadAdd32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB0_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: addu $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB0_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadAdd32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB0_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: addu $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB0_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadAdd32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB0_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: addu $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB0_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadAdd32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB0_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: addu $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB0_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadAdd32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB0_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: addu $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB0_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadAdd32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB0_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: addu $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB0_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadAdd32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB0_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: addu $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB0_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadAdd32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB0_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: addu16 $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB0_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadAdd32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB0_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: addu $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB0_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadAdd32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB0_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: addu $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB0_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadAdd32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB0_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: addu $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB0_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadAdd32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB0_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: addu $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB0_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
entry:
%0 = atomicrmw add i32* @x, i32 %incr monotonic
ret i32 %0
-; ALL-LABEL: AtomicLoadAdd32:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(x)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(x)(
+}
-; O0: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; O0: ld $[[R1:[0-9]+]]
-; O0-NEXT: ll $[[R2:[0-9]+]], 0($[[R1]])
+define i32 @AtomicLoadSub32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadSub32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB1_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: subu $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB1_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadSub32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB1_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: subu $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB1_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadSub32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB1_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: subu $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB1_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadSub32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB1_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: subu $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB1_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadSub32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB1_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: subu $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB1_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadSub32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB1_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: subu $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB1_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadSub32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB1_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: subu $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB1_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadSub32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB1_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: subu $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB1_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadSub32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB1_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: subu $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB1_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadSub32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB1_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: subu $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB1_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadSub32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB1_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: subu16 $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB1_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadSub32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB1_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: subu $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB1_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadSub32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB1_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: subu $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB1_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadSub32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB1_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: subu $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB1_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadSub32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB1_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: subu $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB1_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
+entry:
+ %0 = atomicrmw sub i32* @x, i32 %incr monotonic
+ ret i32 %0
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R3:[0-9]+]], 0($[[R0]])
-; ALL: addu $[[R4:[0-9]+]], $[[R3]], $4
-; ALL: sc $[[R4]], 0($[[R0]])
-; NOT-MICROMIPS: beqz $[[R4]], [[BB0]]
-; MICROMIPS: beqzc $[[R4]], [[BB0]]
-; MIPSR6: beqzc $[[R4]], [[BB0]]
}
-define i32 @AtomicLoadNand32(i32 signext %incr) nounwind {
+define i32 @AtomicLoadXor32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadXor32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB2_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: xor $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB2_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadXor32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB2_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: xor $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB2_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadXor32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB2_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: xor $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB2_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadXor32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB2_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: xor $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB2_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadXor32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB2_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: xor $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB2_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadXor32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB2_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: xor $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB2_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadXor32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB2_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: xor $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB2_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadXor32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB2_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: xor $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB2_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadXor32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB2_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: xor $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB2_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadXor32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadXor32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB2_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: xor $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB2_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadXor32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB2_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: xor $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB2_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadXor32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB2_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: xor $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB2_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadXor32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB2_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: xor $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB2_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadXor32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB2_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: xor $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB2_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadXor32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB2_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: xor $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB2_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
entry:
- %0 = atomicrmw nand i32* @x, i32 %incr monotonic
+ %0 = atomicrmw xor i32* @x, i32 %incr monotonic
ret i32 %0
+}
-; ALL-LABEL: AtomicLoadNand32:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(x)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(x)(
+define i32 @AtomicLoadOr32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadOr32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB3_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: or $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB3_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadOr32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB3_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: or $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB3_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadOr32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB3_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: or $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB3_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadOr32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB3_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: or $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB3_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadOr32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB3_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: or $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB3_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadOr32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB3_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: or $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB3_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadOr32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB3_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: or $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB3_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadOr32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB3_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: or $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB3_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadOr32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB3_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: or $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB3_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadOr32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadOr32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB3_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: or $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB3_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadOr32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB3_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: or $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB3_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadOr32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB3_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: or $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB3_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadOr32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB3_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: or $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB3_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadOr32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB3_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: or $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB3_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadOr32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB3_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: or $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB3_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
+entry:
+ %0 = atomicrmw or i32* @x, i32 %incr monotonic
+ ret i32 %0
+}
+define i32 @AtomicLoadAnd32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadAnd32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB4_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: and $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB4_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadAnd32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB4_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: and $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB4_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadAnd32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB4_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: and $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB4_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadAnd32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB4_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: and $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB4_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadAnd32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB4_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: and $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB4_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadAnd32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB4_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: and $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB4_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadAnd32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB4_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: and $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB4_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadAnd32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB4_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: and $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB4_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadAnd32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB4_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: and $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB4_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadAnd32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAnd32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB4_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: and $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB4_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadAnd32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB4_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: and $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB4_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadAnd32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB4_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: and $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB4_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadAnd32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB4_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: and $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB4_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadAnd32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB4_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: and $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB4_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadAnd32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB4_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: and $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB4_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
+entry:
+ %0 = atomicrmw and i32* @x, i32 %incr monotonic
+ ret i32 %0
+}
+define i32 @AtomicLoadNand32(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadNand32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB5_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: and $3, $2, $4
+; MIPS32-NEXT: nor $3, $zero, $3
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB5_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadNand32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB5_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: and $1, $25, $4
+; MIPS32O0-NEXT: nor $1, $zero, $1
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB5_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadNand32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB5_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: and $3, $2, $4
+; MIPS32R2-NEXT: nor $3, $zero, $3
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB5_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadNand32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB5_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: and $3, $2, $4
+; MIPS32R6-NEXT: nor $3, $zero, $3
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB5_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadNand32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB5_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: and $3, $1, $4
+; MIPS32R6O0-NEXT: nor $3, $zero, $3
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB5_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadNand32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB5_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: and $3, $2, $4
+; MIPS4-NEXT: nor $3, $zero, $3
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB5_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadNand32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB5_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: and $3, $2, $4
+; MIPS64-NEXT: nor $3, $zero, $3
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB5_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadNand32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB5_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: and $3, $2, $4
+; MIPS64R2-NEXT: nor $3, $zero, $3
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB5_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadNand32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB5_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: and $3, $2, $4
+; MIPS64R6-NEXT: nor $3, $zero, $3
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB5_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadNand32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB5_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: and $5, $3, $2
+; MIPS64R6O0-NEXT: nor $5, $zero, $5
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB5_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadNand32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB5_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: and $3, $2, $4
+; MM32-NEXT: nor $3, $zero, $3
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB5_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadNand32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB5_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: and $3, $2, $4
+; O1-NEXT: nor $3, $zero, $3
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB5_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadNand32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB5_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: and $3, $2, $4
+; O2-NEXT: nor $3, $zero, $3
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB5_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadNand32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB5_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: and $3, $2, $4
+; O3-NEXT: nor $3, $zero, $3
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB5_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadNand32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB5_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: and $3, $2, $4
+; MIPS32EB-NEXT: nor $3, $zero, $3
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB5_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
+entry:
+ %0 = atomicrmw nand i32* @x, i32 %incr monotonic
+ ret i32 %0
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R1:[0-9]+]], 0($[[R0]])
-; ALL: and $[[R3:[0-9]+]], $[[R1]], $4
-; ALL: nor $[[R2:[0-9]+]], $zero, $[[R3]]
-; ALL: sc $[[R2]], 0($[[R0]])
-; NOT-MICROMIPS: beqz $[[R2]], [[BB0]]
-; MICROMIPS: beqzc $[[R2]], [[BB0]]
-; MIPSR6: beqzc $[[R2]], [[BB0]]
}
define i32 @AtomicSwap32(i32 signext %newval) nounwind {
+; MIPS32-LABEL: AtomicSwap32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addiu $sp, $sp, -8
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: sw $4, 4($sp)
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB6_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: move $3, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB6_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32O0-LABEL: AtomicSwap32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: sw $4, 4($sp)
+; MIPS32O0-NEXT: lw $4, 4($sp)
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: $BB6_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: move $1, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB6_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicSwap32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addiu $sp, $sp, -8
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: sw $4, 4($sp)
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB6_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: move $3, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB6_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32R6-LABEL: AtomicSwap32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addiu $sp, $sp, -8
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: sw $4, 4($sp)
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB6_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: move $3, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB6_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32R6O0-LABEL: AtomicSwap32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: sw $4, 4($sp)
+; MIPS32R6O0-NEXT: lw $4, 4($sp)
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: $BB6_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: move $3, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB6_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicSwap32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: daddiu $sp, $sp, -16
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap32)))
+; MIPS4-NEXT: sw $4, 12($sp)
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB6_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: move $3, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB6_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64-LABEL: AtomicSwap32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: daddiu $sp, $sp, -16
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64-NEXT: sw $4, 12($sp)
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB6_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: move $3, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB6_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R2-LABEL: AtomicSwap32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: daddiu $sp, $sp, -16
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R2-NEXT: sw $4, 12($sp)
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB6_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: move $3, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB6_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R6-LABEL: AtomicSwap32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R6-NEXT: sw $4, 12($sp)
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB6_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: move $3, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB6_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R6O0-LABEL: AtomicSwap32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: sw $2, 12($sp)
+; MIPS64R6O0-NEXT: lw $2, 12($sp)
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: .LBB6_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: move $5, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB6_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicSwap32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addiu $sp, $sp, -8
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: sw $4, 4($sp)
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB6_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: move $3, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB6_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: addiusp 8
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicSwap32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addiu $sp, $sp, -8
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: sw $4, 4($sp)
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB6_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: move $3, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB6_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: addiu $sp, $sp, 8
+;
+; O2-LABEL: AtomicSwap32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addiu $sp, $sp, -8
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: sw $4, 4($sp)
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB6_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: move $3, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB6_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: addiu $sp, $sp, 8
+;
+; O3-LABEL: AtomicSwap32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addiu $sp, $sp, -8
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: sw $4, 4($sp)
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB6_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: move $3, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB6_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32EB-LABEL: AtomicSwap32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addiu $sp, $sp, -8
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: sw $4, 4($sp)
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB6_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: move $3, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB6_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: addiu $sp, $sp, 8
entry:
%newval.addr = alloca i32, align 4
store i32 %newval, i32* %newval.addr, align 4
%0 = atomicrmw xchg i32* @x, i32 %tmp monotonic
ret i32 %0
-; ALL-LABEL: AtomicSwap32:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(x)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(x)
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll ${{[0-9]+}}, 0($[[R0]])
-; ALL: sc $[[R2:[0-9]+]], 0($[[R0]])
-; NOT-MICROMIPS: beqz $[[R2]], [[BB0]]
-; MICROMIPS: beqzc $[[R2]], [[BB0]]
-; MIPSR6: beqzc $[[R2]], [[BB0]]
}
define i32 @AtomicCmpSwap32(i32 signext %oldval, i32 signext %newval) nounwind {
+; MIPS32-LABEL: AtomicCmpSwap32:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addiu $sp, $sp, -8
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: sw $5, 4($sp)
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: $BB7_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: bne $2, $4, $BB7_3
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32-NEXT: move $3, $5
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB7_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: $BB7_3: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32O0-LABEL: AtomicCmpSwap32:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -16
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: sw $5, 12($sp)
+; MIPS32O0-NEXT: lw $5, 12($sp)
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: lw $25, 8($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: move $1, $4
+; MIPS32O0-NEXT: $BB7_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $3, 0($2)
+; MIPS32O0-NEXT: bne $3, $1, $BB7_3
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32O0-NEXT: move $6, $5
+; MIPS32O0-NEXT: sc $6, 0($2)
+; MIPS32O0-NEXT: beqz $6, $BB7_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: $BB7_3: # %entry
+; MIPS32O0-NEXT: xor $1, $3, $4
+; MIPS32O0-NEXT: sltiu $1, $1, 1
+; MIPS32O0-NEXT: move $2, $3
+; MIPS32O0-NEXT: sw $3, 8($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $1, 0($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: addiu $sp, $sp, 16
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicCmpSwap32:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addiu $sp, $sp, -8
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: sw $5, 4($sp)
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: $BB7_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: bne $2, $4, $BB7_3
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32R2-NEXT: move $3, $5
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB7_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: $BB7_3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32R6-LABEL: AtomicCmpSwap32:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addiu $sp, $sp, -8
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: sw $5, 4($sp)
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: $BB7_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: bnec $2, $4, $BB7_3
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32R6-NEXT: move $3, $5
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB7_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: $BB7_3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32R6O0-LABEL: AtomicCmpSwap32:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -24
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $5
+; MIPS32R6O0-NEXT: move $1, $4
+; MIPS32R6O0-NEXT: sw $5, 20($sp)
+; MIPS32R6O0-NEXT: lw $5, 20($sp)
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: lw $3, 16($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: $BB7_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $6, 0($2)
+; MIPS32R6O0-NEXT: bnec $6, $4, $BB7_3
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32R6O0-NEXT: move $7, $5
+; MIPS32R6O0-NEXT: sc $7, 0($2)
+; MIPS32R6O0-NEXT: beqzc $7, $BB7_1
+; MIPS32R6O0-NEXT: $BB7_3: # %entry
+; MIPS32R6O0-NEXT: move $2, $6
+; MIPS32R6O0-NEXT: sw $6, 16($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $1, 12($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $3, 8($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 24
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicCmpSwap32:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: daddiu $sp, $sp, -16
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS4-NEXT: sw $5, 12($sp)
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: .LBB7_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: bne $2, $4, .LBB7_3
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS4-NEXT: move $3, $5
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB7_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: .LBB7_3: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64-LABEL: AtomicCmpSwap32:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: daddiu $sp, $sp, -16
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64-NEXT: sw $5, 12($sp)
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: .LBB7_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: bne $2, $4, .LBB7_3
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS64-NEXT: move $3, $5
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB7_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: .LBB7_3: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R2-LABEL: AtomicCmpSwap32:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: daddiu $sp, $sp, -16
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R2-NEXT: sw $5, 12($sp)
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: .LBB7_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: bne $2, $4, .LBB7_3
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS64R2-NEXT: move $3, $5
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB7_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: .LBB7_3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R6-LABEL: AtomicCmpSwap32:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R6-NEXT: sw $5, 12($sp)
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: .LBB7_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: bnec $2, $4, .LBB7_3
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS64R6-NEXT: move $3, $5
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB7_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: .LBB7_3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: daddiu $sp, $sp, 16
+;
+; MIPS64R6O0-LABEL: AtomicCmpSwap32:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap32)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: move $3, $5
+; MIPS64R6O0-NEXT: sw $3, 12($sp)
+; MIPS64R6O0-NEXT: lw $3, 12($sp)
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: lw $6, 8($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: .LBB7_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $7, 0($1)
+; MIPS64R6O0-NEXT: bnec $7, $2, .LBB7_3
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS64R6O0-NEXT: move $8, $3
+; MIPS64R6O0-NEXT: sc $8, 0($1)
+; MIPS64R6O0-NEXT: beqzc $8, .LBB7_1
+; MIPS64R6O0-NEXT: .LBB7_3: # %entry
+; MIPS64R6O0-NEXT: move $2, $7
+; MIPS64R6O0-NEXT: sw $7, 8($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: sw $6, 4($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicCmpSwap32:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addiu $sp, $sp, -8
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: sw $5, 4($sp)
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: $BB7_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: bne $2, $4, $BB7_3
+; MM32-NEXT: nop
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MM32-NEXT: move $3, $5
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB7_1
+; MM32-NEXT: $BB7_3: # %entry
+; MM32-NEXT: addiusp 8
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicCmpSwap32:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addiu $sp, $sp, -8
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: sw $5, 4($sp)
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: $BB7_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: bne $2, $4, $BB7_3
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: # in Loop: Header=BB7_1 Depth=1
+; O1-NEXT: move $3, $5
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB7_1
+; O1-NEXT: nop
+; O1-NEXT: $BB7_3: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: addiu $sp, $sp, 8
+;
+; O2-LABEL: AtomicCmpSwap32:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addiu $sp, $sp, -8
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: sw $5, 4($sp)
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: $BB7_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: bne $2, $4, $BB7_3
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: # in Loop: Header=BB7_1 Depth=1
+; O2-NEXT: move $3, $5
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB7_1
+; O2-NEXT: nop
+; O2-NEXT: $BB7_3: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: addiu $sp, $sp, 8
+;
+; O3-LABEL: AtomicCmpSwap32:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addiu $sp, $sp, -8
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: sw $5, 4($sp)
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: $BB7_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: bne $2, $4, $BB7_3
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: # in Loop: Header=BB7_1 Depth=1
+; O3-NEXT: move $3, $5
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB7_1
+; O3-NEXT: nop
+; O3-NEXT: $BB7_3: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: addiu $sp, $sp, 8
+;
+; MIPS32EB-LABEL: AtomicCmpSwap32:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addiu $sp, $sp, -8
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: sw $5, 4($sp)
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: $BB7_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: bne $2, $4, $BB7_3
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: # in Loop: Header=BB7_1 Depth=1
+; MIPS32EB-NEXT: move $3, $5
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB7_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: $BB7_3: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: addiu $sp, $sp, 8
entry:
%newval.addr = alloca i32, align 4
store i32 %newval, i32* %newval.addr, align 4
%1 = extractvalue { i32, i1 } %0, 0
ret i32 %1
-; ALL-LABEL: AtomicCmpSwap32:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(x)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(x)(
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $2, 0($[[R0]])
-; NOT-MICROMIPS: bne $2, $4, [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MICROMIPS: bne $2, $4, [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MIPSR6: bnec $2, $4, [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; ALL: sc $[[R2:[0-9]+]], 0($[[R0]])
-; NOT-MICROMIPS: beqz $[[R2]], [[BB0]]
-; MICROMIPS: beqzc $[[R2]], [[BB0]]
-; MIPSR6: beqzc $[[R2]], [[BB0]]
-; ALL: [[BB1]]:
}
-
-
@y = common global i8 0, align 1
define signext i8 @AtomicLoadAdd8(i8 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadAdd8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(y)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: sllv $4, $4, $3
+; MIPS32-NEXT: $BB8_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $7, 0($2)
+; MIPS32-NEXT: addu $8, $7, $4
+; MIPS32-NEXT: and $8, $8, $5
+; MIPS32-NEXT: and $9, $7, $6
+; MIPS32-NEXT: or $9, $9, $8
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB8_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: and $1, $7, $5
+; MIPS32-NEXT: srlv $1, $1, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.3: # %entry
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 24
+;
+; MIPS32O0-LABEL: AtomicLoadAdd8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(y)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 255
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: $BB8_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $6, 0($25)
+; MIPS32O0-NEXT: addu $7, $6, $4
+; MIPS32O0-NEXT: and $7, $7, $1
+; MIPS32O0-NEXT: and $8, $6, $3
+; MIPS32O0-NEXT: or $8, $8, $7
+; MIPS32O0-NEXT: sc $8, 0($25)
+; MIPS32O0-NEXT: beqz $8, $BB8_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: and $5, $6, $1
+; MIPS32O0-NEXT: srlv $5, $5, $2
+; MIPS32O0-NEXT: sll $5, $5, 24
+; MIPS32O0-NEXT: sra $5, $5, 24
+; MIPS32O0-NEXT: # %bb.3: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadAdd8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(y)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $2, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 255
+; MIPS32R2-NEXT: sllv $5, $1, $3
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: sllv $4, $4, $3
+; MIPS32R2-NEXT: $BB8_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $7, 0($2)
+; MIPS32R2-NEXT: addu $8, $7, $4
+; MIPS32R2-NEXT: and $8, $8, $5
+; MIPS32R2-NEXT: and $9, $7, $6
+; MIPS32R2-NEXT: or $9, $9, $8
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB8_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: and $1, $7, $5
+; MIPS32R2-NEXT: srlv $1, $1, $3
+; MIPS32R2-NEXT: seb $1, $1
+; MIPS32R2-NEXT: # %bb.3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: seb $2, $1
+;
+; MIPS32R6-LABEL: AtomicLoadAdd8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(y)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $2, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 255
+; MIPS32R6-NEXT: sllv $5, $1, $3
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: sllv $4, $4, $3
+; MIPS32R6-NEXT: $BB8_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $7, 0($2)
+; MIPS32R6-NEXT: addu $8, $7, $4
+; MIPS32R6-NEXT: and $8, $8, $5
+; MIPS32R6-NEXT: and $9, $7, $6
+; MIPS32R6-NEXT: or $9, $9, $8
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB8_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: and $1, $7, $5
+; MIPS32R6-NEXT: srlv $1, $1, $3
+; MIPS32R6-NEXT: seb $1, $1
+; MIPS32R6-NEXT: # %bb.3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: seb $2, $1
+;
+; MIPS32R6O0-LABEL: AtomicLoadAdd8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(y)($2)
+; MIPS32R6O0-NEXT: addiu $1, $zero, -4
+; MIPS32R6O0-NEXT: and $1, $2, $1
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $3, $zero, 255
+; MIPS32R6O0-NEXT: sllv $3, $3, $2
+; MIPS32R6O0-NEXT: nor $5, $zero, $3
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: $BB8_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $7, 0($1)
+; MIPS32R6O0-NEXT: addu $8, $7, $4
+; MIPS32R6O0-NEXT: and $8, $8, $3
+; MIPS32R6O0-NEXT: and $9, $7, $5
+; MIPS32R6O0-NEXT: or $9, $9, $8
+; MIPS32R6O0-NEXT: sc $9, 0($1)
+; MIPS32R6O0-NEXT: beqzc $9, $BB8_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: and $6, $7, $3
+; MIPS32R6O0-NEXT: srlv $6, $6, $2
+; MIPS32R6O0-NEXT: seb $6, $6
+; MIPS32R6O0-NEXT: # %bb.3: # %entry
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $6, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: lw $1, 0($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seb $2, $1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadAdd8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS4-NEXT: ld $1, %got_disp(y)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: sllv $4, $4, $3
+; MIPS4-NEXT: .LBB8_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $7, 0($2)
+; MIPS4-NEXT: addu $8, $7, $4
+; MIPS4-NEXT: and $8, $8, $5
+; MIPS4-NEXT: and $9, $7, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB8_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: and $1, $7, $5
+; MIPS4-NEXT: srlv $1, $1, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.3: # %entry
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 24
+;
+; MIPS64-LABEL: AtomicLoadAdd8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: sllv $4, $4, $3
+; MIPS64-NEXT: .LBB8_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $7, 0($2)
+; MIPS64-NEXT: addu $8, $7, $4
+; MIPS64-NEXT: and $8, $8, $5
+; MIPS64-NEXT: and $9, $7, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB8_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: and $1, $7, $5
+; MIPS64-NEXT: srlv $1, $1, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.3: # %entry
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 24
+;
+; MIPS64R2-LABEL: AtomicLoadAdd8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R2-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $2, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 255
+; MIPS64R2-NEXT: sllv $5, $1, $3
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: sllv $4, $4, $3
+; MIPS64R2-NEXT: .LBB8_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $7, 0($2)
+; MIPS64R2-NEXT: addu $8, $7, $4
+; MIPS64R2-NEXT: and $8, $8, $5
+; MIPS64R2-NEXT: and $9, $7, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB8_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: and $1, $7, $5
+; MIPS64R2-NEXT: srlv $1, $1, $3
+; MIPS64R2-NEXT: seb $1, $1
+; MIPS64R2-NEXT: # %bb.3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: seb $2, $1
+;
+; MIPS64R6-LABEL: AtomicLoadAdd8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R6-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $2, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 255
+; MIPS64R6-NEXT: sllv $5, $1, $3
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: sllv $4, $4, $3
+; MIPS64R6-NEXT: .LBB8_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $7, 0($2)
+; MIPS64R6-NEXT: addu $8, $7, $4
+; MIPS64R6-NEXT: and $8, $8, $5
+; MIPS64R6-NEXT: and $9, $7, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB8_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: and $1, $7, $5
+; MIPS64R6-NEXT: srlv $1, $1, $3
+; MIPS64R6-NEXT: seb $1, $1
+; MIPS64R6-NEXT: # %bb.3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: seb $2, $1
+;
+; MIPS64R6O0-LABEL: AtomicLoadAdd8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd8)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $3, $1, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 3
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $5, $zero, 255
+; MIPS64R6O0-NEXT: sllv $5, $5, $3
+; MIPS64R6O0-NEXT: nor $6, $zero, $5
+; MIPS64R6O0-NEXT: sllv $2, $2, $3
+; MIPS64R6O0-NEXT: .LBB8_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $8, 0($4)
+; MIPS64R6O0-NEXT: addu $9, $8, $2
+; MIPS64R6O0-NEXT: and $9, $9, $5
+; MIPS64R6O0-NEXT: and $10, $8, $6
+; MIPS64R6O0-NEXT: or $10, $10, $9
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB8_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: and $7, $8, $5
+; MIPS64R6O0-NEXT: srlv $7, $7, $3
+; MIPS64R6O0-NEXT: seb $7, $7
+; MIPS64R6O0-NEXT: # %bb.3: # %entry
+; MIPS64R6O0-NEXT: sw $7, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seb $2, $1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadAdd8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(y)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $2, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 255
+; MM32-NEXT: sllv $5, $1, $3
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: sllv $4, $4, $3
+; MM32-NEXT: $BB8_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $7, 0($2)
+; MM32-NEXT: addu $8, $7, $4
+; MM32-NEXT: and $8, $8, $5
+; MM32-NEXT: and $9, $7, $6
+; MM32-NEXT: or $9, $9, $8
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB8_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: and $1, $7, $5
+; MM32-NEXT: srlv $1, $1, $3
+; MM32-NEXT: seb $1, $1
+; MM32-NEXT: # %bb.3: # %entry
+; MM32-NEXT: jr $ra
+; MM32-NEXT: seb $2, $1
+;
+; O1-LABEL: AtomicLoadAdd8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(y)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: sllv $4, $4, $3
+; O1-NEXT: $BB8_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $7, 0($2)
+; O1-NEXT: addu $8, $7, $4
+; O1-NEXT: and $8, $8, $5
+; O1-NEXT: and $9, $7, $6
+; O1-NEXT: or $9, $9, $8
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB8_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: and $1, $7, $5
+; O1-NEXT: srlv $1, $1, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.3: # %entry
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 24
+;
+; O2-LABEL: AtomicLoadAdd8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(y)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: sllv $4, $4, $3
+; O2-NEXT: $BB8_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $7, 0($2)
+; O2-NEXT: addu $8, $7, $4
+; O2-NEXT: and $8, $8, $5
+; O2-NEXT: and $9, $7, $6
+; O2-NEXT: or $9, $9, $8
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB8_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: and $1, $7, $5
+; O2-NEXT: srlv $1, $1, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.3: # %entry
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 24
+;
+; O3-LABEL: AtomicLoadAdd8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(y)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: sllv $4, $4, $3
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: $BB8_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $7, 0($2)
+; O3-NEXT: addu $8, $7, $4
+; O3-NEXT: and $8, $8, $5
+; O3-NEXT: and $9, $7, $6
+; O3-NEXT: or $9, $9, $8
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB8_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: and $1, $7, $5
+; O3-NEXT: srlv $1, $1, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.3: # %entry
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 24
+;
+; MIPS32EB-LABEL: AtomicLoadAdd8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(y)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: sllv $4, $4, $3
+; MIPS32EB-NEXT: $BB8_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $7, 0($2)
+; MIPS32EB-NEXT: addu $8, $7, $4
+; MIPS32EB-NEXT: and $8, $8, $5
+; MIPS32EB-NEXT: and $9, $7, $6
+; MIPS32EB-NEXT: or $9, $9, $8
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB8_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: and $1, $7, $5
+; MIPS32EB-NEXT: srlv $1, $1, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.3: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 24
entry:
%0 = atomicrmw add i8* @y, i8 %incr monotonic
ret i8 %0
-
-; ALL-LABEL: AtomicLoadAdd8:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(y)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(y)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: sllv $[[R9:[0-9]+]], $4, $[[R5]]
-
-; O0: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; O0: ld $[[R10:[0-9]+]]
-; O0-NEXT: ll $[[R11:[0-9]+]], 0($[[R10]])
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R12:[0-9]+]], 0($[[R2]])
-; ALL: addu $[[R13:[0-9]+]], $[[R12]], $[[R9]]
-; ALL: and $[[R14:[0-9]+]], $[[R13]], $[[R7]]
-; ALL: and $[[R15:[0-9]+]], $[[R12]], $[[R8]]
-; ALL: or $[[R16:[0-9]+]], $[[R15]], $[[R14]]
-; ALL: sc $[[R16]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R16]], [[BB0]]
-; MICROMIPS: beqzc $[[R16]], [[BB0]]
-; MIPSR6: beqzc $[[R16]], [[BB0]]
-
-; ALL: and $[[R17:[0-9]+]], $[[R12]], $[[R7]]
-; ALL: srlv $[[R18:[0-9]+]], $[[R17]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R19:[0-9]+]], $[[R18]], 24
-; NO-SEB-SEH: sra $2, $[[R19]], 24
-
-; HAS-SEB-SEH: seb $2, $[[R18]]
}
define signext i8 @AtomicLoadSub8(i8 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadSub8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(y)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: sllv $4, $4, $3
+; MIPS32-NEXT: $BB9_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $7, 0($2)
+; MIPS32-NEXT: subu $8, $7, $4
+; MIPS32-NEXT: and $8, $8, $5
+; MIPS32-NEXT: and $9, $7, $6
+; MIPS32-NEXT: or $9, $9, $8
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB9_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: and $1, $7, $5
+; MIPS32-NEXT: srlv $1, $1, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.3: # %entry
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 24
+;
+; MIPS32O0-LABEL: AtomicLoadSub8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(y)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 255
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: $BB9_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $6, 0($25)
+; MIPS32O0-NEXT: subu $7, $6, $4
+; MIPS32O0-NEXT: and $7, $7, $1
+; MIPS32O0-NEXT: and $8, $6, $3
+; MIPS32O0-NEXT: or $8, $8, $7
+; MIPS32O0-NEXT: sc $8, 0($25)
+; MIPS32O0-NEXT: beqz $8, $BB9_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: and $5, $6, $1
+; MIPS32O0-NEXT: srlv $5, $5, $2
+; MIPS32O0-NEXT: sll $5, $5, 24
+; MIPS32O0-NEXT: sra $5, $5, 24
+; MIPS32O0-NEXT: # %bb.3: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadSub8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(y)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $2, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 255
+; MIPS32R2-NEXT: sllv $5, $1, $3
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: sllv $4, $4, $3
+; MIPS32R2-NEXT: $BB9_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $7, 0($2)
+; MIPS32R2-NEXT: subu $8, $7, $4
+; MIPS32R2-NEXT: and $8, $8, $5
+; MIPS32R2-NEXT: and $9, $7, $6
+; MIPS32R2-NEXT: or $9, $9, $8
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB9_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: and $1, $7, $5
+; MIPS32R2-NEXT: srlv $1, $1, $3
+; MIPS32R2-NEXT: seb $1, $1
+; MIPS32R2-NEXT: # %bb.3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: seb $2, $1
+;
+; MIPS32R6-LABEL: AtomicLoadSub8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(y)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $2, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 255
+; MIPS32R6-NEXT: sllv $5, $1, $3
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: sllv $4, $4, $3
+; MIPS32R6-NEXT: $BB9_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $7, 0($2)
+; MIPS32R6-NEXT: subu $8, $7, $4
+; MIPS32R6-NEXT: and $8, $8, $5
+; MIPS32R6-NEXT: and $9, $7, $6
+; MIPS32R6-NEXT: or $9, $9, $8
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB9_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: and $1, $7, $5
+; MIPS32R6-NEXT: srlv $1, $1, $3
+; MIPS32R6-NEXT: seb $1, $1
+; MIPS32R6-NEXT: # %bb.3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: seb $2, $1
+;
+; MIPS32R6O0-LABEL: AtomicLoadSub8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(y)($2)
+; MIPS32R6O0-NEXT: addiu $1, $zero, -4
+; MIPS32R6O0-NEXT: and $1, $2, $1
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $3, $zero, 255
+; MIPS32R6O0-NEXT: sllv $3, $3, $2
+; MIPS32R6O0-NEXT: nor $5, $zero, $3
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: $BB9_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $7, 0($1)
+; MIPS32R6O0-NEXT: subu $8, $7, $4
+; MIPS32R6O0-NEXT: and $8, $8, $3
+; MIPS32R6O0-NEXT: and $9, $7, $5
+; MIPS32R6O0-NEXT: or $9, $9, $8
+; MIPS32R6O0-NEXT: sc $9, 0($1)
+; MIPS32R6O0-NEXT: beqzc $9, $BB9_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: and $6, $7, $3
+; MIPS32R6O0-NEXT: srlv $6, $6, $2
+; MIPS32R6O0-NEXT: seb $6, $6
+; MIPS32R6O0-NEXT: # %bb.3: # %entry
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $6, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: lw $1, 0($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seb $2, $1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadSub8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS4-NEXT: ld $1, %got_disp(y)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: sllv $4, $4, $3
+; MIPS4-NEXT: .LBB9_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $7, 0($2)
+; MIPS4-NEXT: subu $8, $7, $4
+; MIPS4-NEXT: and $8, $8, $5
+; MIPS4-NEXT: and $9, $7, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB9_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: and $1, $7, $5
+; MIPS4-NEXT: srlv $1, $1, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.3: # %entry
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 24
+;
+; MIPS64-LABEL: AtomicLoadSub8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: sllv $4, $4, $3
+; MIPS64-NEXT: .LBB9_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $7, 0($2)
+; MIPS64-NEXT: subu $8, $7, $4
+; MIPS64-NEXT: and $8, $8, $5
+; MIPS64-NEXT: and $9, $7, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB9_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: and $1, $7, $5
+; MIPS64-NEXT: srlv $1, $1, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.3: # %entry
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 24
+;
+; MIPS64R2-LABEL: AtomicLoadSub8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R2-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $2, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 255
+; MIPS64R2-NEXT: sllv $5, $1, $3
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: sllv $4, $4, $3
+; MIPS64R2-NEXT: .LBB9_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $7, 0($2)
+; MIPS64R2-NEXT: subu $8, $7, $4
+; MIPS64R2-NEXT: and $8, $8, $5
+; MIPS64R2-NEXT: and $9, $7, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB9_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: and $1, $7, $5
+; MIPS64R2-NEXT: srlv $1, $1, $3
+; MIPS64R2-NEXT: seb $1, $1
+; MIPS64R2-NEXT: # %bb.3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: seb $2, $1
+;
+; MIPS64R6-LABEL: AtomicLoadSub8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R6-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $2, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 255
+; MIPS64R6-NEXT: sllv $5, $1, $3
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: sllv $4, $4, $3
+; MIPS64R6-NEXT: .LBB9_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $7, 0($2)
+; MIPS64R6-NEXT: subu $8, $7, $4
+; MIPS64R6-NEXT: and $8, $8, $5
+; MIPS64R6-NEXT: and $9, $7, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB9_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: and $1, $7, $5
+; MIPS64R6-NEXT: srlv $1, $1, $3
+; MIPS64R6-NEXT: seb $1, $1
+; MIPS64R6-NEXT: # %bb.3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: seb $2, $1
+;
+; MIPS64R6O0-LABEL: AtomicLoadSub8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadSub8)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $3, $1, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 3
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $5, $zero, 255
+; MIPS64R6O0-NEXT: sllv $5, $5, $3
+; MIPS64R6O0-NEXT: nor $6, $zero, $5
+; MIPS64R6O0-NEXT: sllv $2, $2, $3
+; MIPS64R6O0-NEXT: .LBB9_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $8, 0($4)
+; MIPS64R6O0-NEXT: subu $9, $8, $2
+; MIPS64R6O0-NEXT: and $9, $9, $5
+; MIPS64R6O0-NEXT: and $10, $8, $6
+; MIPS64R6O0-NEXT: or $10, $10, $9
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB9_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: and $7, $8, $5
+; MIPS64R6O0-NEXT: srlv $7, $7, $3
+; MIPS64R6O0-NEXT: seb $7, $7
+; MIPS64R6O0-NEXT: # %bb.3: # %entry
+; MIPS64R6O0-NEXT: sw $7, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seb $2, $1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadSub8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(y)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $2, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 255
+; MM32-NEXT: sllv $5, $1, $3
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: sllv $4, $4, $3
+; MM32-NEXT: $BB9_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $7, 0($2)
+; MM32-NEXT: subu $8, $7, $4
+; MM32-NEXT: and $8, $8, $5
+; MM32-NEXT: and $9, $7, $6
+; MM32-NEXT: or $9, $9, $8
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB9_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: and $1, $7, $5
+; MM32-NEXT: srlv $1, $1, $3
+; MM32-NEXT: seb $1, $1
+; MM32-NEXT: # %bb.3: # %entry
+; MM32-NEXT: jr $ra
+; MM32-NEXT: seb $2, $1
+;
+; O1-LABEL: AtomicLoadSub8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(y)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: sllv $4, $4, $3
+; O1-NEXT: $BB9_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $7, 0($2)
+; O1-NEXT: subu $8, $7, $4
+; O1-NEXT: and $8, $8, $5
+; O1-NEXT: and $9, $7, $6
+; O1-NEXT: or $9, $9, $8
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB9_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: and $1, $7, $5
+; O1-NEXT: srlv $1, $1, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.3: # %entry
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 24
+;
+; O2-LABEL: AtomicLoadSub8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(y)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: sllv $4, $4, $3
+; O2-NEXT: $BB9_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $7, 0($2)
+; O2-NEXT: subu $8, $7, $4
+; O2-NEXT: and $8, $8, $5
+; O2-NEXT: and $9, $7, $6
+; O2-NEXT: or $9, $9, $8
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB9_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: and $1, $7, $5
+; O2-NEXT: srlv $1, $1, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.3: # %entry
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 24
+;
+; O3-LABEL: AtomicLoadSub8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(y)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: sllv $4, $4, $3
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: $BB9_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $7, 0($2)
+; O3-NEXT: subu $8, $7, $4
+; O3-NEXT: and $8, $8, $5
+; O3-NEXT: and $9, $7, $6
+; O3-NEXT: or $9, $9, $8
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB9_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: and $1, $7, $5
+; O3-NEXT: srlv $1, $1, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.3: # %entry
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 24
+;
+; MIPS32EB-LABEL: AtomicLoadSub8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(y)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: sllv $4, $4, $3
+; MIPS32EB-NEXT: $BB9_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $7, 0($2)
+; MIPS32EB-NEXT: subu $8, $7, $4
+; MIPS32EB-NEXT: and $8, $8, $5
+; MIPS32EB-NEXT: and $9, $7, $6
+; MIPS32EB-NEXT: or $9, $9, $8
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB9_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: and $1, $7, $5
+; MIPS32EB-NEXT: srlv $1, $1, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.3: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 24
entry:
%0 = atomicrmw sub i8* @y, i8 %incr monotonic
ret i8 %0
-; ALL-LABEL: AtomicLoadSub8:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(y)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(y)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: sllv $[[R9:[0-9]+]], $4, $[[R5]]
-
-; O0: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; O0: ld $[[R10:[0-9]+]]
-; O0-NEXT: ll $[[R11:[0-9]+]], 0($[[R10]])
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R12:[0-9]+]], 0($[[R2]])
-; ALL: subu $[[R13:[0-9]+]], $[[R12]], $[[R9]]
-; ALL: and $[[R14:[0-9]+]], $[[R13]], $[[R7]]
-; ALL: and $[[R15:[0-9]+]], $[[R12]], $[[R8]]
-; ALL: or $[[R16:[0-9]+]], $[[R15]], $[[R14]]
-; ALL: sc $[[R16]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R16]], [[BB0]]
-; MICROMIPS: beqzc $[[R16]], [[BB0]]
-; MIPSR6: beqzc $[[R16]], [[BB0]]
-
-; ALL: and $[[R17:[0-9]+]], $[[R12]], $[[R7]]
-; ALL: srlv $[[R18:[0-9]+]], $[[R17]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R19:[0-9]+]], $[[R18]], 24
-; NO-SEB-SEH: sra $2, $[[R19]], 24
-
-; HAS-SEB-SEH:seb $2, $[[R18]]
}
define signext i8 @AtomicLoadNand8(i8 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadNand8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(y)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: sllv $4, $4, $3
+; MIPS32-NEXT: $BB10_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $7, 0($2)
+; MIPS32-NEXT: and $8, $7, $4
+; MIPS32-NEXT: nor $8, $zero, $8
+; MIPS32-NEXT: and $8, $8, $5
+; MIPS32-NEXT: and $9, $7, $6
+; MIPS32-NEXT: or $9, $9, $8
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB10_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: and $1, $7, $5
+; MIPS32-NEXT: srlv $1, $1, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.3: # %entry
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 24
+;
+; MIPS32O0-LABEL: AtomicLoadNand8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(y)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 255
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: $BB10_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $6, 0($25)
+; MIPS32O0-NEXT: and $7, $6, $4
+; MIPS32O0-NEXT: nor $7, $zero, $7
+; MIPS32O0-NEXT: and $7, $7, $1
+; MIPS32O0-NEXT: and $8, $6, $3
+; MIPS32O0-NEXT: or $8, $8, $7
+; MIPS32O0-NEXT: sc $8, 0($25)
+; MIPS32O0-NEXT: beqz $8, $BB10_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: and $5, $6, $1
+; MIPS32O0-NEXT: srlv $5, $5, $2
+; MIPS32O0-NEXT: sll $5, $5, 24
+; MIPS32O0-NEXT: sra $5, $5, 24
+; MIPS32O0-NEXT: # %bb.3: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadNand8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(y)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $2, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 255
+; MIPS32R2-NEXT: sllv $5, $1, $3
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: sllv $4, $4, $3
+; MIPS32R2-NEXT: $BB10_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $7, 0($2)
+; MIPS32R2-NEXT: and $8, $7, $4
+; MIPS32R2-NEXT: nor $8, $zero, $8
+; MIPS32R2-NEXT: and $8, $8, $5
+; MIPS32R2-NEXT: and $9, $7, $6
+; MIPS32R2-NEXT: or $9, $9, $8
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB10_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: and $1, $7, $5
+; MIPS32R2-NEXT: srlv $1, $1, $3
+; MIPS32R2-NEXT: seb $1, $1
+; MIPS32R2-NEXT: # %bb.3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: seb $2, $1
+;
+; MIPS32R6-LABEL: AtomicLoadNand8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(y)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $2, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 255
+; MIPS32R6-NEXT: sllv $5, $1, $3
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: sllv $4, $4, $3
+; MIPS32R6-NEXT: $BB10_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $7, 0($2)
+; MIPS32R6-NEXT: and $8, $7, $4
+; MIPS32R6-NEXT: nor $8, $zero, $8
+; MIPS32R6-NEXT: and $8, $8, $5
+; MIPS32R6-NEXT: and $9, $7, $6
+; MIPS32R6-NEXT: or $9, $9, $8
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB10_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: and $1, $7, $5
+; MIPS32R6-NEXT: srlv $1, $1, $3
+; MIPS32R6-NEXT: seb $1, $1
+; MIPS32R6-NEXT: # %bb.3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: seb $2, $1
+;
+; MIPS32R6O0-LABEL: AtomicLoadNand8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(y)($2)
+; MIPS32R6O0-NEXT: addiu $1, $zero, -4
+; MIPS32R6O0-NEXT: and $1, $2, $1
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $3, $zero, 255
+; MIPS32R6O0-NEXT: sllv $3, $3, $2
+; MIPS32R6O0-NEXT: nor $5, $zero, $3
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: $BB10_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $7, 0($1)
+; MIPS32R6O0-NEXT: and $8, $7, $4
+; MIPS32R6O0-NEXT: nor $8, $zero, $8
+; MIPS32R6O0-NEXT: and $8, $8, $3
+; MIPS32R6O0-NEXT: and $9, $7, $5
+; MIPS32R6O0-NEXT: or $9, $9, $8
+; MIPS32R6O0-NEXT: sc $9, 0($1)
+; MIPS32R6O0-NEXT: beqzc $9, $BB10_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: and $6, $7, $3
+; MIPS32R6O0-NEXT: srlv $6, $6, $2
+; MIPS32R6O0-NEXT: seb $6, $6
+; MIPS32R6O0-NEXT: # %bb.3: # %entry
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $6, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: lw $1, 0($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seb $2, $1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadNand8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS4-NEXT: ld $1, %got_disp(y)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: sllv $4, $4, $3
+; MIPS4-NEXT: .LBB10_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $7, 0($2)
+; MIPS4-NEXT: and $8, $7, $4
+; MIPS4-NEXT: nor $8, $zero, $8
+; MIPS4-NEXT: and $8, $8, $5
+; MIPS4-NEXT: and $9, $7, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB10_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: and $1, $7, $5
+; MIPS4-NEXT: srlv $1, $1, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.3: # %entry
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 24
+;
+; MIPS64-LABEL: AtomicLoadNand8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: sllv $4, $4, $3
+; MIPS64-NEXT: .LBB10_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $7, 0($2)
+; MIPS64-NEXT: and $8, $7, $4
+; MIPS64-NEXT: nor $8, $zero, $8
+; MIPS64-NEXT: and $8, $8, $5
+; MIPS64-NEXT: and $9, $7, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB10_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: and $1, $7, $5
+; MIPS64-NEXT: srlv $1, $1, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.3: # %entry
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 24
+;
+; MIPS64R2-LABEL: AtomicLoadNand8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R2-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $2, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 255
+; MIPS64R2-NEXT: sllv $5, $1, $3
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: sllv $4, $4, $3
+; MIPS64R2-NEXT: .LBB10_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $7, 0($2)
+; MIPS64R2-NEXT: and $8, $7, $4
+; MIPS64R2-NEXT: nor $8, $zero, $8
+; MIPS64R2-NEXT: and $8, $8, $5
+; MIPS64R2-NEXT: and $9, $7, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB10_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: and $1, $7, $5
+; MIPS64R2-NEXT: srlv $1, $1, $3
+; MIPS64R2-NEXT: seb $1, $1
+; MIPS64R2-NEXT: # %bb.3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: seb $2, $1
+;
+; MIPS64R6-LABEL: AtomicLoadNand8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R6-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $2, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 255
+; MIPS64R6-NEXT: sllv $5, $1, $3
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: sllv $4, $4, $3
+; MIPS64R6-NEXT: .LBB10_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $7, 0($2)
+; MIPS64R6-NEXT: and $8, $7, $4
+; MIPS64R6-NEXT: nor $8, $zero, $8
+; MIPS64R6-NEXT: and $8, $8, $5
+; MIPS64R6-NEXT: and $9, $7, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB10_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: and $1, $7, $5
+; MIPS64R6-NEXT: srlv $1, $1, $3
+; MIPS64R6-NEXT: seb $1, $1
+; MIPS64R6-NEXT: # %bb.3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: seb $2, $1
+;
+; MIPS64R6O0-LABEL: AtomicLoadNand8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadNand8)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $3, $1, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 3
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $5, $zero, 255
+; MIPS64R6O0-NEXT: sllv $5, $5, $3
+; MIPS64R6O0-NEXT: nor $6, $zero, $5
+; MIPS64R6O0-NEXT: sllv $2, $2, $3
+; MIPS64R6O0-NEXT: .LBB10_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $8, 0($4)
+; MIPS64R6O0-NEXT: and $9, $8, $2
+; MIPS64R6O0-NEXT: nor $9, $zero, $9
+; MIPS64R6O0-NEXT: and $9, $9, $5
+; MIPS64R6O0-NEXT: and $10, $8, $6
+; MIPS64R6O0-NEXT: or $10, $10, $9
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB10_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: and $7, $8, $5
+; MIPS64R6O0-NEXT: srlv $7, $7, $3
+; MIPS64R6O0-NEXT: seb $7, $7
+; MIPS64R6O0-NEXT: # %bb.3: # %entry
+; MIPS64R6O0-NEXT: sw $7, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seb $2, $1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadNand8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(y)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $2, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 255
+; MM32-NEXT: sllv $5, $1, $3
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: sllv $4, $4, $3
+; MM32-NEXT: $BB10_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $7, 0($2)
+; MM32-NEXT: and $8, $7, $4
+; MM32-NEXT: nor $8, $zero, $8
+; MM32-NEXT: and $8, $8, $5
+; MM32-NEXT: and $9, $7, $6
+; MM32-NEXT: or $9, $9, $8
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB10_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: and $1, $7, $5
+; MM32-NEXT: srlv $1, $1, $3
+; MM32-NEXT: seb $1, $1
+; MM32-NEXT: # %bb.3: # %entry
+; MM32-NEXT: jr $ra
+; MM32-NEXT: seb $2, $1
+;
+; O1-LABEL: AtomicLoadNand8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(y)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: sllv $4, $4, $3
+; O1-NEXT: $BB10_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $7, 0($2)
+; O1-NEXT: and $8, $7, $4
+; O1-NEXT: nor $8, $zero, $8
+; O1-NEXT: and $8, $8, $5
+; O1-NEXT: and $9, $7, $6
+; O1-NEXT: or $9, $9, $8
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB10_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: and $1, $7, $5
+; O1-NEXT: srlv $1, $1, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.3: # %entry
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 24
+;
+; O2-LABEL: AtomicLoadNand8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(y)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: sllv $4, $4, $3
+; O2-NEXT: $BB10_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $7, 0($2)
+; O2-NEXT: and $8, $7, $4
+; O2-NEXT: nor $8, $zero, $8
+; O2-NEXT: and $8, $8, $5
+; O2-NEXT: and $9, $7, $6
+; O2-NEXT: or $9, $9, $8
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB10_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: and $1, $7, $5
+; O2-NEXT: srlv $1, $1, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.3: # %entry
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 24
+;
+; O3-LABEL: AtomicLoadNand8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(y)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: sllv $4, $4, $3
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: $BB10_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $7, 0($2)
+; O3-NEXT: and $8, $7, $4
+; O3-NEXT: nor $8, $zero, $8
+; O3-NEXT: and $8, $8, $5
+; O3-NEXT: and $9, $7, $6
+; O3-NEXT: or $9, $9, $8
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB10_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: and $1, $7, $5
+; O3-NEXT: srlv $1, $1, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.3: # %entry
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 24
+;
+; MIPS32EB-LABEL: AtomicLoadNand8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(y)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: sllv $4, $4, $3
+; MIPS32EB-NEXT: $BB10_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $7, 0($2)
+; MIPS32EB-NEXT: and $8, $7, $4
+; MIPS32EB-NEXT: nor $8, $zero, $8
+; MIPS32EB-NEXT: and $8, $8, $5
+; MIPS32EB-NEXT: and $9, $7, $6
+; MIPS32EB-NEXT: or $9, $9, $8
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB10_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: and $1, $7, $5
+; MIPS32EB-NEXT: srlv $1, $1, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.3: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 24
entry:
%0 = atomicrmw nand i8* @y, i8 %incr monotonic
ret i8 %0
-; ALL-LABEL: AtomicLoadNand8:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(y)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(y)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: sllv $[[R9:[0-9]+]], $4, $[[R5]]
-
-; O0: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; O0: ld $[[R10:[0-9]+]]
-; O0-NEXT: ll $[[R11:[0-9]+]], 0($[[R10]])
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R12:[0-9]+]], 0($[[R2]])
-; ALL: and $[[R13:[0-9]+]], $[[R12]], $[[R9]]
-; ALL: nor $[[R14:[0-9]+]], $zero, $[[R13]]
-; ALL: and $[[R15:[0-9]+]], $[[R14]], $[[R7]]
-; ALL: and $[[R16:[0-9]+]], $[[R12]], $[[R8]]
-; ALL: or $[[R17:[0-9]+]], $[[R16]], $[[R15]]
-; ALL: sc $[[R17]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R17]], [[BB0]]
-; MICROMIPS: beqzc $[[R17]], [[BB0]]
-; MIPSR6: beqzc $[[R17]], [[BB0]]
-
-; ALL: and $[[R18:[0-9]+]], $[[R12]], $[[R7]]
-; ALL: srlv $[[R19:[0-9]+]], $[[R18]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R20:[0-9]+]], $[[R19]], 24
-; NO-SEB-SEH: sra $2, $[[R20]], 24
-
-; HAS-SEB-SEH: seb $2, $[[R19]]
}
define signext i8 @AtomicSwap8(i8 signext %newval) nounwind {
+; MIPS32-LABEL: AtomicSwap8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(y)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: sllv $4, $4, $3
+; MIPS32-NEXT: $BB11_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $7, 0($2)
+; MIPS32-NEXT: and $8, $4, $5
+; MIPS32-NEXT: and $9, $7, $6
+; MIPS32-NEXT: or $9, $9, $8
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB11_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: and $1, $7, $5
+; MIPS32-NEXT: srlv $1, $1, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.3: # %entry
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 24
+;
+; MIPS32O0-LABEL: AtomicSwap8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(y)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 255
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: $BB11_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $6, 0($25)
+; MIPS32O0-NEXT: and $7, $4, $1
+; MIPS32O0-NEXT: and $8, $6, $3
+; MIPS32O0-NEXT: or $8, $8, $7
+; MIPS32O0-NEXT: sc $8, 0($25)
+; MIPS32O0-NEXT: beqz $8, $BB11_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: and $5, $6, $1
+; MIPS32O0-NEXT: srlv $5, $5, $2
+; MIPS32O0-NEXT: sll $5, $5, 24
+; MIPS32O0-NEXT: sra $5, $5, 24
+; MIPS32O0-NEXT: # %bb.3: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicSwap8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(y)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $2, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 255
+; MIPS32R2-NEXT: sllv $5, $1, $3
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: sllv $4, $4, $3
+; MIPS32R2-NEXT: $BB11_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $7, 0($2)
+; MIPS32R2-NEXT: and $8, $4, $5
+; MIPS32R2-NEXT: and $9, $7, $6
+; MIPS32R2-NEXT: or $9, $9, $8
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB11_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: and $1, $7, $5
+; MIPS32R2-NEXT: srlv $1, $1, $3
+; MIPS32R2-NEXT: seb $1, $1
+; MIPS32R2-NEXT: # %bb.3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: seb $2, $1
+;
+; MIPS32R6-LABEL: AtomicSwap8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(y)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $2, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 255
+; MIPS32R6-NEXT: sllv $5, $1, $3
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: sllv $4, $4, $3
+; MIPS32R6-NEXT: $BB11_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $7, 0($2)
+; MIPS32R6-NEXT: and $8, $4, $5
+; MIPS32R6-NEXT: and $9, $7, $6
+; MIPS32R6-NEXT: or $9, $9, $8
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB11_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: and $1, $7, $5
+; MIPS32R6-NEXT: srlv $1, $1, $3
+; MIPS32R6-NEXT: seb $1, $1
+; MIPS32R6-NEXT: # %bb.3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: seb $2, $1
+;
+; MIPS32R6O0-LABEL: AtomicSwap8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(y)($2)
+; MIPS32R6O0-NEXT: addiu $1, $zero, -4
+; MIPS32R6O0-NEXT: and $1, $2, $1
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $3, $zero, 255
+; MIPS32R6O0-NEXT: sllv $3, $3, $2
+; MIPS32R6O0-NEXT: nor $5, $zero, $3
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: $BB11_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $7, 0($1)
+; MIPS32R6O0-NEXT: and $8, $4, $3
+; MIPS32R6O0-NEXT: and $9, $7, $5
+; MIPS32R6O0-NEXT: or $9, $9, $8
+; MIPS32R6O0-NEXT: sc $9, 0($1)
+; MIPS32R6O0-NEXT: beqzc $9, $BB11_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: and $6, $7, $3
+; MIPS32R6O0-NEXT: srlv $6, $6, $2
+; MIPS32R6O0-NEXT: seb $6, $6
+; MIPS32R6O0-NEXT: # %bb.3: # %entry
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $6, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: lw $1, 0($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seb $2, $1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicSwap8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap8)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap8)))
+; MIPS4-NEXT: ld $1, %got_disp(y)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: sllv $4, $4, $3
+; MIPS4-NEXT: .LBB11_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $7, 0($2)
+; MIPS4-NEXT: and $8, $4, $5
+; MIPS4-NEXT: and $9, $7, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB11_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: and $1, $7, $5
+; MIPS4-NEXT: srlv $1, $1, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.3: # %entry
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 24
+;
+; MIPS64-LABEL: AtomicSwap8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: sllv $4, $4, $3
+; MIPS64-NEXT: .LBB11_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $7, 0($2)
+; MIPS64-NEXT: and $8, $4, $5
+; MIPS64-NEXT: and $9, $7, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB11_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: and $1, $7, $5
+; MIPS64-NEXT: srlv $1, $1, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.3: # %entry
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 24
+;
+; MIPS64R2-LABEL: AtomicSwap8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R2-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $2, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 255
+; MIPS64R2-NEXT: sllv $5, $1, $3
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: sllv $4, $4, $3
+; MIPS64R2-NEXT: .LBB11_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $7, 0($2)
+; MIPS64R2-NEXT: and $8, $4, $5
+; MIPS64R2-NEXT: and $9, $7, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB11_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: and $1, $7, $5
+; MIPS64R2-NEXT: srlv $1, $1, $3
+; MIPS64R2-NEXT: seb $1, $1
+; MIPS64R2-NEXT: # %bb.3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: seb $2, $1
+;
+; MIPS64R6-LABEL: AtomicSwap8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R6-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $2, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 255
+; MIPS64R6-NEXT: sllv $5, $1, $3
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: sllv $4, $4, $3
+; MIPS64R6-NEXT: .LBB11_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $7, 0($2)
+; MIPS64R6-NEXT: and $8, $4, $5
+; MIPS64R6-NEXT: and $9, $7, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB11_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: and $1, $7, $5
+; MIPS64R6-NEXT: srlv $1, $1, $3
+; MIPS64R6-NEXT: seb $1, $1
+; MIPS64R6-NEXT: # %bb.3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: seb $2, $1
+;
+; MIPS64R6O0-LABEL: AtomicSwap8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicSwap8)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $3, $1, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 3
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $5, $zero, 255
+; MIPS64R6O0-NEXT: sllv $5, $5, $3
+; MIPS64R6O0-NEXT: nor $6, $zero, $5
+; MIPS64R6O0-NEXT: sllv $2, $2, $3
+; MIPS64R6O0-NEXT: .LBB11_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $8, 0($4)
+; MIPS64R6O0-NEXT: and $9, $2, $5
+; MIPS64R6O0-NEXT: and $10, $8, $6
+; MIPS64R6O0-NEXT: or $10, $10, $9
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB11_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: and $7, $8, $5
+; MIPS64R6O0-NEXT: srlv $7, $7, $3
+; MIPS64R6O0-NEXT: seb $7, $7
+; MIPS64R6O0-NEXT: # %bb.3: # %entry
+; MIPS64R6O0-NEXT: sw $7, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seb $2, $1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicSwap8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(y)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $2, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 255
+; MM32-NEXT: sllv $5, $1, $3
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: sllv $4, $4, $3
+; MM32-NEXT: $BB11_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $7, 0($2)
+; MM32-NEXT: and $8, $4, $5
+; MM32-NEXT: and $9, $7, $6
+; MM32-NEXT: or $9, $9, $8
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB11_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: and $1, $7, $5
+; MM32-NEXT: srlv $1, $1, $3
+; MM32-NEXT: seb $1, $1
+; MM32-NEXT: # %bb.3: # %entry
+; MM32-NEXT: jr $ra
+; MM32-NEXT: seb $2, $1
+;
+; O1-LABEL: AtomicSwap8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(y)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: sllv $4, $4, $3
+; O1-NEXT: $BB11_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $7, 0($2)
+; O1-NEXT: and $8, $4, $5
+; O1-NEXT: and $9, $7, $6
+; O1-NEXT: or $9, $9, $8
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB11_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: and $1, $7, $5
+; O1-NEXT: srlv $1, $1, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.3: # %entry
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 24
+;
+; O2-LABEL: AtomicSwap8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(y)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: sllv $4, $4, $3
+; O2-NEXT: $BB11_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $7, 0($2)
+; O2-NEXT: and $8, $4, $5
+; O2-NEXT: and $9, $7, $6
+; O2-NEXT: or $9, $9, $8
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB11_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: and $1, $7, $5
+; O2-NEXT: srlv $1, $1, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.3: # %entry
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 24
+;
+; O3-LABEL: AtomicSwap8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(y)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: sllv $4, $4, $3
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: $BB11_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $7, 0($2)
+; O3-NEXT: and $8, $4, $5
+; O3-NEXT: and $9, $7, $6
+; O3-NEXT: or $9, $9, $8
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB11_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: and $1, $7, $5
+; O3-NEXT: srlv $1, $1, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.3: # %entry
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 24
+;
+; MIPS32EB-LABEL: AtomicSwap8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(y)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: sllv $4, $4, $3
+; MIPS32EB-NEXT: $BB11_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $7, 0($2)
+; MIPS32EB-NEXT: and $8, $4, $5
+; MIPS32EB-NEXT: and $9, $7, $6
+; MIPS32EB-NEXT: or $9, $9, $8
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB11_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: and $1, $7, $5
+; MIPS32EB-NEXT: srlv $1, $1, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.3: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 24
entry:
%0 = atomicrmw xchg i8* @y, i8 %newval monotonic
ret i8 %0
-
-; ALL-LABEL: AtomicSwap8:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(y)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(y)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: sllv $[[R9:[0-9]+]], $4, $[[R5]]
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R10:[0-9]+]], 0($[[R2]])
-; ALL: and $[[R18:[0-9]+]], $[[R9]], $[[R7]]
-; ALL: and $[[R13:[0-9]+]], $[[R10]], $[[R8]]
-; ALL: or $[[R14:[0-9]+]], $[[R13]], $[[R18]]
-; ALL: sc $[[R14]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R14]], [[BB0]]
-; MICROMIPS: beqzc $[[R14]], [[BB0]]
-; MIPSR6: beqzc $[[R14]], [[BB0]]
-
-; ALL: and $[[R15:[0-9]+]], $[[R10]], $[[R7]]
-; ALL: srlv $[[R16:[0-9]+]], $[[R15]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R17:[0-9]+]], $[[R16]], 24
-; NO-SEB-SEH: sra $2, $[[R17]], 24
-
-; HAS-SEB-SEH: seb $2, $[[R16]]
-
}
define signext i8 @AtomicCmpSwap8(i8 signext %oldval, i8 signext %newval) nounwind {
+; MIPS32-LABEL: AtomicCmpSwap8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(y)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $6, $1, $3
+; MIPS32-NEXT: nor $7, $zero, $6
+; MIPS32-NEXT: andi $1, $4, 255
+; MIPS32-NEXT: sllv $4, $1, $3
+; MIPS32-NEXT: andi $1, $5, 255
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: $BB12_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $8, 0($2)
+; MIPS32-NEXT: and $9, $8, $6
+; MIPS32-NEXT: bne $9, $4, $BB12_3
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32-NEXT: and $8, $8, $7
+; MIPS32-NEXT: or $8, $8, $5
+; MIPS32-NEXT: sc $8, 0($2)
+; MIPS32-NEXT: beqz $8, $BB12_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: $BB12_3: # %entry
+; MIPS32-NEXT: srlv $1, $9, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.4: # %entry
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 24
+;
+; MIPS32O0-LABEL: AtomicCmpSwap8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(y)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 255
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: andi $4, $4, 255
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: andi $5, $5, 255
+; MIPS32O0-NEXT: sllv $5, $5, $2
+; MIPS32O0-NEXT: $BB12_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $7, 0($25)
+; MIPS32O0-NEXT: and $8, $7, $1
+; MIPS32O0-NEXT: bne $8, $4, $BB12_3
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32O0-NEXT: and $7, $7, $3
+; MIPS32O0-NEXT: or $7, $7, $5
+; MIPS32O0-NEXT: sc $7, 0($25)
+; MIPS32O0-NEXT: beqz $7, $BB12_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: $BB12_3: # %entry
+; MIPS32O0-NEXT: srlv $6, $8, $2
+; MIPS32O0-NEXT: sll $6, $6, 24
+; MIPS32O0-NEXT: sra $6, $6, 24
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: sw $6, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.5: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicCmpSwap8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(y)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $3, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $1, $1, 3
+; MIPS32R2-NEXT: ori $2, $zero, 255
+; MIPS32R2-NEXT: sllv $6, $2, $1
+; MIPS32R2-NEXT: nor $7, $zero, $6
+; MIPS32R2-NEXT: andi $2, $4, 255
+; MIPS32R2-NEXT: sllv $4, $2, $1
+; MIPS32R2-NEXT: andi $2, $5, 255
+; MIPS32R2-NEXT: sllv $5, $2, $1
+; MIPS32R2-NEXT: $BB12_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $8, 0($3)
+; MIPS32R2-NEXT: and $9, $8, $6
+; MIPS32R2-NEXT: bne $9, $4, $BB12_3
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32R2-NEXT: and $8, $8, $7
+; MIPS32R2-NEXT: or $8, $8, $5
+; MIPS32R2-NEXT: sc $8, 0($3)
+; MIPS32R2-NEXT: beqz $8, $BB12_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: $BB12_3: # %entry
+; MIPS32R2-NEXT: srlv $2, $9, $1
+; MIPS32R2-NEXT: seb $2, $2
+; MIPS32R2-NEXT: # %bb.4: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicCmpSwap8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(y)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $3, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $1, $1, 3
+; MIPS32R6-NEXT: ori $2, $zero, 255
+; MIPS32R6-NEXT: sllv $6, $2, $1
+; MIPS32R6-NEXT: nor $7, $zero, $6
+; MIPS32R6-NEXT: andi $2, $4, 255
+; MIPS32R6-NEXT: sllv $4, $2, $1
+; MIPS32R6-NEXT: andi $2, $5, 255
+; MIPS32R6-NEXT: sllv $5, $2, $1
+; MIPS32R6-NEXT: $BB12_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $8, 0($3)
+; MIPS32R6-NEXT: and $9, $8, $6
+; MIPS32R6-NEXT: bnec $9, $4, $BB12_3
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32R6-NEXT: and $8, $8, $7
+; MIPS32R6-NEXT: or $8, $8, $5
+; MIPS32R6-NEXT: sc $8, 0($3)
+; MIPS32R6-NEXT: beqzc $8, $BB12_1
+; MIPS32R6-NEXT: $BB12_3: # %entry
+; MIPS32R6-NEXT: srlv $2, $9, $1
+; MIPS32R6-NEXT: seb $2, $2
+; MIPS32R6-NEXT: # %bb.4: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicCmpSwap8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -16
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $5
+; MIPS32R6O0-NEXT: move $1, $4
+; MIPS32R6O0-NEXT: lw $2, %got(y)($2)
+; MIPS32R6O0-NEXT: addiu $3, $zero, -4
+; MIPS32R6O0-NEXT: and $3, $2, $3
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $6, $zero, 255
+; MIPS32R6O0-NEXT: sllv $6, $6, $2
+; MIPS32R6O0-NEXT: nor $7, $zero, $6
+; MIPS32R6O0-NEXT: andi $4, $4, 255
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: andi $5, $5, 255
+; MIPS32R6O0-NEXT: sllv $5, $5, $2
+; MIPS32R6O0-NEXT: $BB12_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $9, 0($3)
+; MIPS32R6O0-NEXT: and $10, $9, $6
+; MIPS32R6O0-NEXT: bnec $10, $4, $BB12_3
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32R6O0-NEXT: and $9, $9, $7
+; MIPS32R6O0-NEXT: or $9, $9, $5
+; MIPS32R6O0-NEXT: sc $9, 0($3)
+; MIPS32R6O0-NEXT: beqzc $9, $BB12_1
+; MIPS32R6O0-NEXT: $BB12_3: # %entry
+; MIPS32R6O0-NEXT: srlv $8, $10, $2
+; MIPS32R6O0-NEXT: seb $8, $8
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: sw $1, 12($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $8, 8($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.5: # %entry
+; MIPS32R6O0-NEXT: lw $2, 8($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 16
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicCmpSwap8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS4-NEXT: ld $1, %got_disp(y)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $6, $1, $3
+; MIPS4-NEXT: nor $7, $zero, $6
+; MIPS4-NEXT: andi $1, $4, 255
+; MIPS4-NEXT: sllv $4, $1, $3
+; MIPS4-NEXT: andi $1, $5, 255
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: .LBB12_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $8, 0($2)
+; MIPS4-NEXT: and $9, $8, $6
+; MIPS4-NEXT: bne $9, $4, .LBB12_3
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS4-NEXT: and $8, $8, $7
+; MIPS4-NEXT: or $8, $8, $5
+; MIPS4-NEXT: sc $8, 0($2)
+; MIPS4-NEXT: beqz $8, .LBB12_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: .LBB12_3: # %entry
+; MIPS4-NEXT: srlv $1, $9, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.4: # %entry
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 24
+;
+; MIPS64-LABEL: AtomicCmpSwap8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $6, $1, $3
+; MIPS64-NEXT: nor $7, $zero, $6
+; MIPS64-NEXT: andi $1, $4, 255
+; MIPS64-NEXT: sllv $4, $1, $3
+; MIPS64-NEXT: andi $1, $5, 255
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: .LBB12_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $8, 0($2)
+; MIPS64-NEXT: and $9, $8, $6
+; MIPS64-NEXT: bne $9, $4, .LBB12_3
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS64-NEXT: and $8, $8, $7
+; MIPS64-NEXT: or $8, $8, $5
+; MIPS64-NEXT: sc $8, 0($2)
+; MIPS64-NEXT: beqz $8, .LBB12_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: .LBB12_3: # %entry
+; MIPS64-NEXT: srlv $1, $9, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.4: # %entry
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 24
+;
+; MIPS64R2-LABEL: AtomicCmpSwap8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R2-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $3, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $1, $1, 3
+; MIPS64R2-NEXT: ori $2, $zero, 255
+; MIPS64R2-NEXT: sllv $6, $2, $1
+; MIPS64R2-NEXT: nor $7, $zero, $6
+; MIPS64R2-NEXT: andi $2, $4, 255
+; MIPS64R2-NEXT: sllv $4, $2, $1
+; MIPS64R2-NEXT: andi $2, $5, 255
+; MIPS64R2-NEXT: sllv $5, $2, $1
+; MIPS64R2-NEXT: .LBB12_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $8, 0($3)
+; MIPS64R2-NEXT: and $9, $8, $6
+; MIPS64R2-NEXT: bne $9, $4, .LBB12_3
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS64R2-NEXT: and $8, $8, $7
+; MIPS64R2-NEXT: or $8, $8, $5
+; MIPS64R2-NEXT: sc $8, 0($3)
+; MIPS64R2-NEXT: beqz $8, .LBB12_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: .LBB12_3: # %entry
+; MIPS64R2-NEXT: srlv $2, $9, $1
+; MIPS64R2-NEXT: seb $2, $2
+; MIPS64R2-NEXT: # %bb.4: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicCmpSwap8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R6-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $3, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $1, $1, 3
+; MIPS64R6-NEXT: ori $2, $zero, 255
+; MIPS64R6-NEXT: sllv $6, $2, $1
+; MIPS64R6-NEXT: nor $7, $zero, $6
+; MIPS64R6-NEXT: andi $2, $4, 255
+; MIPS64R6-NEXT: sllv $4, $2, $1
+; MIPS64R6-NEXT: andi $2, $5, 255
+; MIPS64R6-NEXT: sllv $5, $2, $1
+; MIPS64R6-NEXT: .LBB12_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $8, 0($3)
+; MIPS64R6-NEXT: and $9, $8, $6
+; MIPS64R6-NEXT: bnec $9, $4, .LBB12_3
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS64R6-NEXT: and $8, $8, $7
+; MIPS64R6-NEXT: or $8, $8, $5
+; MIPS64R6-NEXT: sc $8, 0($3)
+; MIPS64R6-NEXT: beqzc $8, .LBB12_1
+; MIPS64R6-NEXT: .LBB12_3: # %entry
+; MIPS64R6-NEXT: srlv $2, $9, $1
+; MIPS64R6-NEXT: seb $2, $2
+; MIPS64R6-NEXT: # %bb.4: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicCmpSwap8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicCmpSwap8)))
+; MIPS64R6O0-NEXT: move $2, $5
+; MIPS64R6O0-NEXT: move $3, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(y)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $6, $1, 3
+; MIPS64R6O0-NEXT: xori $6, $6, 3
+; MIPS64R6O0-NEXT: sll $6, $6, 3
+; MIPS64R6O0-NEXT: ori $7, $zero, 255
+; MIPS64R6O0-NEXT: sllv $7, $7, $6
+; MIPS64R6O0-NEXT: nor $8, $zero, $7
+; MIPS64R6O0-NEXT: andi $3, $3, 255
+; MIPS64R6O0-NEXT: sllv $3, $3, $6
+; MIPS64R6O0-NEXT: andi $2, $2, 255
+; MIPS64R6O0-NEXT: sllv $2, $2, $6
+; MIPS64R6O0-NEXT: .LBB12_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $10, 0($4)
+; MIPS64R6O0-NEXT: and $11, $10, $7
+; MIPS64R6O0-NEXT: bnec $11, $3, .LBB12_3
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS64R6O0-NEXT: and $10, $10, $8
+; MIPS64R6O0-NEXT: or $10, $10, $2
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB12_1
+; MIPS64R6O0-NEXT: .LBB12_3: # %entry
+; MIPS64R6O0-NEXT: srlv $9, $11, $6
+; MIPS64R6O0-NEXT: seb $9, $9
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: sw $9, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.5: # %entry
+; MIPS64R6O0-NEXT: lw $2, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicCmpSwap8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(y)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $3, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $1, $1, 3
+; MM32-NEXT: ori $2, $zero, 255
+; MM32-NEXT: sllv $6, $2, $1
+; MM32-NEXT: nor $7, $zero, $6
+; MM32-NEXT: andi $2, $4, 255
+; MM32-NEXT: sllv $4, $2, $1
+; MM32-NEXT: andi $2, $5, 255
+; MM32-NEXT: sllv $5, $2, $1
+; MM32-NEXT: $BB12_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $8, 0($3)
+; MM32-NEXT: and $9, $8, $6
+; MM32-NEXT: bne $9, $4, $BB12_3
+; MM32-NEXT: nop
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MM32-NEXT: and $8, $8, $7
+; MM32-NEXT: or $8, $8, $5
+; MM32-NEXT: sc $8, 0($3)
+; MM32-NEXT: beqzc $8, $BB12_1
+; MM32-NEXT: $BB12_3: # %entry
+; MM32-NEXT: srlv $2, $9, $1
+; MM32-NEXT: seb $2, $2
+; MM32-NEXT: # %bb.4: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicCmpSwap8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(y)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $6, $1, $3
+; O1-NEXT: nor $7, $zero, $6
+; O1-NEXT: andi $1, $4, 255
+; O1-NEXT: sllv $4, $1, $3
+; O1-NEXT: andi $1, $5, 255
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: $BB12_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $8, 0($2)
+; O1-NEXT: and $9, $8, $6
+; O1-NEXT: bne $9, $4, $BB12_3
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: # in Loop: Header=BB12_1 Depth=1
+; O1-NEXT: and $8, $8, $7
+; O1-NEXT: or $8, $8, $5
+; O1-NEXT: sc $8, 0($2)
+; O1-NEXT: beqz $8, $BB12_1
+; O1-NEXT: nop
+; O1-NEXT: $BB12_3: # %entry
+; O1-NEXT: srlv $1, $9, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.4: # %entry
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 24
+;
+; O2-LABEL: AtomicCmpSwap8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(y)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $6, $1, $3
+; O2-NEXT: nor $7, $zero, $6
+; O2-NEXT: andi $1, $4, 255
+; O2-NEXT: sllv $4, $1, $3
+; O2-NEXT: andi $1, $5, 255
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: $BB12_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $8, 0($2)
+; O2-NEXT: and $9, $8, $6
+; O2-NEXT: bne $9, $4, $BB12_3
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: # in Loop: Header=BB12_1 Depth=1
+; O2-NEXT: and $8, $8, $7
+; O2-NEXT: or $8, $8, $5
+; O2-NEXT: sc $8, 0($2)
+; O2-NEXT: beqz $8, $BB12_1
+; O2-NEXT: nop
+; O2-NEXT: $BB12_3: # %entry
+; O2-NEXT: srlv $1, $9, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.4: # %entry
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 24
+;
+; O3-LABEL: AtomicCmpSwap8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(y)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $6, $1, $3
+; O3-NEXT: andi $1, $4, 255
+; O3-NEXT: sllv $4, $1, $3
+; O3-NEXT: andi $1, $5, 255
+; O3-NEXT: nor $7, $zero, $6
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: $BB12_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $8, 0($2)
+; O3-NEXT: and $9, $8, $6
+; O3-NEXT: bne $9, $4, $BB12_3
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: # in Loop: Header=BB12_1 Depth=1
+; O3-NEXT: and $8, $8, $7
+; O3-NEXT: or $8, $8, $5
+; O3-NEXT: sc $8, 0($2)
+; O3-NEXT: beqz $8, $BB12_1
+; O3-NEXT: nop
+; O3-NEXT: $BB12_3: # %entry
+; O3-NEXT: srlv $1, $9, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.4: # %entry
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 24
+;
+; MIPS32EB-LABEL: AtomicCmpSwap8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(y)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $6, $1, $3
+; MIPS32EB-NEXT: nor $7, $zero, $6
+; MIPS32EB-NEXT: andi $1, $4, 255
+; MIPS32EB-NEXT: sllv $4, $1, $3
+; MIPS32EB-NEXT: andi $1, $5, 255
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: $BB12_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $8, 0($2)
+; MIPS32EB-NEXT: and $9, $8, $6
+; MIPS32EB-NEXT: bne $9, $4, $BB12_3
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: # in Loop: Header=BB12_1 Depth=1
+; MIPS32EB-NEXT: and $8, $8, $7
+; MIPS32EB-NEXT: or $8, $8, $5
+; MIPS32EB-NEXT: sc $8, 0($2)
+; MIPS32EB-NEXT: beqz $8, $BB12_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: $BB12_3: # %entry
+; MIPS32EB-NEXT: srlv $1, $9, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.4: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 24
entry:
%pair0 = cmpxchg i8* @y, i8 %oldval, i8 %newval monotonic monotonic
%0 = extractvalue { i8, i1 } %pair0, 0
ret i8 %0
-
-; ALL-LABEL: AtomicCmpSwap8:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(y)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(y)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: andi $[[R9:[0-9]+]], $4, 255
-; ALL: sllv $[[R10:[0-9]+]], $[[R9]], $[[R5]]
-; ALL: andi $[[R11:[0-9]+]], $5, 255
-; ALL: sllv $[[R12:[0-9]+]], $[[R11]], $[[R5]]
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R13:[0-9]+]], 0($[[R2]])
-; ALL: and $[[R14:[0-9]+]], $[[R13]], $[[R7]]
-; NOT-MICROMIPS: bne $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MICROMIPS: bne $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MIPSR6: bnec $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-
-; ALL: and $[[R15:[0-9]+]], $[[R13]], $[[R8]]
-; ALL: or $[[R16:[0-9]+]], $[[R15]], $[[R12]]
-; ALL: sc $[[R16]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R16]], [[BB0]]
-; MICROMIPS: beqzc $[[R16]], [[BB0]]
-; MIPSR6: beqzc $[[R16]], [[BB0]]
-
-; ALL: [[BB1]]:
-; ALL: srlv $[[R17:[0-9]+]], $[[R14]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R18:[0-9]+]], $[[R17]], 24
-; NO-SEB-SEH: sra $2, $[[R18]], 24
-
-; HAS-SEB-SEH: seb $2, $[[R17]]
}
define i1 @AtomicCmpSwapRes8(i8* %ptr, i8 signext %oldval, i8 signext %newval) nounwind {
+; MIPS32-LABEL: AtomicCmpSwapRes8:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: addiu $1, $zero, -4
+; MIPS32-NEXT: and $2, $4, $1
+; MIPS32-NEXT: andi $1, $4, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 255
+; MIPS32-NEXT: sllv $4, $1, $3
+; MIPS32-NEXT: nor $7, $zero, $4
+; MIPS32-NEXT: andi $1, $5, 255
+; MIPS32-NEXT: sllv $8, $1, $3
+; MIPS32-NEXT: andi $1, $6, 255
+; MIPS32-NEXT: sllv $6, $1, $3
+; MIPS32-NEXT: $BB13_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $9, 0($2)
+; MIPS32-NEXT: and $10, $9, $4
+; MIPS32-NEXT: bne $10, $8, $BB13_3
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32-NEXT: and $9, $9, $7
+; MIPS32-NEXT: or $9, $9, $6
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB13_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: $BB13_3: # %entry
+; MIPS32-NEXT: srlv $1, $10, $3
+; MIPS32-NEXT: sll $1, $1, 24
+; MIPS32-NEXT: sra $1, $1, 24
+; MIPS32-NEXT: # %bb.4: # %entry
+; MIPS32-NEXT: sll $2, $5, 24
+; MIPS32-NEXT: sra $2, $2, 24
+; MIPS32-NEXT: xor $1, $1, $2
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sltiu $2, $1, 1
+;
+; MIPS32O0-LABEL: AtomicCmpSwapRes8:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addiu $1, $zero, -4
+; MIPS32O0-NEXT: and $1, $4, $1
+; MIPS32O0-NEXT: andi $4, $4, 3
+; MIPS32O0-NEXT: sll $4, $4, 3
+; MIPS32O0-NEXT: ori $2, $zero, 255
+; MIPS32O0-NEXT: sllv $2, $2, $4
+; MIPS32O0-NEXT: nor $3, $zero, $2
+; MIPS32O0-NEXT: andi $7, $5, 255
+; MIPS32O0-NEXT: sllv $7, $7, $4
+; MIPS32O0-NEXT: andi $6, $6, 255
+; MIPS32O0-NEXT: sllv $6, $6, $4
+; MIPS32O0-NEXT: $BB13_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $9, 0($1)
+; MIPS32O0-NEXT: and $10, $9, $2
+; MIPS32O0-NEXT: bne $10, $7, $BB13_3
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32O0-NEXT: and $9, $9, $3
+; MIPS32O0-NEXT: or $9, $9, $6
+; MIPS32O0-NEXT: sc $9, 0($1)
+; MIPS32O0-NEXT: beqz $9, $BB13_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: $BB13_3: # %entry
+; MIPS32O0-NEXT: srlv $8, $10, $4
+; MIPS32O0-NEXT: sll $8, $8, 24
+; MIPS32O0-NEXT: sra $8, $8, 24
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $8, 0($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.5: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 24
+; MIPS32O0-NEXT: sra $2, $2, 24
+; MIPS32O0-NEXT: lw $3, 0($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: xor $2, $3, $2
+; MIPS32O0-NEXT: sltiu $2, $2, 1
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicCmpSwapRes8:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: addiu $1, $zero, -4
+; MIPS32R2-NEXT: and $2, $4, $1
+; MIPS32R2-NEXT: andi $1, $4, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 255
+; MIPS32R2-NEXT: sllv $4, $1, $3
+; MIPS32R2-NEXT: nor $7, $zero, $4
+; MIPS32R2-NEXT: andi $1, $5, 255
+; MIPS32R2-NEXT: sllv $8, $1, $3
+; MIPS32R2-NEXT: andi $1, $6, 255
+; MIPS32R2-NEXT: sllv $6, $1, $3
+; MIPS32R2-NEXT: $BB13_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $9, 0($2)
+; MIPS32R2-NEXT: and $10, $9, $4
+; MIPS32R2-NEXT: bne $10, $8, $BB13_3
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32R2-NEXT: and $9, $9, $7
+; MIPS32R2-NEXT: or $9, $9, $6
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB13_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: $BB13_3: # %entry
+; MIPS32R2-NEXT: srlv $1, $10, $3
+; MIPS32R2-NEXT: seb $1, $1
+; MIPS32R2-NEXT: # %bb.4: # %entry
+; MIPS32R2-NEXT: xor $1, $1, $5
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: sltiu $2, $1, 1
+;
+; MIPS32R6-LABEL: AtomicCmpSwapRes8:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: addiu $1, $zero, -4
+; MIPS32R6-NEXT: and $2, $4, $1
+; MIPS32R6-NEXT: andi $1, $4, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 255
+; MIPS32R6-NEXT: sllv $4, $1, $3
+; MIPS32R6-NEXT: nor $7, $zero, $4
+; MIPS32R6-NEXT: andi $1, $5, 255
+; MIPS32R6-NEXT: sllv $8, $1, $3
+; MIPS32R6-NEXT: andi $1, $6, 255
+; MIPS32R6-NEXT: sllv $6, $1, $3
+; MIPS32R6-NEXT: $BB13_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $9, 0($2)
+; MIPS32R6-NEXT: and $10, $9, $4
+; MIPS32R6-NEXT: bnec $10, $8, $BB13_3
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32R6-NEXT: and $9, $9, $7
+; MIPS32R6-NEXT: or $9, $9, $6
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB13_1
+; MIPS32R6-NEXT: $BB13_3: # %entry
+; MIPS32R6-NEXT: srlv $1, $10, $3
+; MIPS32R6-NEXT: seb $1, $1
+; MIPS32R6-NEXT: # %bb.4: # %entry
+; MIPS32R6-NEXT: xor $1, $1, $5
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: sltiu $2, $1, 1
+;
+; MIPS32R6O0-LABEL: AtomicCmpSwapRes8:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -24
+; MIPS32R6O0-NEXT: move $1, $6
+; MIPS32R6O0-NEXT: move $2, $5
+; MIPS32R6O0-NEXT: move $3, $4
+; MIPS32R6O0-NEXT: addiu $7, $zero, -4
+; MIPS32R6O0-NEXT: and $7, $4, $7
+; MIPS32R6O0-NEXT: andi $4, $4, 3
+; MIPS32R6O0-NEXT: sll $4, $4, 3
+; MIPS32R6O0-NEXT: ori $8, $zero, 255
+; MIPS32R6O0-NEXT: sllv $8, $8, $4
+; MIPS32R6O0-NEXT: nor $9, $zero, $8
+; MIPS32R6O0-NEXT: andi $10, $5, 255
+; MIPS32R6O0-NEXT: sllv $10, $10, $4
+; MIPS32R6O0-NEXT: andi $6, $6, 255
+; MIPS32R6O0-NEXT: sllv $6, $6, $4
+; MIPS32R6O0-NEXT: $BB13_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $12, 0($7)
+; MIPS32R6O0-NEXT: and $13, $12, $8
+; MIPS32R6O0-NEXT: bnec $13, $10, $BB13_3
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32R6O0-NEXT: and $12, $12, $9
+; MIPS32R6O0-NEXT: or $12, $12, $6
+; MIPS32R6O0-NEXT: sc $12, 0($7)
+; MIPS32R6O0-NEXT: beqzc $12, $BB13_1
+; MIPS32R6O0-NEXT: $BB13_3: # %entry
+; MIPS32R6O0-NEXT: srlv $11, $13, $4
+; MIPS32R6O0-NEXT: seb $11, $11
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: sw $11, 20($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $5, 16($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $3, 12($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $1, 8($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $2, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.5: # %entry
+; MIPS32R6O0-NEXT: lw $1, 20($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: lw $2, 16($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: xor $1, $1, $2
+; MIPS32R6O0-NEXT: sltiu $2, $1, 1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 24
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicCmpSwapRes8:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: daddiu $1, $zero, -4
+; MIPS4-NEXT: and $2, $4, $1
+; MIPS4-NEXT: andi $1, $4, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 255
+; MIPS4-NEXT: sllv $4, $1, $3
+; MIPS4-NEXT: nor $7, $zero, $4
+; MIPS4-NEXT: andi $1, $5, 255
+; MIPS4-NEXT: sllv $8, $1, $3
+; MIPS4-NEXT: andi $1, $6, 255
+; MIPS4-NEXT: sllv $6, $1, $3
+; MIPS4-NEXT: .LBB13_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $9, 0($2)
+; MIPS4-NEXT: and $10, $9, $4
+; MIPS4-NEXT: bne $10, $8, .LBB13_3
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS4-NEXT: and $9, $9, $7
+; MIPS4-NEXT: or $9, $9, $6
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB13_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: .LBB13_3: # %entry
+; MIPS4-NEXT: srlv $1, $10, $3
+; MIPS4-NEXT: sll $1, $1, 24
+; MIPS4-NEXT: sra $1, $1, 24
+; MIPS4-NEXT: # %bb.4: # %entry
+; MIPS4-NEXT: sll $2, $5, 24
+; MIPS4-NEXT: sra $2, $2, 24
+; MIPS4-NEXT: xor $1, $1, $2
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sltiu $2, $1, 1
+;
+; MIPS64-LABEL: AtomicCmpSwapRes8:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: daddiu $1, $zero, -4
+; MIPS64-NEXT: and $2, $4, $1
+; MIPS64-NEXT: andi $1, $4, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 255
+; MIPS64-NEXT: sllv $4, $1, $3
+; MIPS64-NEXT: nor $7, $zero, $4
+; MIPS64-NEXT: andi $1, $5, 255
+; MIPS64-NEXT: sllv $8, $1, $3
+; MIPS64-NEXT: andi $1, $6, 255
+; MIPS64-NEXT: sllv $6, $1, $3
+; MIPS64-NEXT: .LBB13_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $9, 0($2)
+; MIPS64-NEXT: and $10, $9, $4
+; MIPS64-NEXT: bne $10, $8, .LBB13_3
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS64-NEXT: and $9, $9, $7
+; MIPS64-NEXT: or $9, $9, $6
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB13_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: .LBB13_3: # %entry
+; MIPS64-NEXT: srlv $1, $10, $3
+; MIPS64-NEXT: sll $1, $1, 24
+; MIPS64-NEXT: sra $1, $1, 24
+; MIPS64-NEXT: # %bb.4: # %entry
+; MIPS64-NEXT: sll $2, $5, 24
+; MIPS64-NEXT: sra $2, $2, 24
+; MIPS64-NEXT: xor $1, $1, $2
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sltiu $2, $1, 1
+;
+; MIPS64R2-LABEL: AtomicCmpSwapRes8:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: daddiu $1, $zero, -4
+; MIPS64R2-NEXT: and $2, $4, $1
+; MIPS64R2-NEXT: andi $1, $4, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 255
+; MIPS64R2-NEXT: sllv $4, $1, $3
+; MIPS64R2-NEXT: nor $7, $zero, $4
+; MIPS64R2-NEXT: andi $1, $5, 255
+; MIPS64R2-NEXT: sllv $8, $1, $3
+; MIPS64R2-NEXT: andi $1, $6, 255
+; MIPS64R2-NEXT: sllv $6, $1, $3
+; MIPS64R2-NEXT: .LBB13_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $9, 0($2)
+; MIPS64R2-NEXT: and $10, $9, $4
+; MIPS64R2-NEXT: bne $10, $8, .LBB13_3
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS64R2-NEXT: and $9, $9, $7
+; MIPS64R2-NEXT: or $9, $9, $6
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB13_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: .LBB13_3: # %entry
+; MIPS64R2-NEXT: srlv $1, $10, $3
+; MIPS64R2-NEXT: seb $1, $1
+; MIPS64R2-NEXT: # %bb.4: # %entry
+; MIPS64R2-NEXT: xor $1, $1, $5
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: sltiu $2, $1, 1
+;
+; MIPS64R6-LABEL: AtomicCmpSwapRes8:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: daddiu $1, $zero, -4
+; MIPS64R6-NEXT: and $2, $4, $1
+; MIPS64R6-NEXT: andi $1, $4, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 255
+; MIPS64R6-NEXT: sllv $4, $1, $3
+; MIPS64R6-NEXT: nor $7, $zero, $4
+; MIPS64R6-NEXT: andi $1, $5, 255
+; MIPS64R6-NEXT: sllv $8, $1, $3
+; MIPS64R6-NEXT: andi $1, $6, 255
+; MIPS64R6-NEXT: sllv $6, $1, $3
+; MIPS64R6-NEXT: .LBB13_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $9, 0($2)
+; MIPS64R6-NEXT: and $10, $9, $4
+; MIPS64R6-NEXT: bnec $10, $8, .LBB13_3
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS64R6-NEXT: and $9, $9, $7
+; MIPS64R6-NEXT: or $9, $9, $6
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB13_1
+; MIPS64R6-NEXT: .LBB13_3: # %entry
+; MIPS64R6-NEXT: srlv $1, $10, $3
+; MIPS64R6-NEXT: seb $1, $1
+; MIPS64R6-NEXT: # %bb.4: # %entry
+; MIPS64R6-NEXT: xor $1, $1, $5
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: sltiu $2, $1, 1
+;
+; MIPS64R6O0-LABEL: AtomicCmpSwapRes8:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: move $1, $6
+; MIPS64R6O0-NEXT: move $2, $5
+; MIPS64R6O0-NEXT: move $5, $4
+; MIPS64R6O0-NEXT: daddiu $6, $zero, -4
+; MIPS64R6O0-NEXT: and $6, $4, $6
+; MIPS64R6O0-NEXT: andi $3, $4, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 3
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $7, $zero, 255
+; MIPS64R6O0-NEXT: sllv $7, $7, $3
+; MIPS64R6O0-NEXT: nor $8, $zero, $7
+; MIPS64R6O0-NEXT: andi $9, $2, 255
+; MIPS64R6O0-NEXT: sllv $9, $9, $3
+; MIPS64R6O0-NEXT: andi $1, $1, 255
+; MIPS64R6O0-NEXT: sllv $1, $1, $3
+; MIPS64R6O0-NEXT: .LBB13_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $11, 0($6)
+; MIPS64R6O0-NEXT: and $12, $11, $7
+; MIPS64R6O0-NEXT: bnec $12, $9, .LBB13_3
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS64R6O0-NEXT: and $11, $11, $8
+; MIPS64R6O0-NEXT: or $11, $11, $1
+; MIPS64R6O0-NEXT: sc $11, 0($6)
+; MIPS64R6O0-NEXT: beqzc $11, .LBB13_1
+; MIPS64R6O0-NEXT: .LBB13_3: # %entry
+; MIPS64R6O0-NEXT: srlv $10, $12, $3
+; MIPS64R6O0-NEXT: seb $10, $10
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: sd $5, 8($sp) # 8-byte Folded Spill
+; MIPS64R6O0-NEXT: sw $10, 4($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: sw $2, 0($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.5: # %entry
+; MIPS64R6O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: lw $2, 0($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: xor $1, $1, $2
+; MIPS64R6O0-NEXT: sltiu $2, $1, 1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicCmpSwapRes8:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: addiu $1, $zero, -4
+; MM32-NEXT: and $2, $4, $1
+; MM32-NEXT: andi $1, $4, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 255
+; MM32-NEXT: sllv $4, $1, $3
+; MM32-NEXT: nor $7, $zero, $4
+; MM32-NEXT: andi $1, $5, 255
+; MM32-NEXT: sllv $8, $1, $3
+; MM32-NEXT: andi $1, $6, 255
+; MM32-NEXT: sllv $6, $1, $3
+; MM32-NEXT: $BB13_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $9, 0($2)
+; MM32-NEXT: and $10, $9, $4
+; MM32-NEXT: bne $10, $8, $BB13_3
+; MM32-NEXT: nop
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MM32-NEXT: and $9, $9, $7
+; MM32-NEXT: or $9, $9, $6
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB13_1
+; MM32-NEXT: $BB13_3: # %entry
+; MM32-NEXT: srlv $1, $10, $3
+; MM32-NEXT: seb $1, $1
+; MM32-NEXT: # %bb.4: # %entry
+; MM32-NEXT: xor $1, $1, $5
+; MM32-NEXT: jr $ra
+; MM32-NEXT: sltiu $2, $1, 1
+;
+; O1-LABEL: AtomicCmpSwapRes8:
+; O1: # %bb.0: # %entry
+; O1-NEXT: addiu $1, $zero, -4
+; O1-NEXT: and $2, $4, $1
+; O1-NEXT: andi $1, $4, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 255
+; O1-NEXT: sllv $4, $1, $3
+; O1-NEXT: nor $7, $zero, $4
+; O1-NEXT: andi $1, $5, 255
+; O1-NEXT: sllv $8, $1, $3
+; O1-NEXT: andi $1, $6, 255
+; O1-NEXT: sllv $6, $1, $3
+; O1-NEXT: $BB13_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $9, 0($2)
+; O1-NEXT: and $10, $9, $4
+; O1-NEXT: bne $10, $8, $BB13_3
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: # in Loop: Header=BB13_1 Depth=1
+; O1-NEXT: and $9, $9, $7
+; O1-NEXT: or $9, $9, $6
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB13_1
+; O1-NEXT: nop
+; O1-NEXT: $BB13_3: # %entry
+; O1-NEXT: srlv $1, $10, $3
+; O1-NEXT: sll $1, $1, 24
+; O1-NEXT: sra $1, $1, 24
+; O1-NEXT: # %bb.4: # %entry
+; O1-NEXT: sll $2, $5, 24
+; O1-NEXT: sra $2, $2, 24
+; O1-NEXT: xor $1, $1, $2
+; O1-NEXT: jr $ra
+; O1-NEXT: sltiu $2, $1, 1
+;
+; O2-LABEL: AtomicCmpSwapRes8:
+; O2: # %bb.0: # %entry
+; O2-NEXT: addiu $1, $zero, -4
+; O2-NEXT: and $2, $4, $1
+; O2-NEXT: andi $1, $4, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 255
+; O2-NEXT: sllv $4, $1, $3
+; O2-NEXT: nor $7, $zero, $4
+; O2-NEXT: andi $1, $5, 255
+; O2-NEXT: sllv $8, $1, $3
+; O2-NEXT: andi $1, $6, 255
+; O2-NEXT: sllv $6, $1, $3
+; O2-NEXT: $BB13_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $9, 0($2)
+; O2-NEXT: and $10, $9, $4
+; O2-NEXT: bne $10, $8, $BB13_3
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: # in Loop: Header=BB13_1 Depth=1
+; O2-NEXT: and $9, $9, $7
+; O2-NEXT: or $9, $9, $6
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB13_1
+; O2-NEXT: nop
+; O2-NEXT: $BB13_3: # %entry
+; O2-NEXT: srlv $1, $10, $3
+; O2-NEXT: sll $1, $1, 24
+; O2-NEXT: sra $1, $1, 24
+; O2-NEXT: # %bb.4: # %entry
+; O2-NEXT: sll $2, $5, 24
+; O2-NEXT: sra $2, $2, 24
+; O2-NEXT: xor $1, $1, $2
+; O2-NEXT: jr $ra
+; O2-NEXT: sltiu $2, $1, 1
+;
+; O3-LABEL: AtomicCmpSwapRes8:
+; O3: # %bb.0: # %entry
+; O3-NEXT: addiu $1, $zero, -4
+; O3-NEXT: and $2, $4, $1
+; O3-NEXT: andi $1, $4, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 255
+; O3-NEXT: sllv $4, $1, $3
+; O3-NEXT: andi $1, $5, 255
+; O3-NEXT: sllv $8, $1, $3
+; O3-NEXT: andi $1, $6, 255
+; O3-NEXT: nor $7, $zero, $4
+; O3-NEXT: sllv $6, $1, $3
+; O3-NEXT: $BB13_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $9, 0($2)
+; O3-NEXT: and $10, $9, $4
+; O3-NEXT: bne $10, $8, $BB13_3
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: # in Loop: Header=BB13_1 Depth=1
+; O3-NEXT: and $9, $9, $7
+; O3-NEXT: or $9, $9, $6
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB13_1
+; O3-NEXT: nop
+; O3-NEXT: $BB13_3: # %entry
+; O3-NEXT: srlv $1, $10, $3
+; O3-NEXT: sll $1, $1, 24
+; O3-NEXT: sra $1, $1, 24
+; O3-NEXT: # %bb.4: # %entry
+; O3-NEXT: sll $2, $5, 24
+; O3-NEXT: sra $2, $2, 24
+; O3-NEXT: xor $1, $1, $2
+; O3-NEXT: jr $ra
+; O3-NEXT: sltiu $2, $1, 1
+;
+; MIPS32EB-LABEL: AtomicCmpSwapRes8:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: addiu $1, $zero, -4
+; MIPS32EB-NEXT: and $2, $4, $1
+; MIPS32EB-NEXT: andi $1, $4, 3
+; MIPS32EB-NEXT: xori $1, $1, 3
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 255
+; MIPS32EB-NEXT: sllv $4, $1, $3
+; MIPS32EB-NEXT: nor $7, $zero, $4
+; MIPS32EB-NEXT: andi $1, $5, 255
+; MIPS32EB-NEXT: sllv $8, $1, $3
+; MIPS32EB-NEXT: andi $1, $6, 255
+; MIPS32EB-NEXT: sllv $6, $1, $3
+; MIPS32EB-NEXT: $BB13_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $9, 0($2)
+; MIPS32EB-NEXT: and $10, $9, $4
+; MIPS32EB-NEXT: bne $10, $8, $BB13_3
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: # in Loop: Header=BB13_1 Depth=1
+; MIPS32EB-NEXT: and $9, $9, $7
+; MIPS32EB-NEXT: or $9, $9, $6
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB13_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: $BB13_3: # %entry
+; MIPS32EB-NEXT: srlv $1, $10, $3
+; MIPS32EB-NEXT: sll $1, $1, 24
+; MIPS32EB-NEXT: sra $1, $1, 24
+; MIPS32EB-NEXT: # %bb.4: # %entry
+; MIPS32EB-NEXT: sll $2, $5, 24
+; MIPS32EB-NEXT: sra $2, $2, 24
+; MIPS32EB-NEXT: xor $1, $1, $2
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sltiu $2, $1, 1
entry:
%0 = cmpxchg i8* %ptr, i8 %oldval, i8 %newval monotonic monotonic
%1 = extractvalue { i8, i1 } %0, 1
ret i1 %1
-; ALL-LABEL: AtomicCmpSwapRes8
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $4, $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $4, 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 3
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 255
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: andi $[[R9:[0-9]+]], $5, 255
-; ALL: sllv $[[R10:[0-9]+]], $[[R9]], $[[R5]]
-; ALL: andi $[[R11:[0-9]+]], $6, 255
-; ALL: sllv $[[R12:[0-9]+]], $[[R11]], $[[R5]]
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R13:[0-9]+]], 0($[[R2]])
-; ALL: and $[[R14:[0-9]+]], $[[R13]], $[[R7]]
-; NOT-MICROMIPS: bne $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MICROMIPS: bne $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-; MIPSR6: bnec $[[R14]], $[[R10]], [[BB1:(\$|\.L)[A-Z_0-9]+]]
-
-; ALL: and $[[R15:[0-9]+]], $[[R13]], $[[R8]]
-; ALL: or $[[R16:[0-9]+]], $[[R15]], $[[R12]]
-; ALL: sc $[[R16]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R16]], [[BB0]]
-; MICROMIPS: beqzc $[[R16]], [[BB0]]
-; MIPSR6: beqzc $[[R16]], [[BB0]]
-
-; ALL: [[BB1]]:
-; ALL: srlv $[[R17:[0-9]+]], $[[R14]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R18:[0-9]+]], $[[R17]], 24
-; NO-SEB-SEH: sra $[[R19:[0-9]+]], $[[R18]], 24
-
; FIXME: -march=mips produces a redundant sign extension here...
-; NO-SEB-SEH: sll $[[R20:[0-9]+]], $5, 24
-; NO-SEB-SEH: sra $[[R20]], $[[R20]], 24
-
-; HAS-SEB-SEH: seb $[[R19:[0-9]+]], $[[R17]]
-
; FIXME: ...Leading to this split check.
-; NO-SEB-SEH: xor $[[R21:[0-9]+]], $[[R19]], $[[R20]]
-; HAS-SEB-SEH: xor $[[R21:[0-9]+]], $[[R19]], $5
-; ALL: sltiu $2, $[[R21]], 1
}
; Check one i16 so that we cover the seh sign extend
@z = common global i16 0, align 1
define signext i16 @AtomicLoadAdd16(i16 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadAdd16:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(z)($1)
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $2, $1, $2
+; MIPS32-NEXT: andi $1, $1, 3
+; MIPS32-NEXT: sll $3, $1, 3
+; MIPS32-NEXT: ori $1, $zero, 65535
+; MIPS32-NEXT: sllv $5, $1, $3
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: sllv $4, $4, $3
+; MIPS32-NEXT: $BB14_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $7, 0($2)
+; MIPS32-NEXT: addu $8, $7, $4
+; MIPS32-NEXT: and $8, $8, $5
+; MIPS32-NEXT: and $9, $7, $6
+; MIPS32-NEXT: or $9, $9, $8
+; MIPS32-NEXT: sc $9, 0($2)
+; MIPS32-NEXT: beqz $9, $BB14_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: and $1, $7, $5
+; MIPS32-NEXT: srlv $1, $1, $3
+; MIPS32-NEXT: sll $1, $1, 16
+; MIPS32-NEXT: sra $1, $1, 16
+; MIPS32-NEXT: # %bb.3: # %entry
+; MIPS32-NEXT: sll $1, $1, 16
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: sra $2, $1, 16
+;
+; MIPS32O0-LABEL: AtomicLoadAdd16:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(z)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, -4
+; MIPS32O0-NEXT: and $25, $2, $25
+; MIPS32O0-NEXT: andi $2, $2, 3
+; MIPS32O0-NEXT: sll $2, $2, 3
+; MIPS32O0-NEXT: ori $1, $zero, 65535
+; MIPS32O0-NEXT: sllv $1, $1, $2
+; MIPS32O0-NEXT: nor $3, $zero, $1
+; MIPS32O0-NEXT: sllv $4, $4, $2
+; MIPS32O0-NEXT: $BB14_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $6, 0($25)
+; MIPS32O0-NEXT: addu $7, $6, $4
+; MIPS32O0-NEXT: and $7, $7, $1
+; MIPS32O0-NEXT: and $8, $6, $3
+; MIPS32O0-NEXT: or $8, $8, $7
+; MIPS32O0-NEXT: sc $8, 0($25)
+; MIPS32O0-NEXT: beqz $8, $BB14_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: and $5, $6, $1
+; MIPS32O0-NEXT: srlv $5, $5, $2
+; MIPS32O0-NEXT: sll $5, $5, 16
+; MIPS32O0-NEXT: sra $5, $5, 16
+; MIPS32O0-NEXT: # %bb.3: # %entry
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.4: # %entry
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 16
+; MIPS32O0-NEXT: sra $2, $2, 16
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadAdd16:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(z)($1)
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $2, $1, $2
+; MIPS32R2-NEXT: andi $1, $1, 3
+; MIPS32R2-NEXT: sll $3, $1, 3
+; MIPS32R2-NEXT: ori $1, $zero, 65535
+; MIPS32R2-NEXT: sllv $5, $1, $3
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: sllv $4, $4, $3
+; MIPS32R2-NEXT: $BB14_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $7, 0($2)
+; MIPS32R2-NEXT: addu $8, $7, $4
+; MIPS32R2-NEXT: and $8, $8, $5
+; MIPS32R2-NEXT: and $9, $7, $6
+; MIPS32R2-NEXT: or $9, $9, $8
+; MIPS32R2-NEXT: sc $9, 0($2)
+; MIPS32R2-NEXT: beqz $9, $BB14_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: and $1, $7, $5
+; MIPS32R2-NEXT: srlv $1, $1, $3
+; MIPS32R2-NEXT: seh $1, $1
+; MIPS32R2-NEXT: # %bb.3: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: seh $2, $1
+;
+; MIPS32R6-LABEL: AtomicLoadAdd16:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(z)($1)
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $2, $1, $2
+; MIPS32R6-NEXT: andi $1, $1, 3
+; MIPS32R6-NEXT: sll $3, $1, 3
+; MIPS32R6-NEXT: ori $1, $zero, 65535
+; MIPS32R6-NEXT: sllv $5, $1, $3
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: sllv $4, $4, $3
+; MIPS32R6-NEXT: $BB14_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $7, 0($2)
+; MIPS32R6-NEXT: addu $8, $7, $4
+; MIPS32R6-NEXT: and $8, $8, $5
+; MIPS32R6-NEXT: and $9, $7, $6
+; MIPS32R6-NEXT: or $9, $9, $8
+; MIPS32R6-NEXT: sc $9, 0($2)
+; MIPS32R6-NEXT: beqzc $9, $BB14_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: and $1, $7, $5
+; MIPS32R6-NEXT: srlv $1, $1, $3
+; MIPS32R6-NEXT: seh $1, $1
+; MIPS32R6-NEXT: # %bb.3: # %entry
+; MIPS32R6-NEXT: jr $ra
+; MIPS32R6-NEXT: seh $2, $1
+;
+; MIPS32R6O0-LABEL: AtomicLoadAdd16:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(z)($2)
+; MIPS32R6O0-NEXT: addiu $1, $zero, -4
+; MIPS32R6O0-NEXT: and $1, $2, $1
+; MIPS32R6O0-NEXT: andi $2, $2, 3
+; MIPS32R6O0-NEXT: sll $2, $2, 3
+; MIPS32R6O0-NEXT: ori $3, $zero, 65535
+; MIPS32R6O0-NEXT: sllv $3, $3, $2
+; MIPS32R6O0-NEXT: nor $5, $zero, $3
+; MIPS32R6O0-NEXT: sllv $4, $4, $2
+; MIPS32R6O0-NEXT: $BB14_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $7, 0($1)
+; MIPS32R6O0-NEXT: addu $8, $7, $4
+; MIPS32R6O0-NEXT: and $8, $8, $3
+; MIPS32R6O0-NEXT: and $9, $7, $5
+; MIPS32R6O0-NEXT: or $9, $9, $8
+; MIPS32R6O0-NEXT: sc $9, 0($1)
+; MIPS32R6O0-NEXT: beqzc $9, $BB14_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: and $6, $7, $3
+; MIPS32R6O0-NEXT: srlv $6, $6, $2
+; MIPS32R6O0-NEXT: seh $6, $6
+; MIPS32R6O0-NEXT: # %bb.3: # %entry
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $6, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.4: # %entry
+; MIPS32R6O0-NEXT: lw $1, 0($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seh $2, $1
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadAdd16:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS4-NEXT: ld $1, %got_disp(z)($1)
+; MIPS4-NEXT: daddiu $2, $zero, -4
+; MIPS4-NEXT: and $2, $1, $2
+; MIPS4-NEXT: andi $1, $1, 3
+; MIPS4-NEXT: sll $3, $1, 3
+; MIPS4-NEXT: ori $1, $zero, 65535
+; MIPS4-NEXT: sllv $5, $1, $3
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: sllv $4, $4, $3
+; MIPS4-NEXT: .LBB14_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $7, 0($2)
+; MIPS4-NEXT: addu $8, $7, $4
+; MIPS4-NEXT: and $8, $8, $5
+; MIPS4-NEXT: and $9, $7, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($2)
+; MIPS4-NEXT: beqz $9, .LBB14_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: and $1, $7, $5
+; MIPS4-NEXT: srlv $1, $1, $3
+; MIPS4-NEXT: sll $1, $1, 16
+; MIPS4-NEXT: sra $1, $1, 16
+; MIPS4-NEXT: # %bb.3: # %entry
+; MIPS4-NEXT: sll $1, $1, 16
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: sra $2, $1, 16
+;
+; MIPS64-LABEL: AtomicLoadAdd16:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64-NEXT: ld $1, %got_disp(z)($1)
+; MIPS64-NEXT: daddiu $2, $zero, -4
+; MIPS64-NEXT: and $2, $1, $2
+; MIPS64-NEXT: andi $1, $1, 3
+; MIPS64-NEXT: sll $3, $1, 3
+; MIPS64-NEXT: ori $1, $zero, 65535
+; MIPS64-NEXT: sllv $5, $1, $3
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: sllv $4, $4, $3
+; MIPS64-NEXT: .LBB14_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $7, 0($2)
+; MIPS64-NEXT: addu $8, $7, $4
+; MIPS64-NEXT: and $8, $8, $5
+; MIPS64-NEXT: and $9, $7, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($2)
+; MIPS64-NEXT: beqz $9, .LBB14_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: and $1, $7, $5
+; MIPS64-NEXT: srlv $1, $1, $3
+; MIPS64-NEXT: sll $1, $1, 16
+; MIPS64-NEXT: sra $1, $1, 16
+; MIPS64-NEXT: # %bb.3: # %entry
+; MIPS64-NEXT: sll $1, $1, 16
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: sra $2, $1, 16
+;
+; MIPS64R2-LABEL: AtomicLoadAdd16:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R2-NEXT: ld $1, %got_disp(z)($1)
+; MIPS64R2-NEXT: daddiu $2, $zero, -4
+; MIPS64R2-NEXT: and $2, $1, $2
+; MIPS64R2-NEXT: andi $1, $1, 3
+; MIPS64R2-NEXT: sll $3, $1, 3
+; MIPS64R2-NEXT: ori $1, $zero, 65535
+; MIPS64R2-NEXT: sllv $5, $1, $3
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: sllv $4, $4, $3
+; MIPS64R2-NEXT: .LBB14_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $7, 0($2)
+; MIPS64R2-NEXT: addu $8, $7, $4
+; MIPS64R2-NEXT: and $8, $8, $5
+; MIPS64R2-NEXT: and $9, $7, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($2)
+; MIPS64R2-NEXT: beqz $9, .LBB14_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: and $1, $7, $5
+; MIPS64R2-NEXT: srlv $1, $1, $3
+; MIPS64R2-NEXT: seh $1, $1
+; MIPS64R2-NEXT: # %bb.3: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: seh $2, $1
+;
+; MIPS64R6-LABEL: AtomicLoadAdd16:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R6-NEXT: ld $1, %got_disp(z)($1)
+; MIPS64R6-NEXT: daddiu $2, $zero, -4
+; MIPS64R6-NEXT: and $2, $1, $2
+; MIPS64R6-NEXT: andi $1, $1, 3
+; MIPS64R6-NEXT: sll $3, $1, 3
+; MIPS64R6-NEXT: ori $1, $zero, 65535
+; MIPS64R6-NEXT: sllv $5, $1, $3
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: sllv $4, $4, $3
+; MIPS64R6-NEXT: .LBB14_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $7, 0($2)
+; MIPS64R6-NEXT: addu $8, $7, $4
+; MIPS64R6-NEXT: and $8, $8, $5
+; MIPS64R6-NEXT: and $9, $7, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($2)
+; MIPS64R6-NEXT: beqzc $9, .LBB14_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: and $1, $7, $5
+; MIPS64R6-NEXT: srlv $1, $1, $3
+; MIPS64R6-NEXT: seh $1, $1
+; MIPS64R6-NEXT: # %bb.3: # %entry
+; MIPS64R6-NEXT: jr $ra
+; MIPS64R6-NEXT: seh $2, $1
+;
+; MIPS64R6O0-LABEL: AtomicLoadAdd16:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd16)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(z)($1)
+; MIPS64R6O0-NEXT: daddiu $4, $zero, -4
+; MIPS64R6O0-NEXT: and $4, $1, $4
+; MIPS64R6O0-NEXT: andi $3, $1, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 2
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $5, $zero, 65535
+; MIPS64R6O0-NEXT: sllv $5, $5, $3
+; MIPS64R6O0-NEXT: nor $6, $zero, $5
+; MIPS64R6O0-NEXT: sllv $2, $2, $3
+; MIPS64R6O0-NEXT: .LBB14_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $8, 0($4)
+; MIPS64R6O0-NEXT: addu $9, $8, $2
+; MIPS64R6O0-NEXT: and $9, $9, $5
+; MIPS64R6O0-NEXT: and $10, $8, $6
+; MIPS64R6O0-NEXT: or $10, $10, $9
+; MIPS64R6O0-NEXT: sc $10, 0($4)
+; MIPS64R6O0-NEXT: beqzc $10, .LBB14_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: and $7, $8, $5
+; MIPS64R6O0-NEXT: srlv $7, $7, $3
+; MIPS64R6O0-NEXT: seh $7, $7
+; MIPS64R6O0-NEXT: # %bb.3: # %entry
+; MIPS64R6O0-NEXT: sw $7, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.4: # %entry
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seh $2, $1
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadAdd16:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(z)($2)
+; MM32-NEXT: addiu $2, $zero, -4
+; MM32-NEXT: and $2, $1, $2
+; MM32-NEXT: andi $1, $1, 3
+; MM32-NEXT: sll $3, $1, 3
+; MM32-NEXT: ori $1, $zero, 65535
+; MM32-NEXT: sllv $5, $1, $3
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: sllv $4, $4, $3
+; MM32-NEXT: $BB14_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $7, 0($2)
+; MM32-NEXT: addu $8, $7, $4
+; MM32-NEXT: and $8, $8, $5
+; MM32-NEXT: and $9, $7, $6
+; MM32-NEXT: or $9, $9, $8
+; MM32-NEXT: sc $9, 0($2)
+; MM32-NEXT: beqzc $9, $BB14_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: and $1, $7, $5
+; MM32-NEXT: srlv $1, $1, $3
+; MM32-NEXT: seh $1, $1
+; MM32-NEXT: # %bb.3: # %entry
+; MM32-NEXT: jr $ra
+; MM32-NEXT: seh $2, $1
+;
+; O1-LABEL: AtomicLoadAdd16:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(z)($1)
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $2, $1, $2
+; O1-NEXT: andi $1, $1, 3
+; O1-NEXT: sll $3, $1, 3
+; O1-NEXT: ori $1, $zero, 65535
+; O1-NEXT: sllv $5, $1, $3
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: sllv $4, $4, $3
+; O1-NEXT: $BB14_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $7, 0($2)
+; O1-NEXT: addu $8, $7, $4
+; O1-NEXT: and $8, $8, $5
+; O1-NEXT: and $9, $7, $6
+; O1-NEXT: or $9, $9, $8
+; O1-NEXT: sc $9, 0($2)
+; O1-NEXT: beqz $9, $BB14_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: and $1, $7, $5
+; O1-NEXT: srlv $1, $1, $3
+; O1-NEXT: sll $1, $1, 16
+; O1-NEXT: sra $1, $1, 16
+; O1-NEXT: # %bb.3: # %entry
+; O1-NEXT: sll $1, $1, 16
+; O1-NEXT: jr $ra
+; O1-NEXT: sra $2, $1, 16
+;
+; O2-LABEL: AtomicLoadAdd16:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(z)($1)
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $2, $1, $2
+; O2-NEXT: andi $1, $1, 3
+; O2-NEXT: sll $3, $1, 3
+; O2-NEXT: ori $1, $zero, 65535
+; O2-NEXT: sllv $5, $1, $3
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: sllv $4, $4, $3
+; O2-NEXT: $BB14_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $7, 0($2)
+; O2-NEXT: addu $8, $7, $4
+; O2-NEXT: and $8, $8, $5
+; O2-NEXT: and $9, $7, $6
+; O2-NEXT: or $9, $9, $8
+; O2-NEXT: sc $9, 0($2)
+; O2-NEXT: beqz $9, $BB14_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: and $1, $7, $5
+; O2-NEXT: srlv $1, $1, $3
+; O2-NEXT: sll $1, $1, 16
+; O2-NEXT: sra $1, $1, 16
+; O2-NEXT: # %bb.3: # %entry
+; O2-NEXT: sll $1, $1, 16
+; O2-NEXT: jr $ra
+; O2-NEXT: sra $2, $1, 16
+;
+; O3-LABEL: AtomicLoadAdd16:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: lw $1, %got(z)($1)
+; O3-NEXT: and $2, $1, $2
+; O3-NEXT: andi $1, $1, 3
+; O3-NEXT: sll $3, $1, 3
+; O3-NEXT: ori $1, $zero, 65535
+; O3-NEXT: sllv $5, $1, $3
+; O3-NEXT: sllv $4, $4, $3
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: $BB14_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $7, 0($2)
+; O3-NEXT: addu $8, $7, $4
+; O3-NEXT: and $8, $8, $5
+; O3-NEXT: and $9, $7, $6
+; O3-NEXT: or $9, $9, $8
+; O3-NEXT: sc $9, 0($2)
+; O3-NEXT: beqz $9, $BB14_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: and $1, $7, $5
+; O3-NEXT: srlv $1, $1, $3
+; O3-NEXT: sll $1, $1, 16
+; O3-NEXT: sra $1, $1, 16
+; O3-NEXT: # %bb.3: # %entry
+; O3-NEXT: sll $1, $1, 16
+; O3-NEXT: jr $ra
+; O3-NEXT: sra $2, $1, 16
+;
+; MIPS32EB-LABEL: AtomicLoadAdd16:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(z)($1)
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $2, $1, $2
+; MIPS32EB-NEXT: andi $1, $1, 3
+; MIPS32EB-NEXT: xori $1, $1, 2
+; MIPS32EB-NEXT: sll $3, $1, 3
+; MIPS32EB-NEXT: ori $1, $zero, 65535
+; MIPS32EB-NEXT: sllv $5, $1, $3
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: sllv $4, $4, $3
+; MIPS32EB-NEXT: $BB14_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $7, 0($2)
+; MIPS32EB-NEXT: addu $8, $7, $4
+; MIPS32EB-NEXT: and $8, $8, $5
+; MIPS32EB-NEXT: and $9, $7, $6
+; MIPS32EB-NEXT: or $9, $9, $8
+; MIPS32EB-NEXT: sc $9, 0($2)
+; MIPS32EB-NEXT: beqz $9, $BB14_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: and $1, $7, $5
+; MIPS32EB-NEXT: srlv $1, $1, $3
+; MIPS32EB-NEXT: sll $1, $1, 16
+; MIPS32EB-NEXT: sra $1, $1, 16
+; MIPS32EB-NEXT: # %bb.3: # %entry
+; MIPS32EB-NEXT: sll $1, $1, 16
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: sra $2, $1, 16
entry:
%0 = atomicrmw add i16* @z, i16 %incr monotonic
ret i16 %0
-; ALL-LABEL: AtomicLoadAdd16:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(z)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(z)(
-
-; ALL: addiu $[[R1:[0-9]+]], $zero, -4
-; ALL: and $[[R2:[0-9]+]], $[[R0]], $[[R1]]
-; ALL: andi $[[R3:[0-9]+]], $[[R0]], 3
-; CHECK-EB: xori $[[R4:[0-9]+]], $[[R3]], 2
-; CHECK-EB: sll $[[R5:[0-9]+]], $[[R4]], 3
-; CHECK-EL: sll $[[R5:[0-9]+]], $[[R3]], 3
-; ALL: ori $[[R6:[0-9]+]], $zero, 65535
-; ALL: sllv $[[R7:[0-9]+]], $[[R6]], $[[R5]]
-; ALL: nor $[[R8:[0-9]+]], $zero, $[[R7]]
-; ALL: sllv $[[R9:[0-9]+]], $4, $[[R5]]
-
-; O0: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; O0: ld $[[R10:[0-9]+]]
-; O0-NEXT: ll $[[R11:[0-9]+]], 0($[[R10]])
-
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R12:[0-9]+]], 0($[[R2]])
-; ALL: addu $[[R13:[0-9]+]], $[[R12]], $[[R9]]
-; ALL: and $[[R14:[0-9]+]], $[[R13]], $[[R7]]
-; ALL: and $[[R15:[0-9]+]], $[[R12]], $[[R8]]
-; ALL: or $[[R16:[0-9]+]], $[[R15]], $[[R14]]
-; ALL: sc $[[R16]], 0($[[R2]])
-; NOT-MICROMIPS: beqz $[[R16]], [[BB0]]
-; MICROMIPS: beqzc $[[R16]], [[BB0]]
-; MIPSR6: beqzc $[[R16]], [[BB0]]
-
-; ALL: and $[[R17:[0-9]+]], $[[R12]], $[[R7]]
-; ALL: srlv $[[R18:[0-9]+]], $[[R17]], $[[R5]]
-
-; NO-SEB-SEH: sll $[[R19:[0-9]+]], $[[R18]], 16
-; NO-SEB-SEH: sra $2, $[[R19]], 16
-
-; MIPS32R2: seh $2, $[[R18]]
}
; Test that the i16 return value from cmpxchg is recognised as signed,
; The rest of the functions here are testing the atomic expansion, so
; we just match the end of the function.
define {i16, i1} @foo(i16* %addr, i16 %l, i16 %r, i16 %new) {
+; MIPS32-LABEL: foo:
+; MIPS32: # %bb.0:
+; MIPS32-NEXT: addu $1, $5, $6
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: addiu $2, $zero, -4
+; MIPS32-NEXT: and $3, $4, $2
+; MIPS32-NEXT: andi $2, $4, 3
+; MIPS32-NEXT: sll $4, $2, 3
+; MIPS32-NEXT: ori $2, $zero, 65535
+; MIPS32-NEXT: sllv $5, $2, $4
+; MIPS32-NEXT: nor $6, $zero, $5
+; MIPS32-NEXT: andi $2, $1, 65535
+; MIPS32-NEXT: sllv $8, $2, $4
+; MIPS32-NEXT: andi $2, $7, 65535
+; MIPS32-NEXT: sllv $7, $2, $4
+; MIPS32-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $9, 0($3)
+; MIPS32-NEXT: and $10, $9, $5
+; MIPS32-NEXT: bne $10, $8, $BB15_3
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32-NEXT: and $9, $9, $6
+; MIPS32-NEXT: or $9, $9, $7
+; MIPS32-NEXT: sc $9, 0($3)
+; MIPS32-NEXT: beqz $9, $BB15_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: $BB15_3:
+; MIPS32-NEXT: srlv $2, $10, $4
+; MIPS32-NEXT: sll $2, $2, 16
+; MIPS32-NEXT: sra $2, $2, 16
+; MIPS32-NEXT: # %bb.4:
+; MIPS32-NEXT: sll $1, $1, 16
+; MIPS32-NEXT: sra $1, $1, 16
+; MIPS32-NEXT: xor $1, $2, $1
+; MIPS32-NEXT: sltiu $3, $1, 1
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: foo:
+; MIPS32O0: # %bb.0:
+; MIPS32O0-NEXT: addiu $sp, $sp, -8
+; MIPS32O0-NEXT: .cfi_def_cfa_offset 8
+; MIPS32O0-NEXT: addu $5, $5, $6
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: addiu $6, $zero, -4
+; MIPS32O0-NEXT: and $6, $4, $6
+; MIPS32O0-NEXT: andi $4, $4, 3
+; MIPS32O0-NEXT: sll $4, $4, 3
+; MIPS32O0-NEXT: ori $1, $zero, 65535
+; MIPS32O0-NEXT: sllv $1, $1, $4
+; MIPS32O0-NEXT: nor $2, $zero, $1
+; MIPS32O0-NEXT: andi $3, $5, 65535
+; MIPS32O0-NEXT: sllv $3, $3, $4
+; MIPS32O0-NEXT: andi $7, $7, 65535
+; MIPS32O0-NEXT: sllv $7, $7, $4
+; MIPS32O0-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $9, 0($6)
+; MIPS32O0-NEXT: and $10, $9, $1
+; MIPS32O0-NEXT: bne $10, $3, $BB15_3
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32O0-NEXT: and $9, $9, $2
+; MIPS32O0-NEXT: or $9, $9, $7
+; MIPS32O0-NEXT: sc $9, 0($6)
+; MIPS32O0-NEXT: beqz $9, $BB15_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: $BB15_3:
+; MIPS32O0-NEXT: srlv $8, $10, $4
+; MIPS32O0-NEXT: sll $8, $8, 16
+; MIPS32O0-NEXT: sra $8, $8, 16
+; MIPS32O0-NEXT: # %bb.4:
+; MIPS32O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $8, 0($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: # %bb.5:
+; MIPS32O0-NEXT: lw $1, 4($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: sll $2, $1, 16
+; MIPS32O0-NEXT: sra $2, $2, 16
+; MIPS32O0-NEXT: lw $3, 0($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: xor $2, $3, $2
+; MIPS32O0-NEXT: sltiu $3, $2, 1
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: lw $2, 0($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: addiu $sp, $sp, 8
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: foo:
+; MIPS32R2: # %bb.0:
+; MIPS32R2-NEXT: addu $1, $5, $6
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: addiu $2, $zero, -4
+; MIPS32R2-NEXT: and $3, $4, $2
+; MIPS32R2-NEXT: andi $2, $4, 3
+; MIPS32R2-NEXT: sll $4, $2, 3
+; MIPS32R2-NEXT: ori $2, $zero, 65535
+; MIPS32R2-NEXT: sllv $5, $2, $4
+; MIPS32R2-NEXT: nor $6, $zero, $5
+; MIPS32R2-NEXT: andi $2, $1, 65535
+; MIPS32R2-NEXT: sllv $8, $2, $4
+; MIPS32R2-NEXT: andi $2, $7, 65535
+; MIPS32R2-NEXT: sllv $7, $2, $4
+; MIPS32R2-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $9, 0($3)
+; MIPS32R2-NEXT: and $10, $9, $5
+; MIPS32R2-NEXT: bne $10, $8, $BB15_3
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32R2-NEXT: and $9, $9, $6
+; MIPS32R2-NEXT: or $9, $9, $7
+; MIPS32R2-NEXT: sc $9, 0($3)
+; MIPS32R2-NEXT: beqz $9, $BB15_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: $BB15_3:
+; MIPS32R2-NEXT: srlv $2, $10, $4
+; MIPS32R2-NEXT: seh $2, $2
+; MIPS32R2-NEXT: # %bb.4:
+; MIPS32R2-NEXT: seh $1, $1
+; MIPS32R2-NEXT: xor $1, $2, $1
+; MIPS32R2-NEXT: sltiu $3, $1, 1
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: foo:
+; MIPS32R6: # %bb.0:
+; MIPS32R6-NEXT: addu $1, $5, $6
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: addiu $2, $zero, -4
+; MIPS32R6-NEXT: and $3, $4, $2
+; MIPS32R6-NEXT: andi $2, $4, 3
+; MIPS32R6-NEXT: sll $4, $2, 3
+; MIPS32R6-NEXT: ori $2, $zero, 65535
+; MIPS32R6-NEXT: sllv $5, $2, $4
+; MIPS32R6-NEXT: nor $6, $zero, $5
+; MIPS32R6-NEXT: andi $2, $1, 65535
+; MIPS32R6-NEXT: sllv $8, $2, $4
+; MIPS32R6-NEXT: andi $2, $7, 65535
+; MIPS32R6-NEXT: sllv $7, $2, $4
+; MIPS32R6-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $9, 0($3)
+; MIPS32R6-NEXT: and $10, $9, $5
+; MIPS32R6-NEXT: bnec $10, $8, $BB15_3
+; MIPS32R6-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32R6-NEXT: and $9, $9, $6
+; MIPS32R6-NEXT: or $9, $9, $7
+; MIPS32R6-NEXT: sc $9, 0($3)
+; MIPS32R6-NEXT: beqzc $9, $BB15_1
+; MIPS32R6-NEXT: $BB15_3:
+; MIPS32R6-NEXT: srlv $2, $10, $4
+; MIPS32R6-NEXT: seh $2, $2
+; MIPS32R6-NEXT: # %bb.4:
+; MIPS32R6-NEXT: seh $1, $1
+; MIPS32R6-NEXT: xor $1, $2, $1
+; MIPS32R6-NEXT: sltiu $3, $1, 1
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: foo:
+; MIPS32R6O0: # %bb.0:
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -24
+; MIPS32R6O0-NEXT: .cfi_def_cfa_offset 24
+; MIPS32R6O0-NEXT: move $1, $7
+; MIPS32R6O0-NEXT: move $2, $6
+; MIPS32R6O0-NEXT: move $3, $5
+; MIPS32R6O0-NEXT: move $8, $4
+; MIPS32R6O0-NEXT: addu $5, $5, $6
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: addiu $6, $zero, -4
+; MIPS32R6O0-NEXT: and $6, $4, $6
+; MIPS32R6O0-NEXT: andi $4, $4, 3
+; MIPS32R6O0-NEXT: sll $4, $4, 3
+; MIPS32R6O0-NEXT: ori $9, $zero, 65535
+; MIPS32R6O0-NEXT: sllv $9, $9, $4
+; MIPS32R6O0-NEXT: nor $10, $zero, $9
+; MIPS32R6O0-NEXT: andi $11, $5, 65535
+; MIPS32R6O0-NEXT: sllv $11, $11, $4
+; MIPS32R6O0-NEXT: andi $7, $7, 65535
+; MIPS32R6O0-NEXT: sllv $7, $7, $4
+; MIPS32R6O0-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $13, 0($6)
+; MIPS32R6O0-NEXT: and $14, $13, $9
+; MIPS32R6O0-NEXT: bnec $14, $11, $BB15_3
+; MIPS32R6O0-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32R6O0-NEXT: and $13, $13, $10
+; MIPS32R6O0-NEXT: or $13, $13, $7
+; MIPS32R6O0-NEXT: sc $13, 0($6)
+; MIPS32R6O0-NEXT: beqzc $13, $BB15_1
+; MIPS32R6O0-NEXT: $BB15_3:
+; MIPS32R6O0-NEXT: srlv $12, $14, $4
+; MIPS32R6O0-NEXT: seh $12, $12
+; MIPS32R6O0-NEXT: # %bb.4:
+; MIPS32R6O0-NEXT: sw $12, 20($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $3, 16($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $8, 12($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $5, 8($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $1, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $2, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: # %bb.5:
+; MIPS32R6O0-NEXT: lw $1, 8($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: seh $2, $1
+; MIPS32R6O0-NEXT: lw $3, 20($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: xor $2, $3, $2
+; MIPS32R6O0-NEXT: sltiu $3, $2, 1
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: lw $2, 20($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 24
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: foo:
+; MIPS4: # %bb.0:
+; MIPS4-NEXT: sll $1, $6, 0
+; MIPS4-NEXT: sll $2, $5, 0
+; MIPS4-NEXT: addu $1, $2, $1
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: sll $2, $7, 0
+; MIPS4-NEXT: daddiu $3, $zero, -4
+; MIPS4-NEXT: and $3, $4, $3
+; MIPS4-NEXT: andi $4, $4, 3
+; MIPS4-NEXT: sll $4, $4, 3
+; MIPS4-NEXT: ori $5, $zero, 65535
+; MIPS4-NEXT: sllv $5, $5, $4
+; MIPS4-NEXT: nor $6, $zero, $5
+; MIPS4-NEXT: andi $7, $1, 65535
+; MIPS4-NEXT: sllv $7, $7, $4
+; MIPS4-NEXT: andi $2, $2, 65535
+; MIPS4-NEXT: sllv $8, $2, $4
+; MIPS4-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $9, 0($3)
+; MIPS4-NEXT: and $10, $9, $5
+; MIPS4-NEXT: bne $10, $7, .LBB15_3
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS4-NEXT: and $9, $9, $6
+; MIPS4-NEXT: or $9, $9, $8
+; MIPS4-NEXT: sc $9, 0($3)
+; MIPS4-NEXT: beqz $9, .LBB15_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: .LBB15_3:
+; MIPS4-NEXT: srlv $2, $10, $4
+; MIPS4-NEXT: sll $2, $2, 16
+; MIPS4-NEXT: sra $2, $2, 16
+; MIPS4-NEXT: # %bb.4:
+; MIPS4-NEXT: sll $1, $1, 16
+; MIPS4-NEXT: sra $1, $1, 16
+; MIPS4-NEXT: xor $1, $2, $1
+; MIPS4-NEXT: sltiu $3, $1, 1
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: foo:
+; MIPS64: # %bb.0:
+; MIPS64-NEXT: sll $1, $6, 0
+; MIPS64-NEXT: sll $2, $5, 0
+; MIPS64-NEXT: addu $1, $2, $1
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: sll $2, $7, 0
+; MIPS64-NEXT: daddiu $3, $zero, -4
+; MIPS64-NEXT: and $3, $4, $3
+; MIPS64-NEXT: andi $4, $4, 3
+; MIPS64-NEXT: sll $4, $4, 3
+; MIPS64-NEXT: ori $5, $zero, 65535
+; MIPS64-NEXT: sllv $5, $5, $4
+; MIPS64-NEXT: nor $6, $zero, $5
+; MIPS64-NEXT: andi $7, $1, 65535
+; MIPS64-NEXT: sllv $7, $7, $4
+; MIPS64-NEXT: andi $2, $2, 65535
+; MIPS64-NEXT: sllv $8, $2, $4
+; MIPS64-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $9, 0($3)
+; MIPS64-NEXT: and $10, $9, $5
+; MIPS64-NEXT: bne $10, $7, .LBB15_3
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS64-NEXT: and $9, $9, $6
+; MIPS64-NEXT: or $9, $9, $8
+; MIPS64-NEXT: sc $9, 0($3)
+; MIPS64-NEXT: beqz $9, .LBB15_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: .LBB15_3:
+; MIPS64-NEXT: srlv $2, $10, $4
+; MIPS64-NEXT: sll $2, $2, 16
+; MIPS64-NEXT: sra $2, $2, 16
+; MIPS64-NEXT: # %bb.4:
+; MIPS64-NEXT: sll $1, $1, 16
+; MIPS64-NEXT: sra $1, $1, 16
+; MIPS64-NEXT: xor $1, $2, $1
+; MIPS64-NEXT: sltiu $3, $1, 1
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: foo:
+; MIPS64R2: # %bb.0:
+; MIPS64R2-NEXT: sll $1, $6, 0
+; MIPS64R2-NEXT: sll $2, $5, 0
+; MIPS64R2-NEXT: addu $1, $2, $1
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: sll $2, $7, 0
+; MIPS64R2-NEXT: daddiu $3, $zero, -4
+; MIPS64R2-NEXT: and $3, $4, $3
+; MIPS64R2-NEXT: andi $4, $4, 3
+; MIPS64R2-NEXT: sll $4, $4, 3
+; MIPS64R2-NEXT: ori $5, $zero, 65535
+; MIPS64R2-NEXT: sllv $5, $5, $4
+; MIPS64R2-NEXT: nor $6, $zero, $5
+; MIPS64R2-NEXT: andi $7, $1, 65535
+; MIPS64R2-NEXT: sllv $7, $7, $4
+; MIPS64R2-NEXT: andi $2, $2, 65535
+; MIPS64R2-NEXT: sllv $8, $2, $4
+; MIPS64R2-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $9, 0($3)
+; MIPS64R2-NEXT: and $10, $9, $5
+; MIPS64R2-NEXT: bne $10, $7, .LBB15_3
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS64R2-NEXT: and $9, $9, $6
+; MIPS64R2-NEXT: or $9, $9, $8
+; MIPS64R2-NEXT: sc $9, 0($3)
+; MIPS64R2-NEXT: beqz $9, .LBB15_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: .LBB15_3:
+; MIPS64R2-NEXT: srlv $2, $10, $4
+; MIPS64R2-NEXT: seh $2, $2
+; MIPS64R2-NEXT: # %bb.4:
+; MIPS64R2-NEXT: seh $1, $1
+; MIPS64R2-NEXT: xor $1, $2, $1
+; MIPS64R2-NEXT: sltiu $3, $1, 1
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: foo:
+; MIPS64R6: # %bb.0:
+; MIPS64R6-NEXT: sll $1, $6, 0
+; MIPS64R6-NEXT: sll $2, $5, 0
+; MIPS64R6-NEXT: addu $1, $2, $1
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: sll $2, $7, 0
+; MIPS64R6-NEXT: daddiu $3, $zero, -4
+; MIPS64R6-NEXT: and $3, $4, $3
+; MIPS64R6-NEXT: andi $4, $4, 3
+; MIPS64R6-NEXT: sll $4, $4, 3
+; MIPS64R6-NEXT: ori $5, $zero, 65535
+; MIPS64R6-NEXT: sllv $5, $5, $4
+; MIPS64R6-NEXT: nor $6, $zero, $5
+; MIPS64R6-NEXT: andi $7, $1, 65535
+; MIPS64R6-NEXT: sllv $7, $7, $4
+; MIPS64R6-NEXT: andi $2, $2, 65535
+; MIPS64R6-NEXT: sllv $8, $2, $4
+; MIPS64R6-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $9, 0($3)
+; MIPS64R6-NEXT: and $10, $9, $5
+; MIPS64R6-NEXT: bnec $10, $7, .LBB15_3
+; MIPS64R6-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS64R6-NEXT: and $9, $9, $6
+; MIPS64R6-NEXT: or $9, $9, $8
+; MIPS64R6-NEXT: sc $9, 0($3)
+; MIPS64R6-NEXT: beqzc $9, .LBB15_1
+; MIPS64R6-NEXT: .LBB15_3:
+; MIPS64R6-NEXT: srlv $2, $10, $4
+; MIPS64R6-NEXT: seh $2, $2
+; MIPS64R6-NEXT: # %bb.4:
+; MIPS64R6-NEXT: seh $1, $1
+; MIPS64R6-NEXT: xor $1, $2, $1
+; MIPS64R6-NEXT: sltiu $3, $1, 1
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: foo:
+; MIPS64R6O0: # %bb.0:
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: .cfi_def_cfa_offset 16
+; MIPS64R6O0-NEXT: move $1, $7
+; MIPS64R6O0-NEXT: sll $1, $1, 0
+; MIPS64R6O0-NEXT: move $2, $6
+; MIPS64R6O0-NEXT: sll $2, $2, 0
+; MIPS64R6O0-NEXT: move $3, $5
+; MIPS64R6O0-NEXT: sll $3, $3, 0
+; MIPS64R6O0-NEXT: move $5, $4
+; MIPS64R6O0-NEXT: addu $2, $3, $2
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: daddiu $6, $zero, -4
+; MIPS64R6O0-NEXT: and $6, $4, $6
+; MIPS64R6O0-NEXT: andi $3, $4, 3
+; MIPS64R6O0-NEXT: xori $3, $3, 2
+; MIPS64R6O0-NEXT: sll $3, $3, 3
+; MIPS64R6O0-NEXT: ori $8, $zero, 65535
+; MIPS64R6O0-NEXT: sllv $8, $8, $3
+; MIPS64R6O0-NEXT: nor $9, $zero, $8
+; MIPS64R6O0-NEXT: andi $10, $2, 65535
+; MIPS64R6O0-NEXT: sllv $10, $10, $3
+; MIPS64R6O0-NEXT: andi $1, $1, 65535
+; MIPS64R6O0-NEXT: sllv $1, $1, $3
+; MIPS64R6O0-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $12, 0($6)
+; MIPS64R6O0-NEXT: and $13, $12, $8
+; MIPS64R6O0-NEXT: bnec $13, $10, .LBB15_3
+; MIPS64R6O0-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS64R6O0-NEXT: and $12, $12, $9
+; MIPS64R6O0-NEXT: or $12, $12, $1
+; MIPS64R6O0-NEXT: sc $12, 0($6)
+; MIPS64R6O0-NEXT: beqzc $12, .LBB15_1
+; MIPS64R6O0-NEXT: .LBB15_3:
+; MIPS64R6O0-NEXT: srlv $11, $13, $3
+; MIPS64R6O0-NEXT: seh $11, $11
+; MIPS64R6O0-NEXT: # %bb.4:
+; MIPS64R6O0-NEXT: sw $2, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: sw $11, 8($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: sd $5, 0($sp) # 8-byte Folded Spill
+; MIPS64R6O0-NEXT: # %bb.5:
+; MIPS64R6O0-NEXT: lw $1, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: seh $2, $1
+; MIPS64R6O0-NEXT: lw $3, 8($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: xor $2, $3, $2
+; MIPS64R6O0-NEXT: sltiu $3, $2, 1
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: lw $2, 8($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: foo:
+; MM32: # %bb.0:
+; MM32-NEXT: addu16 $3, $5, $6
+; MM32-NEXT: sync
+; MM32-NEXT: addiu $1, $zero, -4
+; MM32-NEXT: and $1, $4, $1
+; MM32-NEXT: andi $2, $4, 3
+; MM32-NEXT: sll $4, $2, 3
+; MM32-NEXT: ori $2, $zero, 65535
+; MM32-NEXT: sllv $5, $2, $4
+; MM32-NEXT: nor $6, $zero, $5
+; MM32-NEXT: andi $2, $3, 65535
+; MM32-NEXT: sllv $8, $2, $4
+; MM32-NEXT: andi $2, $7, 65535
+; MM32-NEXT: sllv $7, $2, $4
+; MM32-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $9, 0($1)
+; MM32-NEXT: and $10, $9, $5
+; MM32-NEXT: bne $10, $8, $BB15_3
+; MM32-NEXT: nop
+; MM32-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MM32-NEXT: and $9, $9, $6
+; MM32-NEXT: or $9, $9, $7
+; MM32-NEXT: sc $9, 0($1)
+; MM32-NEXT: beqzc $9, $BB15_1
+; MM32-NEXT: $BB15_3:
+; MM32-NEXT: srlv $2, $10, $4
+; MM32-NEXT: seh $2, $2
+; MM32-NEXT: # %bb.4:
+; MM32-NEXT: seh $1, $3
+; MM32-NEXT: xor $1, $2, $1
+; MM32-NEXT: sltiu $3, $1, 1
+; MM32-NEXT: sync
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: foo:
+; O1: # %bb.0:
+; O1-NEXT: addu $1, $5, $6
+; O1-NEXT: sync
+; O1-NEXT: addiu $2, $zero, -4
+; O1-NEXT: and $3, $4, $2
+; O1-NEXT: andi $2, $4, 3
+; O1-NEXT: sll $4, $2, 3
+; O1-NEXT: ori $2, $zero, 65535
+; O1-NEXT: sllv $5, $2, $4
+; O1-NEXT: nor $6, $zero, $5
+; O1-NEXT: andi $2, $1, 65535
+; O1-NEXT: sllv $8, $2, $4
+; O1-NEXT: andi $2, $7, 65535
+; O1-NEXT: sllv $7, $2, $4
+; O1-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $9, 0($3)
+; O1-NEXT: and $10, $9, $5
+; O1-NEXT: bne $10, $8, $BB15_3
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; O1-NEXT: and $9, $9, $6
+; O1-NEXT: or $9, $9, $7
+; O1-NEXT: sc $9, 0($3)
+; O1-NEXT: beqz $9, $BB15_1
+; O1-NEXT: nop
+; O1-NEXT: $BB15_3:
+; O1-NEXT: srlv $2, $10, $4
+; O1-NEXT: sll $2, $2, 16
+; O1-NEXT: sra $2, $2, 16
+; O1-NEXT: # %bb.4:
+; O1-NEXT: sll $1, $1, 16
+; O1-NEXT: sra $1, $1, 16
+; O1-NEXT: xor $1, $2, $1
+; O1-NEXT: sltiu $3, $1, 1
+; O1-NEXT: sync
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: foo:
+; O2: # %bb.0:
+; O2-NEXT: addu $1, $5, $6
+; O2-NEXT: sync
+; O2-NEXT: addiu $2, $zero, -4
+; O2-NEXT: and $3, $4, $2
+; O2-NEXT: andi $2, $4, 3
+; O2-NEXT: sll $4, $2, 3
+; O2-NEXT: ori $2, $zero, 65535
+; O2-NEXT: sllv $5, $2, $4
+; O2-NEXT: nor $6, $zero, $5
+; O2-NEXT: andi $2, $1, 65535
+; O2-NEXT: sllv $8, $2, $4
+; O2-NEXT: andi $2, $7, 65535
+; O2-NEXT: sllv $7, $2, $4
+; O2-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $9, 0($3)
+; O2-NEXT: and $10, $9, $5
+; O2-NEXT: bne $10, $8, $BB15_3
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; O2-NEXT: and $9, $9, $6
+; O2-NEXT: or $9, $9, $7
+; O2-NEXT: sc $9, 0($3)
+; O2-NEXT: beqz $9, $BB15_1
+; O2-NEXT: nop
+; O2-NEXT: $BB15_3:
+; O2-NEXT: srlv $2, $10, $4
+; O2-NEXT: sll $2, $2, 16
+; O2-NEXT: sra $2, $2, 16
+; O2-NEXT: # %bb.4:
+; O2-NEXT: sll $1, $1, 16
+; O2-NEXT: sra $1, $1, 16
+; O2-NEXT: xor $1, $2, $1
+; O2-NEXT: sltiu $3, $1, 1
+; O2-NEXT: sync
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: foo:
+; O3: # %bb.0:
+; O3-NEXT: addiu $2, $zero, -4
+; O3-NEXT: addu $1, $5, $6
+; O3-NEXT: sync
+; O3-NEXT: and $3, $4, $2
+; O3-NEXT: andi $2, $4, 3
+; O3-NEXT: sll $4, $2, 3
+; O3-NEXT: ori $2, $zero, 65535
+; O3-NEXT: sllv $5, $2, $4
+; O3-NEXT: andi $2, $1, 65535
+; O3-NEXT: sll $1, $1, 16
+; O3-NEXT: sllv $8, $2, $4
+; O3-NEXT: andi $2, $7, 65535
+; O3-NEXT: nor $6, $zero, $5
+; O3-NEXT: sra $1, $1, 16
+; O3-NEXT: sllv $7, $2, $4
+; O3-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $9, 0($3)
+; O3-NEXT: and $10, $9, $5
+; O3-NEXT: bne $10, $8, $BB15_3
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; O3-NEXT: and $9, $9, $6
+; O3-NEXT: or $9, $9, $7
+; O3-NEXT: sc $9, 0($3)
+; O3-NEXT: beqz $9, $BB15_1
+; O3-NEXT: nop
+; O3-NEXT: $BB15_3:
+; O3-NEXT: srlv $2, $10, $4
+; O3-NEXT: sll $2, $2, 16
+; O3-NEXT: sra $2, $2, 16
+; O3-NEXT: # %bb.4:
+; O3-NEXT: sync
+; O3-NEXT: xor $1, $2, $1
+; O3-NEXT: jr $ra
+; O3-NEXT: sltiu $3, $1, 1
+;
+; MIPS32EB-LABEL: foo:
+; MIPS32EB: # %bb.0:
+; MIPS32EB-NEXT: addu $1, $5, $6
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: addiu $2, $zero, -4
+; MIPS32EB-NEXT: and $3, $4, $2
+; MIPS32EB-NEXT: andi $2, $4, 3
+; MIPS32EB-NEXT: xori $2, $2, 2
+; MIPS32EB-NEXT: sll $4, $2, 3
+; MIPS32EB-NEXT: ori $2, $zero, 65535
+; MIPS32EB-NEXT: sllv $5, $2, $4
+; MIPS32EB-NEXT: nor $6, $zero, $5
+; MIPS32EB-NEXT: andi $2, $1, 65535
+; MIPS32EB-NEXT: sllv $8, $2, $4
+; MIPS32EB-NEXT: andi $2, $7, 65535
+; MIPS32EB-NEXT: sllv $7, $2, $4
+; MIPS32EB-NEXT: $BB15_1: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $9, 0($3)
+; MIPS32EB-NEXT: and $10, $9, $5
+; MIPS32EB-NEXT: bne $10, $8, $BB15_3
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # in Loop: Header=BB15_1 Depth=1
+; MIPS32EB-NEXT: and $9, $9, $6
+; MIPS32EB-NEXT: or $9, $9, $7
+; MIPS32EB-NEXT: sc $9, 0($3)
+; MIPS32EB-NEXT: beqz $9, $BB15_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: $BB15_3:
+; MIPS32EB-NEXT: srlv $2, $10, $4
+; MIPS32EB-NEXT: sll $2, $2, 16
+; MIPS32EB-NEXT: sra $2, $2, 16
+; MIPS32EB-NEXT: # %bb.4:
+; MIPS32EB-NEXT: sll $1, $1, 16
+; MIPS32EB-NEXT: sra $1, $1, 16
+; MIPS32EB-NEXT: xor $1, $2, $1
+; MIPS32EB-NEXT: sltiu $3, $1, 1
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
%desired = add i16 %l, %r
%res = cmpxchg i16* %addr, i16 %desired, i16 %new seq_cst seq_cst
ret {i16, i1} %res
-
-; ALL-LABEL: foo
-; MIPSR6: addu $[[R2:[0-9]+]], $[[R1:[0-9]+]], $[[R0:[0-9]+]]
-; NOT-MICROMIPS: addu $[[R2:[0-9]+]], $[[R1:[0-9]+]], $[[R0:[0-9]+]]
-; MICROMIPS: addu16 $[[R2:[0-9]+]], $[[R1:[0-9]+]], $[[R0:[0-9]+]]
-
-; ALL: sync
-
-; ALL: andi $[[R3:[0-9]+]], $[[R2]], 65535
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R4:[0-9]+]], 0($[[R5:[0-9]+]])
-; ALL: and $[[R6:[0-9]+]], $[[R4]], $
-; ALL: and $[[R7:[0-9]+]], $[[R4]], $
-; ALL: or $[[R8:[0-9]+]], $[[R7]], $
-; ALL: sc $[[R8]], 0($[[R5]])
-; NOT-MICROMIPS: beqz $[[R8]], [[BB0]]
-; MICROMIPS: beqzc $[[R8]], [[BB0]]
-; MIPSR6: beqzc $[[R8]], [[BB0]]
-
-; ALL: srlv $[[R9:[0-9]+]], $[[R6]], $
-
-; NO-SEB-SEH: sll $[[R10:[0-9]+]], $[[R9]], 16
-; NO-SEB-SEH: sra $[[R11:[0-9]+]], $[[R10]], 16
-
-; NO-SEB-SEH: sll $[[R12:[0-9]+]], $[[R2]], 16
-; NO-SEB-SEH: sra $[[R13:[0-9]+]], $[[R12]], 16
-
-; HAS-SEB-SEH: seh $[[R11:[0-9]+]], $[[R9]]
-; HAS-SEB-SEH: seh $[[R13:[0-9]+]], $[[R2]]
-
-; ALL: xor $[[R12:[0-9]+]], $[[R11]], $[[R13]]
-; ALL: sltiu $3, $[[R12]], 1
-; ALL: sync
}
@countsint = common global i32 0, align 4
define i32 @CheckSync(i32 signext %v) nounwind noinline {
+; MIPS32-LABEL: CheckSync:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: lw $1, %got(countsint)($1)
+; MIPS32-NEXT: $BB16_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: addu $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB16_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: CheckSync:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: lw $2, %got(countsint)($2)
+; MIPS32O0-NEXT: $BB16_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: addu $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB16_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: CheckSync:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: lw $1, %got(countsint)($1)
+; MIPS32R2-NEXT: $BB16_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: addu $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB16_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: CheckSync:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: lw $1, %got(countsint)($1)
+; MIPS32R6-NEXT: $BB16_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: addu $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB16_1
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: CheckSync:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: lw $2, %got(countsint)($2)
+; MIPS32R6O0-NEXT: $BB16_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: addu $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB16_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: CheckSync:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(CheckSync)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(CheckSync)))
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: ld $1, %got_disp(countsint)($1)
+; MIPS4-NEXT: .LBB16_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: addu $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB16_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: CheckSync:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(CheckSync)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(CheckSync)))
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: ld $1, %got_disp(countsint)($1)
+; MIPS64-NEXT: .LBB16_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: addu $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB16_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: CheckSync:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(CheckSync)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(CheckSync)))
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: ld $1, %got_disp(countsint)($1)
+; MIPS64R2-NEXT: .LBB16_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: addu $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB16_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: CheckSync:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(CheckSync)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(CheckSync)))
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: ld $1, %got_disp(countsint)($1)
+; MIPS64R6-NEXT: .LBB16_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: addu $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB16_1
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: CheckSync:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(CheckSync)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(CheckSync)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: ld $1, %got_disp(countsint)($1)
+; MIPS64R6O0-NEXT: .LBB16_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: addu $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB16_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: CheckSync:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: sync
+; MM32-NEXT: lw $1, %got(countsint)($2)
+; MM32-NEXT: $BB16_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: addu16 $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB16_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: sync
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: CheckSync:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: sync
+; O1-NEXT: lw $1, %got(countsint)($1)
+; O1-NEXT: $BB16_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: addu $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB16_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: sync
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: CheckSync:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: sync
+; O2-NEXT: lw $1, %got(countsint)($1)
+; O2-NEXT: $BB16_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: addu $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB16_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: sync
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: CheckSync:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: sync
+; O3-NEXT: lw $1, %got(countsint)($1)
+; O3-NEXT: $BB16_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: addu $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB16_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: sync
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: CheckSync:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: lw $1, %got(countsint)($1)
+; MIPS32EB-NEXT: $BB16_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: addu $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB16_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
entry:
%0 = atomicrmw add i32* @countsint, i32 %v seq_cst
- ret i32 %0
-
-; ALL-LABEL: CheckSync:
-
-; ALL: sync
-; ALL: ll
-; ALL: sc
-; ALL: beq
-; ALL: sync
+ ret i32 %0
}
; make sure that this assertion in
; line 1203: assert(TargetRegisterInfo::isVirtualRegister(regB) &&
;
; it failed when MipsDAGToDAGISel::ReplaceUsesWithZeroReg replaced an
-; operand of an atomic instruction with register $zero.
+; operand of an atomic instruction with register $zero.
@a = external global i32
define i32 @zeroreg() nounwind {
+; MIPS32-LABEL: zeroreg:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: addiu $2, $zero, 0
+; MIPS32-NEXT: addiu $3, $zero, 1
+; MIPS32-NEXT: lw $1, %got(a)($1)
+; MIPS32-NEXT: $BB17_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $4, 0($1)
+; MIPS32-NEXT: bne $4, $3, $BB17_3
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32-NEXT: move $5, $2
+; MIPS32-NEXT: sc $5, 0($1)
+; MIPS32-NEXT: beqz $5, $BB17_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: $BB17_3: # %entry
+; MIPS32-NEXT: xor $1, $4, $3
+; MIPS32-NEXT: sltiu $2, $1, 1
+; MIPS32-NEXT: sync
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: zeroreg:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addiu $sp, $sp, -16
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: lw $2, %got(a)($2)
+; MIPS32O0-NEXT: addiu $25, $zero, 0
+; MIPS32O0-NEXT: addiu $1, $zero, 1
+; MIPS32O0-NEXT: lw $3, 12($sp) # 4-byte Folded Reload
+; MIPS32O0-NEXT: move $4, $1
+; MIPS32O0-NEXT: $BB17_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $5, 0($2)
+; MIPS32O0-NEXT: bne $5, $4, $BB17_3
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32O0-NEXT: move $6, $25
+; MIPS32O0-NEXT: sc $6, 0($2)
+; MIPS32O0-NEXT: beqz $6, $BB17_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: $BB17_3: # %entry
+; MIPS32O0-NEXT: xor $1, $5, $1
+; MIPS32O0-NEXT: sltiu $1, $1, 1
+; MIPS32O0-NEXT: sync
+; MIPS32O0-NEXT: addiu $2, $zero, 1
+; MIPS32O0-NEXT: xor $2, $5, $2
+; MIPS32O0-NEXT: sltiu $2, $2, 1
+; MIPS32O0-NEXT: andi $2, $2, 1
+; MIPS32O0-NEXT: sw $3, 8($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $5, 12($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: sw $1, 4($sp) # 4-byte Folded Spill
+; MIPS32O0-NEXT: addiu $sp, $sp, 16
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: zeroreg:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: addiu $2, $zero, 0
+; MIPS32R2-NEXT: addiu $3, $zero, 1
+; MIPS32R2-NEXT: lw $1, %got(a)($1)
+; MIPS32R2-NEXT: $BB17_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $4, 0($1)
+; MIPS32R2-NEXT: bne $4, $3, $BB17_3
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32R2-NEXT: move $5, $2
+; MIPS32R2-NEXT: sc $5, 0($1)
+; MIPS32R2-NEXT: beqz $5, $BB17_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: $BB17_3: # %entry
+; MIPS32R2-NEXT: xor $1, $4, $3
+; MIPS32R2-NEXT: sltiu $2, $1, 1
+; MIPS32R2-NEXT: sync
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: zeroreg:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: addiu $2, $zero, 0
+; MIPS32R6-NEXT: addiu $3, $zero, 1
+; MIPS32R6-NEXT: lw $1, %got(a)($1)
+; MIPS32R6-NEXT: $BB17_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $4, 0($1)
+; MIPS32R6-NEXT: bnec $4, $3, $BB17_3
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32R6-NEXT: move $5, $2
+; MIPS32R6-NEXT: sc $5, 0($1)
+; MIPS32R6-NEXT: beqzc $5, $BB17_1
+; MIPS32R6-NEXT: $BB17_3: # %entry
+; MIPS32R6-NEXT: xor $1, $4, $3
+; MIPS32R6-NEXT: sltiu $2, $1, 1
+; MIPS32R6-NEXT: sync
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: zeroreg:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: lw $2, %got(a)($2)
+; MIPS32R6O0-NEXT: addiu $25, $zero, 0
+; MIPS32R6O0-NEXT: addiu $1, $zero, 1
+; MIPS32R6O0-NEXT: lw $3, 4($sp) # 4-byte Folded Reload
+; MIPS32R6O0-NEXT: move $4, $1
+; MIPS32R6O0-NEXT: $BB17_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $5, 0($2)
+; MIPS32R6O0-NEXT: bnec $5, $4, $BB17_3
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32R6O0-NEXT: move $6, $25
+; MIPS32R6O0-NEXT: sc $6, 0($2)
+; MIPS32R6O0-NEXT: beqzc $6, $BB17_1
+; MIPS32R6O0-NEXT: $BB17_3: # %entry
+; MIPS32R6O0-NEXT: xor $1, $5, $1
+; MIPS32R6O0-NEXT: sltiu $2, $1, 1
+; MIPS32R6O0-NEXT: sync
+; MIPS32R6O0-NEXT: sw $3, 0($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: sw $5, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: zeroreg:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(zeroreg)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(zeroreg)))
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: addiu $2, $zero, 0
+; MIPS4-NEXT: addiu $3, $zero, 1
+; MIPS4-NEXT: ld $1, %got_disp(a)($1)
+; MIPS4-NEXT: .LBB17_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $4, 0($1)
+; MIPS4-NEXT: bne $4, $3, .LBB17_3
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS4-NEXT: move $5, $2
+; MIPS4-NEXT: sc $5, 0($1)
+; MIPS4-NEXT: beqz $5, .LBB17_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: .LBB17_3: # %entry
+; MIPS4-NEXT: xor $1, $4, $3
+; MIPS4-NEXT: sltiu $2, $1, 1
+; MIPS4-NEXT: sync
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: zeroreg:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(zeroreg)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(zeroreg)))
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: addiu $2, $zero, 0
+; MIPS64-NEXT: addiu $3, $zero, 1
+; MIPS64-NEXT: ld $1, %got_disp(a)($1)
+; MIPS64-NEXT: .LBB17_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $4, 0($1)
+; MIPS64-NEXT: bne $4, $3, .LBB17_3
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS64-NEXT: move $5, $2
+; MIPS64-NEXT: sc $5, 0($1)
+; MIPS64-NEXT: beqz $5, .LBB17_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: .LBB17_3: # %entry
+; MIPS64-NEXT: xor $1, $4, $3
+; MIPS64-NEXT: sltiu $2, $1, 1
+; MIPS64-NEXT: sync
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: zeroreg:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(zeroreg)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(zeroreg)))
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: addiu $2, $zero, 0
+; MIPS64R2-NEXT: addiu $3, $zero, 1
+; MIPS64R2-NEXT: ld $1, %got_disp(a)($1)
+; MIPS64R2-NEXT: .LBB17_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $4, 0($1)
+; MIPS64R2-NEXT: bne $4, $3, .LBB17_3
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS64R2-NEXT: move $5, $2
+; MIPS64R2-NEXT: sc $5, 0($1)
+; MIPS64R2-NEXT: beqz $5, .LBB17_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: .LBB17_3: # %entry
+; MIPS64R2-NEXT: xor $1, $4, $3
+; MIPS64R2-NEXT: sltiu $2, $1, 1
+; MIPS64R2-NEXT: sync
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: zeroreg:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(zeroreg)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(zeroreg)))
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: addiu $2, $zero, 0
+; MIPS64R6-NEXT: addiu $3, $zero, 1
+; MIPS64R6-NEXT: ld $1, %got_disp(a)($1)
+; MIPS64R6-NEXT: .LBB17_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $4, 0($1)
+; MIPS64R6-NEXT: bnec $4, $3, .LBB17_3
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS64R6-NEXT: move $5, $2
+; MIPS64R6-NEXT: sc $5, 0($1)
+; MIPS64R6-NEXT: beqzc $5, .LBB17_1
+; MIPS64R6-NEXT: .LBB17_3: # %entry
+; MIPS64R6-NEXT: xor $1, $4, $3
+; MIPS64R6-NEXT: sltiu $2, $1, 1
+; MIPS64R6-NEXT: sync
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: zeroreg:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, -16
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(zeroreg)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(zeroreg)))
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: ld $1, %got_disp(a)($1)
+; MIPS64R6O0-NEXT: addiu $2, $zero, 0
+; MIPS64R6O0-NEXT: addiu $3, $zero, 1
+; MIPS64R6O0-NEXT: lw $4, 12($sp) # 4-byte Folded Reload
+; MIPS64R6O0-NEXT: move $5, $3
+; MIPS64R6O0-NEXT: .LBB17_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $6, 0($1)
+; MIPS64R6O0-NEXT: bnec $6, $5, .LBB17_3
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS64R6O0-NEXT: move $7, $2
+; MIPS64R6O0-NEXT: sc $7, 0($1)
+; MIPS64R6O0-NEXT: beqzc $7, .LBB17_1
+; MIPS64R6O0-NEXT: .LBB17_3: # %entry
+; MIPS64R6O0-NEXT: xor $2, $6, $3
+; MIPS64R6O0-NEXT: sltiu $2, $2, 1
+; MIPS64R6O0-NEXT: sync
+; MIPS64R6O0-NEXT: sw $4, 8($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: sw $6, 12($sp) # 4-byte Folded Spill
+; MIPS64R6O0-NEXT: daddiu $sp, $sp, 16
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: zeroreg:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: sync
+; MM32-NEXT: li16 $3, 0
+; MM32-NEXT: li16 $4, 1
+; MM32-NEXT: lw $1, %got(a)($2)
+; MM32-NEXT: $BB17_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: bne $2, $4, $BB17_3
+; MM32-NEXT: nop
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MM32-NEXT: move $5, $3
+; MM32-NEXT: sc $5, 0($1)
+; MM32-NEXT: beqzc $5, $BB17_1
+; MM32-NEXT: $BB17_3: # %entry
+; MM32-NEXT: xor $1, $2, $4
+; MM32-NEXT: sltiu $2, $1, 1
+; MM32-NEXT: sync
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: zeroreg:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: sync
+; O1-NEXT: addiu $2, $zero, 0
+; O1-NEXT: addiu $3, $zero, 1
+; O1-NEXT: lw $1, %got(a)($1)
+; O1-NEXT: $BB17_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $4, 0($1)
+; O1-NEXT: bne $4, $3, $BB17_3
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: # in Loop: Header=BB17_1 Depth=1
+; O1-NEXT: move $5, $2
+; O1-NEXT: sc $5, 0($1)
+; O1-NEXT: beqz $5, $BB17_1
+; O1-NEXT: nop
+; O1-NEXT: $BB17_3: # %entry
+; O1-NEXT: xor $1, $4, $3
+; O1-NEXT: sltiu $2, $1, 1
+; O1-NEXT: sync
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: zeroreg:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: sync
+; O2-NEXT: addiu $2, $zero, 0
+; O2-NEXT: addiu $3, $zero, 1
+; O2-NEXT: lw $1, %got(a)($1)
+; O2-NEXT: $BB17_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $4, 0($1)
+; O2-NEXT: bne $4, $3, $BB17_3
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: # in Loop: Header=BB17_1 Depth=1
+; O2-NEXT: move $5, $2
+; O2-NEXT: sc $5, 0($1)
+; O2-NEXT: beqz $5, $BB17_1
+; O2-NEXT: nop
+; O2-NEXT: $BB17_3: # %entry
+; O2-NEXT: xor $1, $4, $3
+; O2-NEXT: sltiu $2, $1, 1
+; O2-NEXT: sync
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: zeroreg:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: addiu $2, $zero, 0
+; O3-NEXT: addiu $3, $zero, 1
+; O3-NEXT: sync
+; O3-NEXT: lw $1, %got(a)($1)
+; O3-NEXT: $BB17_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $4, 0($1)
+; O3-NEXT: bne $4, $3, $BB17_3
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: # in Loop: Header=BB17_1 Depth=1
+; O3-NEXT: move $5, $2
+; O3-NEXT: sc $5, 0($1)
+; O3-NEXT: beqz $5, $BB17_1
+; O3-NEXT: nop
+; O3-NEXT: $BB17_3: # %entry
+; O3-NEXT: sync
+; O3-NEXT: xor $1, $4, $3
+; O3-NEXT: jr $ra
+; O3-NEXT: sltiu $2, $1, 1
+;
+; MIPS32EB-LABEL: zeroreg:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: addiu $2, $zero, 0
+; MIPS32EB-NEXT: addiu $3, $zero, 1
+; MIPS32EB-NEXT: lw $1, %got(a)($1)
+; MIPS32EB-NEXT: $BB17_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $4, 0($1)
+; MIPS32EB-NEXT: bne $4, $3, $BB17_3
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: # in Loop: Header=BB17_1 Depth=1
+; MIPS32EB-NEXT: move $5, $2
+; MIPS32EB-NEXT: sc $5, 0($1)
+; MIPS32EB-NEXT: beqz $5, $BB17_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: $BB17_3: # %entry
+; MIPS32EB-NEXT: xor $1, $4, $3
+; MIPS32EB-NEXT: sltiu $2, $1, 1
+; MIPS32EB-NEXT: sync
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
entry:
%pair0 = cmpxchg i32* @a, i32 1, i32 0 seq_cst seq_cst
%0 = extractvalue { i32, i1 } %pair0, 0
; Check that MIPS32R6 has the correct offset range.
; FIXME: At the moment, we don't seem to do addr+offset for any atomic load/store.
define i32 @AtomicLoadAdd32_OffGt9Bit(i32 signext %incr) nounwind {
+; MIPS32-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32: # %bb.0: # %entry
+; MIPS32-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32-NEXT: addu $1, $2, $25
+; MIPS32-NEXT: lw $1, %got(x)($1)
+; MIPS32-NEXT: addiu $1, $1, 1024
+; MIPS32-NEXT: $BB18_1: # %entry
+; MIPS32-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32-NEXT: ll $2, 0($1)
+; MIPS32-NEXT: addu $3, $2, $4
+; MIPS32-NEXT: sc $3, 0($1)
+; MIPS32-NEXT: beqz $3, $BB18_1
+; MIPS32-NEXT: nop
+; MIPS32-NEXT: # %bb.2: # %entry
+; MIPS32-NEXT: jr $ra
+; MIPS32-NEXT: nop
+;
+; MIPS32O0-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32O0: # %bb.0: # %entry
+; MIPS32O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32O0-NEXT: addu $2, $2, $25
+; MIPS32O0-NEXT: lw $2, %got(x)($2)
+; MIPS32O0-NEXT: addiu $2, $2, 1024
+; MIPS32O0-NEXT: $BB18_1: # %entry
+; MIPS32O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32O0-NEXT: ll $25, 0($2)
+; MIPS32O0-NEXT: addu $1, $25, $4
+; MIPS32O0-NEXT: sc $1, 0($2)
+; MIPS32O0-NEXT: beqz $1, $BB18_1
+; MIPS32O0-NEXT: nop
+; MIPS32O0-NEXT: # %bb.2: # %entry
+; MIPS32O0-NEXT: move $2, $25
+; MIPS32O0-NEXT: jr $ra
+; MIPS32O0-NEXT: nop
+;
+; MIPS32R2-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32R2: # %bb.0: # %entry
+; MIPS32R2-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R2-NEXT: addu $1, $2, $25
+; MIPS32R2-NEXT: lw $1, %got(x)($1)
+; MIPS32R2-NEXT: addiu $1, $1, 1024
+; MIPS32R2-NEXT: $BB18_1: # %entry
+; MIPS32R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R2-NEXT: ll $2, 0($1)
+; MIPS32R2-NEXT: addu $3, $2, $4
+; MIPS32R2-NEXT: sc $3, 0($1)
+; MIPS32R2-NEXT: beqz $3, $BB18_1
+; MIPS32R2-NEXT: nop
+; MIPS32R2-NEXT: # %bb.2: # %entry
+; MIPS32R2-NEXT: jr $ra
+; MIPS32R2-NEXT: nop
+;
+; MIPS32R6-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32R6: # %bb.0: # %entry
+; MIPS32R6-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6-NEXT: addu $1, $2, $25
+; MIPS32R6-NEXT: lw $1, %got(x)($1)
+; MIPS32R6-NEXT: addiu $1, $1, 1024
+; MIPS32R6-NEXT: $BB18_1: # %entry
+; MIPS32R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6-NEXT: ll $2, 0($1)
+; MIPS32R6-NEXT: addu $3, $2, $4
+; MIPS32R6-NEXT: sc $3, 0($1)
+; MIPS32R6-NEXT: beqzc $3, $BB18_1
+; MIPS32R6-NEXT: nop
+; MIPS32R6-NEXT: # %bb.2: # %entry
+; MIPS32R6-NEXT: jrc $ra
+;
+; MIPS32R6O0-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32R6O0: # %bb.0: # %entry
+; MIPS32R6O0-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32R6O0-NEXT: addiu $sp, $sp, -8
+; MIPS32R6O0-NEXT: addu $2, $2, $25
+; MIPS32R6O0-NEXT: move $25, $4
+; MIPS32R6O0-NEXT: lw $2, %got(x)($2)
+; MIPS32R6O0-NEXT: addiu $2, $2, 1024
+; MIPS32R6O0-NEXT: $BB18_1: # %entry
+; MIPS32R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32R6O0-NEXT: ll $1, 0($2)
+; MIPS32R6O0-NEXT: addu $3, $1, $4
+; MIPS32R6O0-NEXT: sc $3, 0($2)
+; MIPS32R6O0-NEXT: beqzc $3, $BB18_1
+; MIPS32R6O0-NEXT: # %bb.2: # %entry
+; MIPS32R6O0-NEXT: move $2, $1
+; MIPS32R6O0-NEXT: sw $25, 4($sp) # 4-byte Folded Spill
+; MIPS32R6O0-NEXT: addiu $sp, $sp, 8
+; MIPS32R6O0-NEXT: jrc $ra
+;
+; MIPS4-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS4: # %bb.0: # %entry
+; MIPS4-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS4-NEXT: daddu $1, $1, $25
+; MIPS4-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS4-NEXT: ld $1, %got_disp(x)($1)
+; MIPS4-NEXT: daddiu $1, $1, 1024
+; MIPS4-NEXT: .LBB18_1: # %entry
+; MIPS4-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS4-NEXT: ll $2, 0($1)
+; MIPS4-NEXT: addu $3, $2, $4
+; MIPS4-NEXT: sc $3, 0($1)
+; MIPS4-NEXT: beqz $3, .LBB18_1
+; MIPS4-NEXT: nop
+; MIPS4-NEXT: # %bb.2: # %entry
+; MIPS4-NEXT: jr $ra
+; MIPS4-NEXT: nop
+;
+; MIPS64-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS64: # %bb.0: # %entry
+; MIPS64-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64-NEXT: daddu $1, $1, $25
+; MIPS64-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64-NEXT: daddiu $1, $1, 1024
+; MIPS64-NEXT: .LBB18_1: # %entry
+; MIPS64-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64-NEXT: ll $2, 0($1)
+; MIPS64-NEXT: addu $3, $2, $4
+; MIPS64-NEXT: sc $3, 0($1)
+; MIPS64-NEXT: beqz $3, .LBB18_1
+; MIPS64-NEXT: nop
+; MIPS64-NEXT: # %bb.2: # %entry
+; MIPS64-NEXT: jr $ra
+; MIPS64-NEXT: nop
+;
+; MIPS64R2-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS64R2: # %bb.0: # %entry
+; MIPS64R2-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R2-NEXT: daddu $1, $1, $25
+; MIPS64R2-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R2-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R2-NEXT: daddiu $1, $1, 1024
+; MIPS64R2-NEXT: .LBB18_1: # %entry
+; MIPS64R2-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R2-NEXT: ll $2, 0($1)
+; MIPS64R2-NEXT: addu $3, $2, $4
+; MIPS64R2-NEXT: sc $3, 0($1)
+; MIPS64R2-NEXT: beqz $3, .LBB18_1
+; MIPS64R2-NEXT: nop
+; MIPS64R2-NEXT: # %bb.2: # %entry
+; MIPS64R2-NEXT: jr $ra
+; MIPS64R2-NEXT: nop
+;
+; MIPS64R6-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS64R6: # %bb.0: # %entry
+; MIPS64R6-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R6-NEXT: daddu $1, $1, $25
+; MIPS64R6-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R6-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6-NEXT: daddiu $1, $1, 1024
+; MIPS64R6-NEXT: .LBB18_1: # %entry
+; MIPS64R6-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6-NEXT: ll $2, 0($1)
+; MIPS64R6-NEXT: addu $3, $2, $4
+; MIPS64R6-NEXT: sc $3, 0($1)
+; MIPS64R6-NEXT: beqzc $3, .LBB18_1
+; MIPS64R6-NEXT: nop
+; MIPS64R6-NEXT: # %bb.2: # %entry
+; MIPS64R6-NEXT: jrc $ra
+;
+; MIPS64R6O0-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS64R6O0: # %bb.0: # %entry
+; MIPS64R6O0-NEXT: lui $1, %hi(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R6O0-NEXT: daddu $1, $1, $25
+; MIPS64R6O0-NEXT: daddiu $1, $1, %lo(%neg(%gp_rel(AtomicLoadAdd32_OffGt9Bit)))
+; MIPS64R6O0-NEXT: move $2, $4
+; MIPS64R6O0-NEXT: ld $1, %got_disp(x)($1)
+; MIPS64R6O0-NEXT: daddiu $1, $1, 1024
+; MIPS64R6O0-NEXT: .LBB18_1: # %entry
+; MIPS64R6O0-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS64R6O0-NEXT: ll $3, 0($1)
+; MIPS64R6O0-NEXT: addu $5, $3, $2
+; MIPS64R6O0-NEXT: sc $5, 0($1)
+; MIPS64R6O0-NEXT: beqzc $5, .LBB18_1
+; MIPS64R6O0-NEXT: # %bb.2: # %entry
+; MIPS64R6O0-NEXT: move $2, $3
+; MIPS64R6O0-NEXT: jrc $ra
+;
+; MM32-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MM32: # %bb.0: # %entry
+; MM32-NEXT: lui $2, %hi(_gp_disp)
+; MM32-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MM32-NEXT: addu $2, $2, $25
+; MM32-NEXT: lw $1, %got(x)($2)
+; MM32-NEXT: addiu $1, $1, 1024
+; MM32-NEXT: $BB18_1: # %entry
+; MM32-NEXT: # =>This Inner Loop Header: Depth=1
+; MM32-NEXT: ll $2, 0($1)
+; MM32-NEXT: addu16 $3, $2, $4
+; MM32-NEXT: sc $3, 0($1)
+; MM32-NEXT: beqzc $3, $BB18_1
+; MM32-NEXT: # %bb.2: # %entry
+; MM32-NEXT: jrc $ra
+;
+; O1-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; O1: # %bb.0: # %entry
+; O1-NEXT: lui $2, %hi(_gp_disp)
+; O1-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O1-NEXT: addu $1, $2, $25
+; O1-NEXT: lw $1, %got(x)($1)
+; O1-NEXT: addiu $1, $1, 1024
+; O1-NEXT: $BB18_1: # %entry
+; O1-NEXT: # =>This Inner Loop Header: Depth=1
+; O1-NEXT: ll $2, 0($1)
+; O1-NEXT: addu $3, $2, $4
+; O1-NEXT: sc $3, 0($1)
+; O1-NEXT: beqz $3, $BB18_1
+; O1-NEXT: nop
+; O1-NEXT: # %bb.2: # %entry
+; O1-NEXT: jr $ra
+; O1-NEXT: nop
+;
+; O2-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; O2: # %bb.0: # %entry
+; O2-NEXT: lui $2, %hi(_gp_disp)
+; O2-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O2-NEXT: addu $1, $2, $25
+; O2-NEXT: lw $1, %got(x)($1)
+; O2-NEXT: addiu $1, $1, 1024
+; O2-NEXT: $BB18_1: # %entry
+; O2-NEXT: # =>This Inner Loop Header: Depth=1
+; O2-NEXT: ll $2, 0($1)
+; O2-NEXT: addu $3, $2, $4
+; O2-NEXT: sc $3, 0($1)
+; O2-NEXT: beqz $3, $BB18_1
+; O2-NEXT: nop
+; O2-NEXT: # %bb.2: # %entry
+; O2-NEXT: jr $ra
+; O2-NEXT: nop
+;
+; O3-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; O3: # %bb.0: # %entry
+; O3-NEXT: lui $2, %hi(_gp_disp)
+; O3-NEXT: addiu $2, $2, %lo(_gp_disp)
+; O3-NEXT: addu $1, $2, $25
+; O3-NEXT: lw $1, %got(x)($1)
+; O3-NEXT: addiu $1, $1, 1024
+; O3-NEXT: $BB18_1: # %entry
+; O3-NEXT: # =>This Inner Loop Header: Depth=1
+; O3-NEXT: ll $2, 0($1)
+; O3-NEXT: addu $3, $2, $4
+; O3-NEXT: sc $3, 0($1)
+; O3-NEXT: beqz $3, $BB18_1
+; O3-NEXT: nop
+; O3-NEXT: # %bb.2: # %entry
+; O3-NEXT: jr $ra
+; O3-NEXT: nop
+;
+; MIPS32EB-LABEL: AtomicLoadAdd32_OffGt9Bit:
+; MIPS32EB: # %bb.0: # %entry
+; MIPS32EB-NEXT: lui $2, %hi(_gp_disp)
+; MIPS32EB-NEXT: addiu $2, $2, %lo(_gp_disp)
+; MIPS32EB-NEXT: addu $1, $2, $25
+; MIPS32EB-NEXT: lw $1, %got(x)($1)
+; MIPS32EB-NEXT: addiu $1, $1, 1024
+; MIPS32EB-NEXT: $BB18_1: # %entry
+; MIPS32EB-NEXT: # =>This Inner Loop Header: Depth=1
+; MIPS32EB-NEXT: ll $2, 0($1)
+; MIPS32EB-NEXT: addu $3, $2, $4
+; MIPS32EB-NEXT: sc $3, 0($1)
+; MIPS32EB-NEXT: beqz $3, $BB18_1
+; MIPS32EB-NEXT: nop
+; MIPS32EB-NEXT: # %bb.2: # %entry
+; MIPS32EB-NEXT: jr $ra
+; MIPS32EB-NEXT: nop
entry:
%0 = atomicrmw add i32* getelementptr(i32, i32* @x, i32 256), i32 %incr monotonic
ret i32 %0
-; ALL-LABEL: AtomicLoadAdd32_OffGt9Bit:
-
-; MIPS32-ANY: lw $[[R0:[0-9]+]], %got(x)
-; MIPS64-ANY: ld $[[R0:[0-9]+]], %got_disp(x)(
-
-; ALL: addiu $[[PTR:[0-9]+]], $[[R0]], 1024
-; ALL: [[BB0:(\$|\.L)[A-Z_0-9]+]]:
-; ALL: ll $[[R1:[0-9]+]], 0($[[PTR]])
-; ALL: addu $[[R2:[0-9]+]], $[[R1]], $4
-; ALL: sc $[[R2]], 0($[[PTR]])
-; NOT-MICROMIPS: beqz $[[R2]], [[BB0]]
-; MICROMIPS: beqzc $[[R2]], [[BB0]]
-; MIPSR6: beqzc $[[R2]], [[BB0]]
}