%1 = atomicrmw xchg ptr %a, i64 %b acquire
ret i64 %1
}
+
+define i8 @atomicrmw_add_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_add_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: ori $a3, $zero, 255
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB4_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: add.w $a5, $a4, $a1
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB4_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_add_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: ori $a3, $zero, 255
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB4_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: add.w $a5, $a4, $a1
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB4_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw add ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_add_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_add_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: lu12i.w $a3, 15
+; LA32-NEXT: ori $a3, $a3, 4095
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB5_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: add.w $a5, $a4, $a1
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB5_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_add_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: lu12i.w $a3, 15
+; LA64-NEXT: ori $a3, $a3, 4095
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB5_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: add.w $a5, $a4, $a1
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB5_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw add ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_add_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_add_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB6_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: add.w $a3, $a2, $a1
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB6_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_add_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amadd_db.w $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw add ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_add_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_add_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_add_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_add_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amadd_db.d $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw add ptr %a, i64 %b acquire
+ ret i64 %1
+}
+
+define i8 @atomicrmw_sub_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_sub_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: ori $a3, $zero, 255
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB8_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: sub.w $a5, $a4, $a1
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB8_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_sub_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: ori $a3, $zero, 255
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB8_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: sub.w $a5, $a4, $a1
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB8_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw sub ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_sub_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_sub_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: lu12i.w $a3, 15
+; LA32-NEXT: ori $a3, $a3, 4095
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB9_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: sub.w $a5, $a4, $a1
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB9_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_sub_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: lu12i.w $a3, 15
+; LA64-NEXT: ori $a3, $a3, 4095
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB9_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: sub.w $a5, $a4, $a1
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB9_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw sub ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_sub_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_sub_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB10_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: sub.w $a3, $a2, $a1
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB10_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_sub_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: sub.w $a1, $zero, $a1
+; LA64-NEXT: amadd_db.w $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw sub ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_sub_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_sub_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_sub_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_sub_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: sub.d $a1, $zero, $a1
+; LA64-NEXT: amadd_db.d $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw sub ptr %a, i64 %b acquire
+ ret i64 %1
+}
+
+define i8 @atomicrmw_nand_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_nand_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: ori $a3, $zero, 255
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB12_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: and $a5, $a4, $a1
+; LA32-NEXT: nor $a5, $a5, $zero
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB12_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_nand_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: ori $a3, $zero, 255
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB12_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: and $a5, $a4, $a1
+; LA64-NEXT: nor $a5, $a5, $zero
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB12_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw nand ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_nand_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_nand_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: lu12i.w $a3, 15
+; LA32-NEXT: ori $a3, $a3, 4095
+; LA32-NEXT: sll.w $a3, $a3, $a0
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB13_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a4, $a2, 0
+; LA32-NEXT: and $a5, $a4, $a1
+; LA32-NEXT: nor $a5, $a5, $zero
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: and $a5, $a5, $a3
+; LA32-NEXT: xor $a5, $a4, $a5
+; LA32-NEXT: sc.w $a5, $a2, 0
+; LA32-NEXT: beq $a5, $zero, .LBB13_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a4, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_nand_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: lu12i.w $a3, 15
+; LA64-NEXT: ori $a3, $a3, 4095
+; LA64-NEXT: sll.w $a3, $a3, $a0
+; LA64-NEXT: addi.w $a3, $a3, 0
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: addi.w $a1, $a1, 0
+; LA64-NEXT: .LBB13_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a4, $a2, 0
+; LA64-NEXT: and $a5, $a4, $a1
+; LA64-NEXT: nor $a5, $a5, $zero
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: and $a5, $a5, $a3
+; LA64-NEXT: xor $a5, $a4, $a5
+; LA64-NEXT: sc.w $a5, $a2, 0
+; LA64-NEXT: beq $a5, $zero, .LBB13_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: srl.w $a0, $a4, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw nand ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_nand_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_nand_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB14_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: and $a3, $a2, $a1
+; LA32-NEXT: nor $a3, $a3, $zero
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB14_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_nand_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: .LBB14_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.w $a2, $a0, 0
+; LA64-NEXT: and $a3, $a2, $a1
+; LA64-NEXT: nor $a3, $a3, $zero
+; LA64-NEXT: sc.w $a3, $a0, 0
+; LA64-NEXT: beq $a3, $zero, .LBB14_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw nand ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_nand_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_nand_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_nand_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_nand_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: .LBB15_1: # =>This Inner Loop Header: Depth=1
+; LA64-NEXT: dbar 0
+; LA64-NEXT: ll.d $a2, $a0, 0
+; LA64-NEXT: and $a3, $a2, $a1
+; LA64-NEXT: nor $a3, $a3, $zero
+; LA64-NEXT: sc.d $a3, $a0, 0
+; LA64-NEXT: beq $a3, $zero, .LBB15_1
+; LA64-NEXT: # %bb.2:
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw nand ptr %a, i64 %b acquire
+ ret i64 %1
+}
+
+define i8 @atomicrmw_and_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_and_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: slli.w $a2, $a0, 3
+; LA32-NEXT: ori $a3, $zero, 255
+; LA32-NEXT: sll.w $a3, $a3, $a2
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a2
+; LA32-NEXT: orn $a1, $a1, $a3
+; LA32-NEXT: addi.w $a3, $zero, -4
+; LA32-NEXT: and $a0, $a0, $a3
+; LA32-NEXT: .LBB16_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a3, $a0, 0
+; LA32-NEXT: and $a4, $a3, $a1
+; LA32-NEXT: sc.w $a4, $a0, 0
+; LA32-NEXT: beq $a4, $zero, .LBB16_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a3, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_and_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: slli.d $a2, $a0, 3
+; LA64-NEXT: ori $a3, $zero, 255
+; LA64-NEXT: sll.w $a3, $a3, $a2
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a2
+; LA64-NEXT: orn $a1, $a1, $a3
+; LA64-NEXT: addi.w $a3, $zero, -4
+; LA64-NEXT: and $a0, $a0, $a3
+; LA64-NEXT: amand_db.w $a3, $a1, $a0
+; LA64-NEXT: srl.w $a0, $a3, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw and ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_and_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_and_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: lu12i.w $a2, 15
+; LA32-NEXT: ori $a2, $a2, 4095
+; LA32-NEXT: slli.w $a3, $a0, 3
+; LA32-NEXT: sll.w $a2, $a2, $a3
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a3
+; LA32-NEXT: orn $a1, $a1, $a2
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a0, $a0, $a2
+; LA32-NEXT: .LBB17_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: and $a4, $a2, $a1
+; LA32-NEXT: sc.w $a4, $a0, 0
+; LA32-NEXT: beq $a4, $zero, .LBB17_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a2, $a3
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_and_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: lu12i.w $a2, 15
+; LA64-NEXT: ori $a2, $a2, 4095
+; LA64-NEXT: slli.d $a3, $a0, 3
+; LA64-NEXT: sll.w $a2, $a2, $a3
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a3
+; LA64-NEXT: orn $a1, $a1, $a2
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a0, $a0, $a2
+; LA64-NEXT: amand_db.w $a2, $a1, $a0
+; LA64-NEXT: srl.w $a0, $a2, $a3
+; LA64-NEXT: ret
+ %1 = atomicrmw and ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_and_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_and_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB18_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: and $a3, $a2, $a1
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB18_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_and_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amand_db.w $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw and ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_and_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_and_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_and_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_and_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amand_db.d $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw and ptr %a, i64 %b acquire
+ ret i64 %1
+}
+
+define i8 @atomicrmw_or_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_or_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB20_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a3, $a2, 0
+; LA32-NEXT: or $a4, $a3, $a1
+; LA32-NEXT: sc.w $a4, $a2, 0
+; LA32-NEXT: beq $a4, $zero, .LBB20_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a3, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_or_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: amor_db.w $a3, $a1, $a2
+; LA64-NEXT: srl.w $a0, $a3, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw or ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_or_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_or_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB21_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a3, $a2, 0
+; LA32-NEXT: or $a4, $a3, $a1
+; LA32-NEXT: sc.w $a4, $a2, 0
+; LA32-NEXT: beq $a4, $zero, .LBB21_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a3, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_or_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: amor_db.w $a3, $a1, $a2
+; LA64-NEXT: srl.w $a0, $a3, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw or ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_or_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_or_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB22_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: or $a3, $a2, $a1
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB22_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_or_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amor_db.w $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw or ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_or_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_or_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_or_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_or_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amor_db.d $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw or ptr %a, i64 %b acquire
+ ret i64 %1
+}
+
+define i8 @atomicrmw_xor_i8_acquire(ptr %a, i8 %b) nounwind {
+; LA32-LABEL: atomicrmw_xor_i8_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: andi $a1, $a1, 255
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB24_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a3, $a2, 0
+; LA32-NEXT: xor $a4, $a3, $a1
+; LA32-NEXT: sc.w $a4, $a2, 0
+; LA32-NEXT: beq $a4, $zero, .LBB24_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a3, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_xor_i8_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: andi $a1, $a1, 255
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: amxor_db.w $a3, $a1, $a2
+; LA64-NEXT: srl.w $a0, $a3, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw xor ptr %a, i8 %b acquire
+ ret i8 %1
+}
+
+define i16 @atomicrmw_xor_i16_acquire(ptr %a, i16 %b) nounwind {
+; LA32-LABEL: atomicrmw_xor_i16_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $a2, $zero, -4
+; LA32-NEXT: and $a2, $a0, $a2
+; LA32-NEXT: slli.w $a0, $a0, 3
+; LA32-NEXT: bstrpick.w $a1, $a1, 15, 0
+; LA32-NEXT: sll.w $a1, $a1, $a0
+; LA32-NEXT: .LBB25_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a3, $a2, 0
+; LA32-NEXT: xor $a4, $a3, $a1
+; LA32-NEXT: sc.w $a4, $a2, 0
+; LA32-NEXT: beq $a4, $zero, .LBB25_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: srl.w $a0, $a3, $a0
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_xor_i16_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: addi.w $a2, $zero, -4
+; LA64-NEXT: and $a2, $a0, $a2
+; LA64-NEXT: slli.d $a0, $a0, 3
+; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0
+; LA64-NEXT: sll.w $a1, $a1, $a0
+; LA64-NEXT: amxor_db.w $a3, $a1, $a2
+; LA64-NEXT: srl.w $a0, $a3, $a0
+; LA64-NEXT: ret
+ %1 = atomicrmw xor ptr %a, i16 %b acquire
+ ret i16 %1
+}
+
+define i32 @atomicrmw_xor_i32_acquire(ptr %a, i32 %b) nounwind {
+; LA32-LABEL: atomicrmw_xor_i32_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: .LBB26_1: # =>This Inner Loop Header: Depth=1
+; LA32-NEXT: dbar 0
+; LA32-NEXT: ll.w $a2, $a0, 0
+; LA32-NEXT: xor $a3, $a2, $a1
+; LA32-NEXT: sc.w $a3, $a0, 0
+; LA32-NEXT: beq $a3, $zero, .LBB26_1
+; LA32-NEXT: # %bb.2:
+; LA32-NEXT: move $a0, $a2
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_xor_i32_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amxor_db.w $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw xor ptr %a, i32 %b acquire
+ ret i32 %1
+}
+
+define i64 @atomicrmw_xor_i64_acquire(ptr %a, i64 %b) nounwind {
+; LA32-LABEL: atomicrmw_xor_i64_acquire:
+; LA32: # %bb.0:
+; LA32-NEXT: addi.w $sp, $sp, -16
+; LA32-NEXT: st.w $ra, $sp, 12 # 4-byte Folded Spill
+; LA32-NEXT: ori $a3, $zero, 2
+; LA32-NEXT: bl %plt(__atomic_fetch_xor_8)
+; LA32-NEXT: ld.w $ra, $sp, 12 # 4-byte Folded Reload
+; LA32-NEXT: addi.w $sp, $sp, 16
+; LA32-NEXT: ret
+;
+; LA64-LABEL: atomicrmw_xor_i64_acquire:
+; LA64: # %bb.0:
+; LA64-NEXT: amxor_db.d $a2, $a1, $a0
+; LA64-NEXT: move $a0, $a2
+; LA64-NEXT: ret
+ %1 = atomicrmw xor ptr %a, i64 %b acquire
+ ret i64 %1
+}