| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc --mtriple=loongarch64 < %s | FileCheck %s --check-prefix=LA64 |
| |
| ; i8 cmpxchg with acquire ordering on both success and failure; the result is unused. |
| ; The expected LA64 code ANDs the pointer with -4, shifts the compare value, the new |
| ; value and a 255 mask left by (pointer << 3), then retries an ll.w/sc.w loop on that word. |
| ; A "dbar 0" precedes the sc.w, and the compare-mismatch exit (.LBB0_3) emits "dbar 1792". |
| define void @cmpxchg_i8_acquire_acquire(ptr %ptr, i8 %cmp, i8 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i8_acquire_acquire: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: andi $a1, $a1, 255 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: andi $a2, $a2, 255 |
| ; LA64-NEXT: sll.w $a2, $a2, $a0 |
| ; LA64-NEXT: ori $a4, $zero, 255 |
| ; LA64-NEXT: sll.w $a0, $a4, $a0 |
| ; LA64-NEXT: addi.w $a0, $a0, 0 |
| ; LA64-NEXT: addi.w $a2, $a2, 0 |
| ; LA64-NEXT: addi.w $a1, $a1, 0 |
| ; LA64-NEXT: .LBB0_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a4, $a3, 0 |
| ; LA64-NEXT: and $a5, $a4, $a0 |
| ; LA64-NEXT: bne $a5, $a1, .LBB0_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB0_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a5, $a4, $a0 |
| ; LA64-NEXT: or $a5, $a5, $a2 |
| ; LA64-NEXT: sc.w $a5, $a3, 0 |
| ; LA64-NEXT: beqz $a5, .LBB0_1 |
| ; LA64-NEXT: b .LBB0_4 |
| ; LA64-NEXT: .LBB0_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB0_4: |
| ; LA64-NEXT: ret |
| %res = cmpxchg ptr %ptr, i8 %cmp, i8 %val acquire acquire |
| ret void |
| } |
| |
| ; i16 cmpxchg with acquire ordering on both success and failure; the result is unused. |
| ; Same shape as the i8 case, but the operands are narrowed with bstrpick.d (bits 15:0) |
| ; and the mask is built as lu12i.w 15 / ori 4095 (0xffff) before being shifted into place. |
| ; The ll.w/sc.w loop operates on the word at (pointer & -4). |
| define void @cmpxchg_i16_acquire_acquire(ptr %ptr, i16 %cmp, i16 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i16_acquire_acquire: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: bstrpick.d $a2, $a2, 15, 0 |
| ; LA64-NEXT: sll.w $a2, $a2, $a0 |
| ; LA64-NEXT: lu12i.w $a4, 15 |
| ; LA64-NEXT: ori $a4, $a4, 4095 |
| ; LA64-NEXT: sll.w $a0, $a4, $a0 |
| ; LA64-NEXT: addi.w $a0, $a0, 0 |
| ; LA64-NEXT: addi.w $a2, $a2, 0 |
| ; LA64-NEXT: addi.w $a1, $a1, 0 |
| ; LA64-NEXT: .LBB1_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a4, $a3, 0 |
| ; LA64-NEXT: and $a5, $a4, $a0 |
| ; LA64-NEXT: bne $a5, $a1, .LBB1_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB1_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a5, $a4, $a0 |
| ; LA64-NEXT: or $a5, $a5, $a2 |
| ; LA64-NEXT: sc.w $a5, $a3, 0 |
| ; LA64-NEXT: beqz $a5, .LBB1_1 |
| ; LA64-NEXT: b .LBB1_4 |
| ; LA64-NEXT: .LBB1_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB1_4: |
| ; LA64-NEXT: ret |
| %res = cmpxchg ptr %ptr, i16 %cmp, i16 %val acquire acquire |
| ret void |
| } |
| |
| ; i32 cmpxchg with acquire ordering on both success and failure; the result is unused. |
| ; No masking is expected here: the ll.w/sc.w loop addresses the pointer in $a0 directly |
| ; and compares the loaded word against $a1. The new value is copied to $a4 before sc.w. |
| define void @cmpxchg_i32_acquire_acquire(ptr %ptr, i32 %cmp, i32 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i32_acquire_acquire: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB2_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB2_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB2_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.w $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB2_1 |
| ; LA64-NEXT: b .LBB2_4 |
| ; LA64-NEXT: .LBB2_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB2_4: |
| ; LA64-NEXT: ret |
| %res = cmpxchg ptr %ptr, i32 %cmp, i32 %val acquire acquire |
| ret void |
| } |
| |
| ; i64 cmpxchg with acquire ordering on both success and failure; the result is unused. |
| ; Expected code mirrors the i32 case but uses the doubleword pair ll.d/sc.d on the |
| ; pointer in $a0, with "dbar 0" before the store and "dbar 1792" on the mismatch exit. |
| define void @cmpxchg_i64_acquire_acquire(ptr %ptr, i64 %cmp, i64 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i64_acquire_acquire: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB3_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.d $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB3_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB3_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.d $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB3_1 |
| ; LA64-NEXT: b .LBB3_4 |
| ; LA64-NEXT: .LBB3_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB3_4: |
| ; LA64-NEXT: ret |
| %res = cmpxchg ptr %ptr, i64 %cmp, i64 %val acquire acquire |
| ret void |
| } |
| |
| ; i8 cmpxchg (acquire/acquire) that returns element 0 of the result pair, i.e. the |
| ; value loaded from memory. The expected code uses the masked ll.w/sc.w loop on the |
| ; word at (pointer & -4); after the loop, the loaded word ($a5) is shifted right by |
| ; the same shift amount ($a0) to produce the return value. |
| define i8 @cmpxchg_i8_acquire_acquire_reti8(ptr %ptr, i8 %cmp, i8 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i8_acquire_acquire_reti8: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: ori $a4, $zero, 255 |
| ; LA64-NEXT: sll.w $a4, $a4, $a0 |
| ; LA64-NEXT: addi.w $a4, $a4, 0 |
| ; LA64-NEXT: andi $a2, $a2, 255 |
| ; LA64-NEXT: sll.w $a2, $a2, $a0 |
| ; LA64-NEXT: addi.w $a2, $a2, 0 |
| ; LA64-NEXT: andi $a1, $a1, 255 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: addi.w $a1, $a1, 0 |
| ; LA64-NEXT: .LBB4_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a5, $a3, 0 |
| ; LA64-NEXT: and $a6, $a5, $a4 |
| ; LA64-NEXT: bne $a6, $a1, .LBB4_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB4_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a6, $a5, $a4 |
| ; LA64-NEXT: or $a6, $a6, $a2 |
| ; LA64-NEXT: sc.w $a6, $a3, 0 |
| ; LA64-NEXT: beqz $a6, .LBB4_1 |
| ; LA64-NEXT: b .LBB4_4 |
| ; LA64-NEXT: .LBB4_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB4_4: |
| ; LA64-NEXT: srl.w $a0, $a5, $a0 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i8 %cmp, i8 %val acquire acquire |
| %res = extractvalue { i8, i1 } %tmp, 0 |
| ret i8 %res |
| } |
| |
| ; i16 cmpxchg (acquire/acquire) that returns element 0 of the result pair, i.e. the |
| ; value loaded from memory. The expected code builds a shifted 0xffff mask |
| ; (lu12i.w 15 / ori 4095), runs the masked ll.w/sc.w loop on the word at (pointer & -4), |
| ; and finally shifts the loaded word ($a5) right by the shift amount to form the result. |
| define i16 @cmpxchg_i16_acquire_acquire_reti16(ptr %ptr, i16 %cmp, i16 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i16_acquire_acquire_reti16: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: lu12i.w $a4, 15 |
| ; LA64-NEXT: ori $a4, $a4, 4095 |
| ; LA64-NEXT: sll.w $a4, $a4, $a0 |
| ; LA64-NEXT: addi.w $a4, $a4, 0 |
| ; LA64-NEXT: bstrpick.d $a2, $a2, 15, 0 |
| ; LA64-NEXT: sll.w $a2, $a2, $a0 |
| ; LA64-NEXT: addi.w $a2, $a2, 0 |
| ; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: addi.w $a1, $a1, 0 |
| ; LA64-NEXT: .LBB5_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a5, $a3, 0 |
| ; LA64-NEXT: and $a6, $a5, $a4 |
| ; LA64-NEXT: bne $a6, $a1, .LBB5_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB5_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a6, $a5, $a4 |
| ; LA64-NEXT: or $a6, $a6, $a2 |
| ; LA64-NEXT: sc.w $a6, $a3, 0 |
| ; LA64-NEXT: beqz $a6, .LBB5_1 |
| ; LA64-NEXT: b .LBB5_4 |
| ; LA64-NEXT: .LBB5_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB5_4: |
| ; LA64-NEXT: srl.w $a0, $a5, $a0 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i16 %cmp, i16 %val acquire acquire |
| %res = extractvalue { i16, i1 } %tmp, 0 |
| ret i16 %res |
| } |
| |
| ; i32 cmpxchg (acquire/acquire) that returns element 0 of the result pair, i.e. the |
| ; value loaded from memory. The expected code is the plain ll.w/sc.w loop on $a0, |
| ; followed by a move of the loaded word ($a3) into the return register $a0. |
| define i32 @cmpxchg_i32_acquire_acquire_reti32(ptr %ptr, i32 %cmp, i32 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i32_acquire_acquire_reti32: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB6_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB6_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB6_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.w $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB6_1 |
| ; LA64-NEXT: b .LBB6_4 |
| ; LA64-NEXT: .LBB6_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB6_4: |
| ; LA64-NEXT: move $a0, $a3 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i32 %cmp, i32 %val acquire acquire |
| %res = extractvalue { i32, i1 } %tmp, 0 |
| ret i32 %res |
| } |
| |
| ; i64 cmpxchg (acquire/acquire) that returns element 0 of the result pair, i.e. the |
| ; value loaded from memory. The expected code is the ll.d/sc.d loop on $a0, followed |
| ; by a move of the loaded doubleword ($a3) into the return register $a0. |
| define i64 @cmpxchg_i64_acquire_acquire_reti64(ptr %ptr, i64 %cmp, i64 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i64_acquire_acquire_reti64: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB7_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.d $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB7_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB7_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.d $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB7_1 |
| ; LA64-NEXT: b .LBB7_4 |
| ; LA64-NEXT: .LBB7_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB7_4: |
| ; LA64-NEXT: move $a0, $a3 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i64 %cmp, i64 %val acquire acquire |
| %res = extractvalue { i64, i1 } %tmp, 1 |
| ret i64 %res |
| } |
| |
| ; i8 cmpxchg (acquire/acquire) that returns element 1 of the result pair, the i1 |
| ; success flag. The expected code runs the masked ll.w/sc.w loop, then recomputes the |
| ; flag after the loop: the loaded word is masked, both it and the shifted compare value |
| ; are narrowed to bits 31:0 with bstrpick.d, XORed, and tested for zero with sltui ..., 1. |
| define i1 @cmpxchg_i8_acquire_acquire_reti1(ptr %ptr, i8 %cmp, i8 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i8_acquire_acquire_reti1: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: andi $a1, $a1, 255 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: ori $a4, $zero, 255 |
| ; LA64-NEXT: sll.w $a4, $a4, $a0 |
| ; LA64-NEXT: andi $a2, $a2, 255 |
| ; LA64-NEXT: sll.w $a0, $a2, $a0 |
| ; LA64-NEXT: addi.w $a0, $a0, 0 |
| ; LA64-NEXT: addi.w $a2, $a4, 0 |
| ; LA64-NEXT: addi.w $a5, $a1, 0 |
| ; LA64-NEXT: .LBB8_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a6, $a3, 0 |
| ; LA64-NEXT: and $a7, $a6, $a2 |
| ; LA64-NEXT: bne $a7, $a5, .LBB8_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB8_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a7, $a6, $a2 |
| ; LA64-NEXT: or $a7, $a7, $a0 |
| ; LA64-NEXT: sc.w $a7, $a3, 0 |
| ; LA64-NEXT: beqz $a7, .LBB8_1 |
| ; LA64-NEXT: b .LBB8_4 |
| ; LA64-NEXT: .LBB8_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB8_4: |
| ; LA64-NEXT: and $a0, $a6, $a4 |
| ; LA64-NEXT: bstrpick.d $a0, $a0, 31, 0 |
| ; LA64-NEXT: bstrpick.d $a1, $a1, 31, 0 |
| ; LA64-NEXT: xor $a0, $a1, $a0 |
| ; LA64-NEXT: sltui $a0, $a0, 1 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i8 %cmp, i8 %val acquire acquire |
| %res = extractvalue { i8, i1 } %tmp, 1 |
| ret i1 %res |
| } |
| |
| ; i16 cmpxchg (acquire/acquire) that returns element 1 of the result pair, the i1 |
| ; success flag. Same shape as the i8 flag-returning case, with bstrpick.d (bits 15:0) |
| ; narrowing the operands and a 0xffff mask (lu12i.w 15 / ori 4095). After the loop, the |
| ; masked loaded word is XORed with the shifted compare value and tested with sltui ..., 1. |
| define i1 @cmpxchg_i16_acquire_acquire_reti1(ptr %ptr, i16 %cmp, i16 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i16_acquire_acquire_reti1: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: addi.w $a3, $zero, -4 |
| ; LA64-NEXT: and $a3, $a0, $a3 |
| ; LA64-NEXT: slli.d $a0, $a0, 3 |
| ; LA64-NEXT: bstrpick.d $a1, $a1, 15, 0 |
| ; LA64-NEXT: sll.w $a1, $a1, $a0 |
| ; LA64-NEXT: lu12i.w $a4, 15 |
| ; LA64-NEXT: ori $a4, $a4, 4095 |
| ; LA64-NEXT: sll.w $a4, $a4, $a0 |
| ; LA64-NEXT: bstrpick.d $a2, $a2, 15, 0 |
| ; LA64-NEXT: sll.w $a0, $a2, $a0 |
| ; LA64-NEXT: addi.w $a0, $a0, 0 |
| ; LA64-NEXT: addi.w $a2, $a4, 0 |
| ; LA64-NEXT: addi.w $a5, $a1, 0 |
| ; LA64-NEXT: .LBB9_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a6, $a3, 0 |
| ; LA64-NEXT: and $a7, $a6, $a2 |
| ; LA64-NEXT: bne $a7, $a5, .LBB9_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB9_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: andn $a7, $a6, $a2 |
| ; LA64-NEXT: or $a7, $a7, $a0 |
| ; LA64-NEXT: sc.w $a7, $a3, 0 |
| ; LA64-NEXT: beqz $a7, .LBB9_1 |
| ; LA64-NEXT: b .LBB9_4 |
| ; LA64-NEXT: .LBB9_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB9_4: |
| ; LA64-NEXT: and $a0, $a6, $a4 |
| ; LA64-NEXT: bstrpick.d $a0, $a0, 31, 0 |
| ; LA64-NEXT: bstrpick.d $a1, $a1, 31, 0 |
| ; LA64-NEXT: xor $a0, $a1, $a0 |
| ; LA64-NEXT: sltui $a0, $a0, 1 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i16 %cmp, i16 %val acquire acquire |
| %res = extractvalue { i16, i1 } %tmp, 1 |
| ret i1 %res |
| } |
| |
| ; i32 cmpxchg (acquire/acquire) that returns element 1 of the result pair, the i1 |
| ; success flag. The expected code is the plain ll.w/sc.w loop on $a0; after the loop, |
| ; the compare value goes through "addi.w ..., 0", is XORed with the loaded word ($a3), |
| ; and the result is tested for zero with sltui ..., 1. |
| define i1 @cmpxchg_i32_acquire_acquire_reti1(ptr %ptr, i32 %cmp, i32 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i32_acquire_acquire_reti1: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB10_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.w $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB10_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB10_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.w $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB10_1 |
| ; LA64-NEXT: b .LBB10_4 |
| ; LA64-NEXT: .LBB10_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB10_4: |
| ; LA64-NEXT: addi.w $a0, $a1, 0 |
| ; LA64-NEXT: xor $a0, $a3, $a0 |
| ; LA64-NEXT: sltui $a0, $a0, 1 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i32 %cmp, i32 %val acquire acquire |
| %res = extractvalue { i32, i1 } %tmp, 1 |
| ret i1 %res |
| } |
| |
| ; i64 cmpxchg (acquire/acquire) that returns element 1 of the result pair, the i1 |
| ; success flag. The expected code is the ll.d/sc.d loop on $a0; after the loop, the |
| ; loaded doubleword ($a3) is XORed with the compare value ($a1) and the result is |
| ; tested for zero with sltui ..., 1. |
| define i1 @cmpxchg_i64_acquire_acquire_reti1(ptr %ptr, i64 %cmp, i64 %val) nounwind { |
| ; LA64-LABEL: cmpxchg_i64_acquire_acquire_reti1: |
| ; LA64: # %bb.0: |
| ; LA64-NEXT: .LBB11_1: # =>This Inner Loop Header: Depth=1 |
| ; LA64-NEXT: ll.d $a3, $a0, 0 |
| ; LA64-NEXT: bne $a3, $a1, .LBB11_3 |
| ; LA64-NEXT: # %bb.2: # in Loop: Header=BB11_1 Depth=1 |
| ; LA64-NEXT: dbar 0 |
| ; LA64-NEXT: move $a4, $a2 |
| ; LA64-NEXT: sc.d $a4, $a0, 0 |
| ; LA64-NEXT: beqz $a4, .LBB11_1 |
| ; LA64-NEXT: b .LBB11_4 |
| ; LA64-NEXT: .LBB11_3: |
| ; LA64-NEXT: dbar 1792 |
| ; LA64-NEXT: .LBB11_4: |
| ; LA64-NEXT: xor $a0, $a3, $a1 |
| ; LA64-NEXT: sltui $a0, $a0, 1 |
| ; LA64-NEXT: ret |
| %tmp = cmpxchg ptr %ptr, i64 %cmp, i64 %val acquire acquire |
| %res = extractvalue { i64, i1 } %tmp, 1 |
| ret i1 %res |
| } |