; blob: 46c0f8f9588774c619610fc8406d7c42dc562db5 [file] [log] [blame]
; RUN: llc < %s -mtriple=ve-unknown-unknown | FileCheck %s
;;; Test atomicrmw operations
; Zero-initialized common globals, one per integer width (i8, i16, i32, i64),
; used as the memory operands of the atomicrmw instructions in the functions
; below. All four are declared with 4-byte alignment.
; NOTE(review): @l is an i64 declared with only 4-byte alignment - confirm
; that this is intended for the 8-byte atomic test.
@c = common global i8 0, align 4
@s = common global i16 0, align 4
@i = common global i32 0, align 4
@l = common global i64 0, align 4
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-add of 1 on the i8 global @c; the value
; held before the update is returned sign-extended.
; Expected assembly: the address of @c is masked with -4 and the operation is
; carried out on that word with a cas.w retry loop. Inside the loop the
; incremented value is masked with (56)0 and merged with the bits of the
; previously loaded word selected by the -256 mask. The result is then
; sign-extended with an sll/sra.l pair by 56, and the whole sequence is
; bracketed by "fencem 3".
define signext i8 @test_atomic_fetch_add_1() {
; CHECK-LABEL: test_atomic_fetch_add_1:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, c@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, c@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, -256
; CHECK-NEXT:    and %s1, %s1, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s2
; CHECK-NEXT:    adds.w.sx %s2, 1, %s2
; CHECK-NEXT:    and %s2, %s2, (56)0
; CHECK-NEXT:    and %s4, %s3, %s1
; CHECK-NEXT:    or %s2, %s4, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s3
; CHECK-NEXT:    brne.w %s2, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 56
; CHECK-NEXT:    sra.l %s0, %s0, 56
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw add i8* @c, i8 1 seq_cst
  ret i8 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-subtract of 1 on the i16 global @s; the
; value held before the update is returned sign-extended.
; Expected assembly: the address of @s is masked with -4 and the update runs
; as a cas.w retry loop on that word. The subtraction appears as an
; adds.w.sx with -1, the result is masked with (48)0 and merged with the
; bits of the previously loaded word selected by the -65536 mask. The return
; value is sign-extended with an sll/sra.l pair by 48.
define signext i16 @test_atomic_fetch_sub_2() {
; CHECK-LABEL: test_atomic_fetch_sub_2:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, s@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, s@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, -65536
; CHECK-NEXT:    and %s1, %s1, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s2
; CHECK-NEXT:    adds.w.sx %s2, -1, %s2
; CHECK-NEXT:    and %s2, %s2, (48)0
; CHECK-NEXT:    and %s4, %s3, %s1
; CHECK-NEXT:    or %s2, %s4, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s3
; CHECK-NEXT:    brne.w %s2, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 48
; CHECK-NEXT:    sra.l %s0, %s0, 48
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw sub i16* @s, i16 1 seq_cst
  ret i16 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-AND with 1 on the i32 global @i; the
; value held before the update is returned sign-extended.
; Expected assembly: the word at @i is loaded with ldl.sx and updated by a
; cas.w retry loop whose body is a single "and" with the immediate 1. No
; address masking or sub-word merge is expected here. The sequence is
; bracketed by "fencem 3".
define signext i32 @test_atomic_fetch_and_4() {
; CHECK-LABEL: test_atomic_fetch_and_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s1
; CHECK-NEXT:    and %s1, 1, %s2
; CHECK-NEXT:    cas.w %s1, (%s0), %s2
; CHECK-NEXT:    brne.w %s1, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw and i32* @i, i32 1 seq_cst
  ret i32 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-OR with 1 on the i64 global @l; the value
; held before the update is returned (no extension attribute on the return).
; Expected assembly: the 64-bit forms are used throughout - an "ld" load,
; a cas.l compare-and-swap and a brne.l back-edge - with a single "or" with
; the immediate 1 as the loop body, bracketed by "fencem 3".
define i64 @test_atomic_fetch_or_8() {
; CHECK-LABEL: test_atomic_fetch_or_8:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, l@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s1, l@hi(, %s0)
; CHECK-NEXT:    ld %s0, (, %s1)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s0
; CHECK-NEXT:    or %s0, 1, %s0
; CHECK-NEXT:    cas.l %s0, (%s1), %s2
; CHECK-NEXT:    brne.l %s0, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw or i64* @l, i64 1 seq_cst
  ret i64 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-XOR with 1 on the i8 global @c; the value
; held before the update is returned sign-extended.
; Expected assembly: the address of @c is masked with -4 and the update runs
; as a cas.w retry loop on that word. The loop body is a single "xor" with
; the immediate 1 applied to the loaded word; no separate byte mask/merge
; step is expected. The return value is sign-extended with an sll/sra.l pair
; by 56.
define signext i8 @test_atomic_fetch_xor_1() {
; CHECK-LABEL: test_atomic_fetch_xor_1:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, c@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, c@hi(, %s0)
; CHECK-NEXT:    and %s1, -4, %s0
; CHECK-NEXT:    ldl.sx %s0, (, %s1)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s0
; CHECK-NEXT:    xor %s0, 1, %s2
; CHECK-NEXT:    cas.w %s0, (%s1), %s2
; CHECK-NEXT:    brne.w %s0, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s0, 56
; CHECK-NEXT:    sra.l %s0, %s0, 56
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw xor i8* @c, i8 1 seq_cst
  ret i8 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent fetch-and-NAND with 1 on the i16 global @s; the
; value held before the update is returned sign-extended.
; Expected assembly: the address of @s is masked with -4 and the update runs
; as a cas.w retry loop on that word. The NAND appears as an "xor" with -1
; followed by an "or" with 65534; the result is masked with (48)0 and merged
; with the bits of the previously loaded word selected by the -65536 mask.
; The return value is sign-extended with an sll/sra.l pair by 48.
define signext i16 @test_atomic_fetch_nand_2() {
; CHECK-LABEL: test_atomic_fetch_nand_2:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, s@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, s@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, 65534
; CHECK-NEXT:    lea %s3, -65536
; CHECK-NEXT:    and %s3, %s3, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s4, 0, %s2
; CHECK-NEXT:    xor %s2, -1, %s4
; CHECK-NEXT:    or %s2, %s2, %s1
; CHECK-NEXT:    and %s2, %s2, (48)0
; CHECK-NEXT:    and %s5, %s4, %s3
; CHECK-NEXT:    or %s2, %s5, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s4
; CHECK-NEXT:    brne.w %s2, %s4, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 48
; CHECK-NEXT:    sra.l %s0, %s0, 48
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw nand i16* @s, i16 1 seq_cst
  ret i16 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent signed fetch-and-max against 1 on the i32 global
; @i; the value held before the update is returned sign-extended.
; Expected assembly: the constant 1 is materialized into a register before
; the loop, and the loop body is a single maxs.w.sx followed by the cas.w /
; brne.w retry, bracketed by "fencem 3".
define signext i32 @test_atomic_fetch_max_4() {
; CHECK-LABEL: test_atomic_fetch_max_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s1, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s0, (, %s1)
; CHECK-NEXT:    or %s2, 1, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s0
; CHECK-NEXT:    maxs.w.sx %s0, %s0, %s2
; CHECK-NEXT:    cas.w %s0, (%s1), %s3
; CHECK-NEXT:    brne.w %s0, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s0, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw max i32* @i, i32 1 seq_cst
  ret i32 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent signed fetch-and-min against 1 on the i32 global
; @i; the value held before the update is returned sign-extended.
; Expected assembly: the loaded value is compared against 2 with cmps.w.sx,
; the candidate result is set to 1, and cmov.w.lt replaces it with the loaded
; value based on that comparison. The cas.w / brne.w pair retries the
; update, and the sequence is bracketed by "fencem 3".
define signext i32 @test_atomic_fetch_min_4() {
; CHECK-LABEL: test_atomic_fetch_min_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 2, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmps.w.sx %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.lt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw min i32* @i, i32 1 seq_cst
  ret i32 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent unsigned fetch-and-max against 1 on the i32 global
; @i; the value held before the update is returned sign-extended.
; Expected assembly: the loaded value is compared against 1 with the
; unsigned cmpu.w, the candidate result is set to 1, and cmov.w.gt replaces
; it with the loaded value based on that comparison. The cas.w / brne.w
; pair retries the update, and the sequence is bracketed by "fencem 3".
define signext i32 @test_atomic_fetch_umax_4() {
; CHECK-LABEL: test_atomic_fetch_umax_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 1, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmpu.w %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.gt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw umax i32* @i, i32 1 seq_cst
  ret i32 %old
}
; Function Attrs: norecurse nounwind
; Sequentially consistent unsigned fetch-and-min against 1 on the i32 global
; @i; the value held before the update is returned sign-extended.
; Expected assembly: the loaded value is compared against 2 with the
; unsigned cmpu.w, the candidate result is set to 1, and cmov.w.lt replaces
; it with the loaded value based on that comparison. The cas.w / brne.w
; pair retries the update, and the sequence is bracketed by "fencem 3".
define signext i32 @test_atomic_fetch_umin_4() {
; CHECK-LABEL: test_atomic_fetch_umin_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 2, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmpu.w %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.lt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw umin i32* @i, i32 1 seq_cst
  ret i32 %old
}