; RUN: llc < %s -mtriple=ve-unknown-unknown | FileCheck %s

;;; Verifies the VE assembly produced for seq_cst atomicrmw instructions on
;;; 1-, 2-, 4- and 8-byte global variables. Every test applies the operation
;;; with the constant operand 1 and returns the value produced by atomicrmw.
;;; In all expected sequences the retry loop is a cas.w/cas.l followed by a
;;; brne back to the loop header, bracketed by "fencem 3" on both sides.

;;; One target global per access width; all are declared with align 4.
@c = common global i8 0, align 4
@s = common global i16 0, align 4
@i = common global i32 0, align 4
@l = common global i64 0, align 4

;;; add on the i8 global @c. The expected code operates on the containing
;;; word (address masked with -4, cas.w), merges the updated low 8 bits with
;;; the other bits of the loaded word, and finally shifts the result left and
;;; right by 56 for the signext i8 return.
define signext i8 @test_atomic_fetch_add_1() {
; CHECK-LABEL: test_atomic_fetch_add_1:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, c@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, c@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, -256
; CHECK-NEXT:    and %s1, %s1, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s2
; CHECK-NEXT:    adds.w.sx %s2, 1, %s2
; CHECK-NEXT:    and %s2, %s2, (56)0
; CHECK-NEXT:    and %s4, %s3, %s1
; CHECK-NEXT:    or %s2, %s4, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s3
; CHECK-NEXT:    brne.w %s2, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 56
; CHECK-NEXT:    sra.l %s0, %s0, 56
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw add i8* @c, i8 1 seq_cst
  ret i8 %old
}

;;; sub on the i16 global @s. Same word-sized cas.w loop as the i8 add test,
;;; with the subtraction expected as an add of -1 and a 16-bit wide merge
;;; (constant -65536, shifts by 48 at the end).
define signext i16 @test_atomic_fetch_sub_2() {
; CHECK-LABEL: test_atomic_fetch_sub_2:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, s@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, s@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, -65536
; CHECK-NEXT:    and %s1, %s1, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s2
; CHECK-NEXT:    adds.w.sx %s2, -1, %s2
; CHECK-NEXT:    and %s2, %s2, (48)0
; CHECK-NEXT:    and %s4, %s3, %s1
; CHECK-NEXT:    or %s2, %s4, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s3
; CHECK-NEXT:    brne.w %s2, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 48
; CHECK-NEXT:    sra.l %s0, %s0, 48
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw sub i16* @s, i16 1 seq_cst
  ret i16 %old
}

;;; and on the i32 global @i. The access is already word sized, so the
;;; expected loop is just copy / and / cas.w without any masking or merging.
define signext i32 @test_atomic_fetch_and_4() {
; CHECK-LABEL: test_atomic_fetch_and_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s1
; CHECK-NEXT:    and %s1, 1, %s2
; CHECK-NEXT:    cas.w %s1, (%s0), %s2
; CHECK-NEXT:    brne.w %s1, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw and i32* @i, i32 1 seq_cst
  ret i32 %old
}

;;; or on the i64 global @l. This is the only test expecting the 64-bit
;;; forms: ld for the initial load, cas.l and brne.l in the loop, and no
;;; extension of the result before returning.
define i64 @test_atomic_fetch_or_8() {
; CHECK-LABEL: test_atomic_fetch_or_8:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, l@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s1, l@hi(, %s0)
; CHECK-NEXT:    ld %s0, (, %s1)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s0
; CHECK-NEXT:    or %s0, 1, %s0
; CHECK-NEXT:    cas.l %s0, (%s1), %s2
; CHECK-NEXT:    brne.l %s0, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw or i64* @l, i64 1 seq_cst
  ret i64 %old
}

;;; xor on the i8 global @c. The expected loop still uses the word at the
;;; -4 masked address, but unlike the i8 add test it applies the xor
;;; directly to the loaded word with no separate mask-and-merge step.
define signext i8 @test_atomic_fetch_xor_1() {
; CHECK-LABEL: test_atomic_fetch_xor_1:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, c@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, c@hi(, %s0)
; CHECK-NEXT:    and %s1, -4, %s0
; CHECK-NEXT:    ldl.sx %s0, (, %s1)
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s2, 0, %s0
; CHECK-NEXT:    xor %s0, 1, %s2
; CHECK-NEXT:    cas.w %s0, (%s1), %s2
; CHECK-NEXT:    brne.w %s0, %s2, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s0, 56
; CHECK-NEXT:    sra.l %s0, %s0, 56
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw xor i8* @c, i8 1 seq_cst
  ret i8 %old
}

;;; nand on the i16 global @s. The expected loop inverts the loaded value
;;; (xor with -1), ors in the constant 65534, and then performs the same
;;; 16-bit merge into the containing word as the i16 sub test.
define signext i16 @test_atomic_fetch_nand_2() {
; CHECK-LABEL: test_atomic_fetch_nand_2:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, s@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, s@hi(, %s0)
; CHECK-NEXT:    and %s0, -4, %s0
; CHECK-NEXT:    ldl.sx %s2, (, %s0)
; CHECK-NEXT:    lea %s1, 65534
; CHECK-NEXT:    lea %s3, -65536
; CHECK-NEXT:    and %s3, %s3, (32)0
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s4, 0, %s2
; CHECK-NEXT:    xor %s2, -1, %s4
; CHECK-NEXT:    or %s2, %s2, %s1
; CHECK-NEXT:    and %s2, %s2, (48)0
; CHECK-NEXT:    and %s5, %s4, %s3
; CHECK-NEXT:    or %s2, %s5, %s2
; CHECK-NEXT:    cas.w %s2, (%s0), %s4
; CHECK-NEXT:    brne.w %s2, %s4, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    sll %s0, %s2, 48
; CHECK-NEXT:    sra.l %s0, %s0, 48
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw nand i16* @s, i16 1 seq_cst
  ret i16 %old
}

;;; Signed max on the i32 global @i. The new value is expected to come from
;;; a single maxs.w.sx against a register preloaded with 1.
define signext i32 @test_atomic_fetch_max_4() {
; CHECK-LABEL: test_atomic_fetch_max_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s1, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s0, (, %s1)
; CHECK-NEXT:    or %s2, 1, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s0
; CHECK-NEXT:    maxs.w.sx %s0, %s0, %s2
; CHECK-NEXT:    cas.w %s0, (%s1), %s3
; CHECK-NEXT:    brne.w %s0, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s0, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw max i32* @i, i32 1 seq_cst
  ret i32 %old
}

;;; Signed min on the i32 global @i. The expected selection is a signed
;;; compare (cmps.w.sx) against 2 followed by cmov.w.lt, which keeps the
;;; loaded value when the compare is "less than" and otherwise leaves 1.
define signext i32 @test_atomic_fetch_min_4() {
; CHECK-LABEL: test_atomic_fetch_min_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 2, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmps.w.sx %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.lt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw min i32* @i, i32 1 seq_cst
  ret i32 %old
}

;;; Unsigned max on the i32 global @i. The expected selection is an unsigned
;;; compare (cmpu.w) against 1 followed by cmov.w.gt.
define signext i32 @test_atomic_fetch_umax_4() {
; CHECK-LABEL: test_atomic_fetch_umax_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 1, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmpu.w %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.gt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw umax i32* @i, i32 1 seq_cst
  ret i32 %old
}

;;; Unsigned min on the i32 global @i. Same shape as the signed min test,
;;; but with the unsigned compare cmpu.w (against 2) feeding cmov.w.lt.
define signext i32 @test_atomic_fetch_umin_4() {
; CHECK-LABEL: test_atomic_fetch_umin_4:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    lea %s0, i@lo
; CHECK-NEXT:    and %s0, %s0, (32)0
; CHECK-NEXT:    lea.sl %s0, i@hi(, %s0)
; CHECK-NEXT:    ldl.sx %s1, (, %s0)
; CHECK-NEXT:    or %s2, 2, (0)1
; CHECK-NEXT:  .LBB{{[0-9]+}}_1: # %atomicrmw.start
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    or %s3, 0, %s1
; CHECK-NEXT:    cmpu.w %s4, %s1, %s2
; CHECK-NEXT:    or %s1, 1, (0)1
; CHECK-NEXT:    cmov.w.lt %s1, %s3, %s4
; CHECK-NEXT:    cas.w %s1, (%s0), %s3
; CHECK-NEXT:    brne.w %s1, %s3, .LBB{{[0-9]+}}_1
; CHECK-NEXT:  # %bb.2: # %atomicrmw.end
; CHECK-NEXT:    adds.w.sx %s0, %s1, (0)1
; CHECK-NEXT:    fencem 3
; CHECK-NEXT:    b.l.t (, %s10)
entry:
  %old = atomicrmw umin i32* @i, i32 1 seq_cst
  ret i32 %old
}