; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt < %s -instcombine -S | FileCheck %s define void @test1(i32* %P) { ; CHECK-LABEL: @test1( ; CHECK-NEXT: store i32 123, i32* undef, align 4 ; CHECK-NEXT: store i32 undef, i32* null, align 536870912 ; CHECK-NEXT: ret void ; store i32 undef, i32* %P store i32 123, i32* undef store i32 124, i32* null ret void } define void @test2(i32* %P) { ; CHECK-LABEL: @test2( ; CHECK-NEXT: ret void ; %X = load i32, i32* %P %Y = add i32 %X, 0 store i32 %Y, i32* %P ret void } define void @store_at_gep_off_null_inbounds(i64 %offset) { ; CHECK-LABEL: @store_at_gep_off_null_inbounds( ; CHECK-NEXT: [[PTR:%.*]] = getelementptr inbounds i32, i32* null, i64 [[OFFSET:%.*]] ; CHECK-NEXT: store i32 undef, i32* [[PTR]], align 4 ; CHECK-NEXT: ret void ; %ptr = getelementptr inbounds i32, i32 *null, i64 %offset store i32 24, i32* %ptr ret void } define void @store_at_gep_off_null_not_inbounds(i64 %offset) { ; CHECK-LABEL: @store_at_gep_off_null_not_inbounds( ; CHECK-NEXT: [[PTR:%.*]] = getelementptr i32, i32* null, i64 [[OFFSET:%.*]] ; CHECK-NEXT: store i32 undef, i32* [[PTR]], align 4 ; CHECK-NEXT: ret void ; %ptr = getelementptr i32, i32 *null, i64 %offset store i32 24, i32* %ptr ret void } define void @store_at_gep_off_no_null_opt(i64 %offset) #0 { ; CHECK-LABEL: @store_at_gep_off_no_null_opt( ; CHECK-NEXT: [[PTR:%.*]] = getelementptr inbounds i32, i32* null, i64 [[OFFSET:%.*]] ; CHECK-NEXT: store i32 24, i32* [[PTR]], align 4 ; CHECK-NEXT: ret void ; %ptr = getelementptr inbounds i32, i32 *null, i64 %offset store i32 24, i32* %ptr ret void } attributes #0 = { null_pointer_is_valid } ;; Simple sinking tests ; "if then else" define i32 @test3(i1 %C) { ; CHECK-LABEL: @test3( ; CHECK-NEXT: br i1 [[C:%.*]], label [[COND:%.*]], label [[COND2:%.*]] ; CHECK: Cond: ; CHECK-NEXT: br label [[CONT:%.*]] ; CHECK: Cond2: ; CHECK-NEXT: br label [[CONT]] ; CHECK: Cont: ; CHECK-NEXT: [[STOREMERGE:%.*]] = phi i32 [ 47, [[COND2]] ], [ -987654321, [[COND]] ] ; CHECK-NEXT: ret i32 [[STOREMERGE]] ; %A = alloca i32 br i1 %C, label %Cond, label %Cond2 Cond: store i32 -987654321, i32* %A br label %Cont Cond2: store i32 47, i32* %A br label %Cont Cont: %V = load i32, i32* %A ret i32 %V } ; "if then" define i32 @test4(i1 %C) { ; CHECK-LABEL: @test4( ; CHECK-NEXT: br i1 [[C:%.*]], label [[COND:%.*]], label [[CONT:%.*]] ; CHECK: Cond: ; CHECK-NEXT: br label [[CONT]] ; CHECK: Cont: ; CHECK-NEXT: [[STOREMERGE:%.*]] = phi i32 [ -987654321, [[COND]] ], [ 47, [[TMP0:%.*]] ] ; CHECK-NEXT: ret i32 [[STOREMERGE]] ; %A = alloca i32 store i32 47, i32* %A br i1 %C, label %Cond, label %Cont Cond: store i32 -987654321, i32* %A br label %Cont Cont: %V = load i32, i32* %A ret i32 %V } ; "if then" define void @test5(i1 %C, i32* %P) { ; CHECK-LABEL: @test5( ; CHECK-NEXT: br i1 [[C:%.*]], label [[COND:%.*]], label [[CONT:%.*]] ; CHECK: Cond: ; CHECK-NEXT: br label [[CONT]] ; CHECK: Cont: ; CHECK-NEXT: [[STOREMERGE:%.*]] = phi i32 [ -987654321, [[COND]] ], [ 47, [[TMP0:%.*]] ] ; CHECK-NEXT: store i32 [[STOREMERGE]], i32* [[P:%.*]], align 1 ; CHECK-NEXT: ret void ; store i32 47, i32* %P, align 1 br i1 %C, label %Cond, label %Cont Cond: store i32 -987654321, i32* %P, align 1 br label %Cont Cont: ret void } ; PR14753 - merging two stores should preserve the TBAA tag. define void @test6(i32 %n, float* %a, i32* %gi) nounwind uwtable ssp { ; CHECK-LABEL: @test6( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR_COND:%.*]] ; CHECK: for.cond: ; CHECK-NEXT: [[STOREMERGE:%.*]] = phi i32 [ 42, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[FOR_BODY:%.*]] ] ; CHECK-NEXT: store i32 [[STOREMERGE]], i32* [[GI:%.*]], align 4, [[TBAA0:!tbaa !.*]] ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[STOREMERGE]], [[N:%.*]] ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_END:%.*]] ; CHECK: for.body: ; CHECK-NEXT: [[IDXPROM:%.*]] = sext i32 [[STOREMERGE]] to i64 ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds float, float* [[A:%.*]], i64 [[IDXPROM]] ; CHECK-NEXT: store float 0.000000e+00, float* [[ARRAYIDX]], align 4, [[TBAA4:!tbaa !.*]] ; CHECK-NEXT: [[TMP0:%.*]] = load i32, i32* [[GI]], align 4, [[TBAA0]] ; CHECK-NEXT: [[INC]] = add nsw i32 [[TMP0]], 1 ; CHECK-NEXT: br label [[FOR_COND]] ; CHECK: for.end: ; CHECK-NEXT: ret void ; entry: store i32 42, i32* %gi, align 4, !tbaa !0 br label %for.cond for.cond: %storemerge = phi i32 [ 0, %entry ], [ %inc, %for.body ] %0 = load i32, i32* %gi, align 4, !tbaa !0 %cmp = icmp slt i32 %0, %n br i1 %cmp, label %for.body, label %for.end for.body: %idxprom = sext i32 %0 to i64 %arrayidx = getelementptr inbounds float, float* %a, i64 %idxprom store float 0.000000e+00, float* %arrayidx, align 4, !tbaa !3 %1 = load i32, i32* %gi, align 4, !tbaa !0 %inc = add nsw i32 %1, 1 store i32 %inc, i32* %gi, align 4, !tbaa !0 br label %for.cond for.end: ret void } define void @dse1(i32* %p) { ; CHECK-LABEL: @dse1( ; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4 ; CHECK-NEXT: ret void ; store i32 0, i32* %p store i32 0, i32* %p ret void } ; Slightly subtle: if we're mixing atomic and non-atomic access to the ; same location, then the contents of the location are undefined if there's ; an actual race. As such, we're free to pick either store under the ; assumption that we're not racing with any other thread. define void @dse2(i32* %p) { ; CHECK-LABEL: @dse2( ; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4 ; CHECK-NEXT: ret void ; store atomic i32 0, i32* %p unordered, align 4 store i32 0, i32* %p ret void } define void @dse3(i32* %p) { ; CHECK-LABEL: @dse3( ; CHECK-NEXT: store atomic i32 0, i32* [[P:%.*]] unordered, align 4 ; CHECK-NEXT: ret void ; store i32 0, i32* %p store atomic i32 0, i32* %p unordered, align 4 ret void } define void @dse4(i32* %p) { ; CHECK-LABEL: @dse4( ; CHECK-NEXT: store atomic i32 0, i32* [[P:%.*]] unordered, align 4 ; CHECK-NEXT: ret void ; store atomic i32 0, i32* %p unordered, align 4 store atomic i32 0, i32* %p unordered, align 4 ret void } ; Implementation limit - could remove unordered store here, but ; currently don't. define void @dse5(i32* %p) { ; CHECK-LABEL: @dse5( ; CHECK-NEXT: store atomic i32 0, i32* [[P:%.*]] unordered, align 4 ; CHECK-NEXT: store atomic i32 0, i32* [[P]] seq_cst, align 4 ; CHECK-NEXT: ret void ; store atomic i32 0, i32* %p unordered, align 4 store atomic i32 0, i32* %p seq_cst, align 4 ret void } define void @write_back1(i32* %p) { ; CHECK-LABEL: @write_back1( ; CHECK-NEXT: ret void ; %v = load i32, i32* %p store i32 %v, i32* %p ret void } define void @write_back2(i32* %p) { ; CHECK-LABEL: @write_back2( ; CHECK-NEXT: ret void ; %v = load atomic i32, i32* %p unordered, align 4 store i32 %v, i32* %p ret void } define void @write_back3(i32* %p) { ; CHECK-LABEL: @write_back3( ; CHECK-NEXT: ret void ; %v = load i32, i32* %p store atomic i32 %v, i32* %p unordered, align 4 ret void } define void @write_back4(i32* %p) { ; CHECK-LABEL: @write_back4( ; CHECK-NEXT: ret void ; %v = load atomic i32, i32* %p unordered, align 4 store atomic i32 %v, i32* %p unordered, align 4 ret void } ; Can't remove store due to ordering side effect define void @write_back5(i32* %p) { ; CHECK-LABEL: @write_back5( ; CHECK-NEXT: [[V:%.*]] = load atomic i32, i32* [[P:%.*]] unordered, align 4 ; CHECK-NEXT: store atomic i32 [[V]], i32* [[P]] seq_cst, align 4 ; CHECK-NEXT: ret void ; %v = load atomic i32, i32* %p unordered, align 4 store atomic i32 %v, i32* %p seq_cst, align 4 ret void } define void @write_back6(i32* %p) { ; CHECK-LABEL: @write_back6( ; CHECK-NEXT: [[V:%.*]] = load atomic i32, i32* [[P:%.*]] seq_cst, align 4 ; CHECK-NEXT: ret void ; %v = load atomic i32, i32* %p seq_cst, align 4 store atomic i32 %v, i32* %p unordered, align 4 ret void } define void @write_back7(i32* %p) { ; CHECK-LABEL: @write_back7( ; CHECK-NEXT: [[V:%.*]] = load atomic volatile i32, i32* [[P:%.*]] seq_cst, align 4 ; CHECK-NEXT: ret void ; %v = load atomic volatile i32, i32* %p seq_cst, align 4 store atomic i32 %v, i32* %p unordered, align 4 ret void } @Unknown = external constant i32 define void @store_to_constant() { ; CHECK-LABEL: @store_to_constant( ; CHECK-NEXT: ret void ; store i32 0, i32* @Unknown ret void } !0 = !{!4, !4, i64 0} !1 = !{!"omnipotent char", !2} !2 = !{!"Simple C/C++ TBAA"} !3 = !{!"float", !1} !4 = !{!"int", !1}