; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt < %s -basic-aa -dse -S | FileCheck %s target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64" declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind define void @test13(i32* noalias %P) { ; CHECK-LABEL: @test13( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR:%.*]] ; CHECK: for: ; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4 ; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]] ; CHECK: end: ; CHECK-NEXT: ret void ; entry: br label %for for: store i32 0, i32* %P br i1 false, label %for, label %end end: ret void } define void @test14(i32* noalias %P) { ; CHECK-LABEL: @test14( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR:%.*]] ; CHECK: for: ; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4 ; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]] ; CHECK: end: ; CHECK-NEXT: ret void ; entry: store i32 1, i32* %P br label %for for: store i32 0, i32* %P br i1 false, label %for, label %end end: ret void } define void @test18(i32* noalias %P) { ; CHECK-LABEL: @test18( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[P2:%.*]] = bitcast i32* [[P:%.*]] to i8* ; CHECK-NEXT: store i32 0, i32* [[P]], align 4 ; CHECK-NEXT: br label [[FOR:%.*]] ; CHECK: for: ; CHECK-NEXT: store i8 1, i8* [[P2]], align 1 ; CHECK-NEXT: [[X:%.*]] = load i32, i32* [[P]], align 4 ; CHECK-NEXT: store i8 2, i8* [[P2]], align 1 ; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]] ; CHECK: end: ; CHECK-NEXT: ret void ; entry: %P2 = bitcast i32* %P to i8* store i32 0, i32* %P br label %for for: store i8 1, i8* %P2 %x = load i32, i32* %P store i8 2, i8* %P2 br i1 false, label %for, label %end end: ret void } define void @test21(i32* noalias %P) { ; CHECK-LABEL: @test21( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[ARRAYIDX0:%.*]] = getelementptr inbounds i32, i32* [[P:%.*]], i64 1 ; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[ARRAYIDX0]] to i8* ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds i8, i8* [[P3]], i64 4 ; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 4 [[TMP0]], i8 0, i64 24, i1 false) ; CHECK-NEXT: br label [[FOR:%.*]] ; CHECK: for: ; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 1 ; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4 ; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]] ; CHECK: end: ; CHECK-NEXT: ret void ; entry: %arrayidx0 = getelementptr inbounds i32, i32* %P, i64 1 %p3 = bitcast i32* %arrayidx0 to i8* call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 28, i32 4, i1 false) br label %for for: %arrayidx1 = getelementptr inbounds i32, i32* %P, i64 1 store i32 1, i32* %arrayidx1, align 4 br i1 false, label %for, label %end end: ret void } define void @test_loop(i32 %N, i32* noalias nocapture readonly %A, i32* noalias nocapture readonly %x, i32* noalias nocapture %b) local_unnamed_addr { ; CHECK-LABEL: @test_loop( ; CHECK-NEXT: entry: ; CHECK-NEXT: [[CMP27:%.*]] = icmp sgt i32 [[N:%.*]], 0 ; CHECK-NEXT: br i1 [[CMP27]], label [[FOR_BODY4_LR_PH_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]] ; CHECK: for.body4.lr.ph.preheader: ; CHECK-NEXT: br label [[FOR_BODY4_LR_PH:%.*]] ; CHECK: for.cond.cleanup: ; CHECK-NEXT: ret void ; CHECK: for.body4.lr.ph: ; CHECK-NEXT: [[I_028:%.*]] = phi i32 [ [[INC11:%.*]], [[FOR_COND_CLEANUP3:%.*]] ], [ 0, [[FOR_BODY4_LR_PH_PREHEADER]] ] ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[B:%.*]], i32 [[I_028]] ; CHECK-NEXT: store i32 0, i32* [[ARRAYIDX]], align 4 ; CHECK-NEXT: [[MUL:%.*]] = mul nsw i32 [[I_028]], [[N]] ; CHECK-NEXT: br label [[FOR_BODY4:%.*]] ; CHECK: for.body4: ; CHECK-NEXT: [[TMP0:%.*]] = phi i32 [ 0, [[FOR_BODY4_LR_PH]] ], [ [[ADD9:%.*]], [[FOR_BODY4]] ] ; CHECK-NEXT: [[J_026:%.*]] = phi i32 [ 0, [[FOR_BODY4_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY4]] ] ; CHECK-NEXT: [[ADD:%.*]] = add nsw i32 [[J_026]], [[MUL]] ; CHECK-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i32, i32* [[A:%.*]], i32 [[ADD]] ; CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4 ; CHECK-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[X:%.*]], i32 [[J_026]] ; CHECK-NEXT: [[TMP2:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 ; CHECK-NEXT: [[MUL7:%.*]] = mul nsw i32 [[TMP2]], [[TMP1]] ; CHECK-NEXT: [[ADD9]] = add nsw i32 [[MUL7]], [[TMP0]] ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[J_026]], 1 ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N]] ; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_COND_CLEANUP3]], label [[FOR_BODY4]] ; CHECK: for.cond.cleanup3: ; CHECK-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX]], align 4 ; CHECK-NEXT: [[INC11]] = add nuw nsw i32 [[I_028]], 1 ; CHECK-NEXT: [[EXITCOND29:%.*]] = icmp eq i32 [[INC11]], [[N]] ; CHECK-NEXT: br i1 [[EXITCOND29]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY4_LR_PH]] ; entry: %cmp27 = icmp sgt i32 %N, 0 br i1 %cmp27, label %for.body4.lr.ph.preheader, label %for.cond.cleanup for.body4.lr.ph.preheader: ; preds = %entry br label %for.body4.lr.ph for.cond.cleanup: ; preds = %for.cond.cleanup3, %entry ret void for.body4.lr.ph: ; preds = %for.body4.lr.ph.preheader, %for.cond.cleanup3 %i.028 = phi i32 [ %inc11, %for.cond.cleanup3 ], [ 0, %for.body4.lr.ph.preheader ] %arrayidx = getelementptr inbounds i32, i32* %b, i32 %i.028 store i32 0, i32* %arrayidx, align 4 %mul = mul nsw i32 %i.028, %N br label %for.body4 for.body4: ; preds = %for.body4, %for.body4.lr.ph %0 = phi i32 [ 0, %for.body4.lr.ph ], [ %add9, %for.body4 ] %j.026 = phi i32 [ 0, %for.body4.lr.ph ], [ %inc, %for.body4 ] %add = add nsw i32 %j.026, %mul %arrayidx5 = getelementptr inbounds i32, i32* %A, i32 %add %1 = load i32, i32* %arrayidx5, align 4 %arrayidx6 = getelementptr inbounds i32, i32* %x, i32 %j.026 %2 = load i32, i32* %arrayidx6, align 4 %mul7 = mul nsw i32 %2, %1 %add9 = add nsw i32 %mul7, %0 %inc = add nuw nsw i32 %j.026, 1 %exitcond = icmp eq i32 %inc, %N br i1 %exitcond, label %for.cond.cleanup3, label %for.body4 for.cond.cleanup3: ; preds = %for.body4 store i32 %add9, i32* %arrayidx, align 4 %inc11 = add nuw nsw i32 %i.028, 1 %exitcond29 = icmp eq i32 %inc11, %N br i1 %exitcond29, label %for.cond.cleanup, label %for.body4.lr.ph } declare i1 @cond() readnone ; TODO: We can eliminate the store in for.header, but we currently hit a MemoryPhi. define void @loop_multiple_def_uses(i32* noalias %P) { ; CHECK-LABEL: @loop_multiple_def_uses( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR_HEADER:%.*]] ; CHECK: for.header: ; CHECK-NEXT: store i32 1, i32* [[P:%.*]], align 4 ; CHECK-NEXT: [[C1:%.*]] = call i1 @cond() ; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]] ; CHECK: for.body: ; CHECK-NEXT: store i32 2, i32* [[P]], align 4 ; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4 ; CHECK-NEXT: br label [[FOR_HEADER]] ; CHECK: end: ; CHECK-NEXT: store i32 3, i32* [[P]], align 4 ; CHECK-NEXT: ret void ; entry: br label %for.header for.header: store i32 1, i32* %P, align 4 %c1 = call i1 @cond() br i1 %c1, label %for.body, label %end for.body: store i32 2, i32* %P, align 4 %lv = load i32, i32* %P br label %for.header end: store i32 3, i32* %P, align 4 ret void } ; We cannot eliminate the store in for.header, as it is only partially ; overwritten in for.body and read afterwards. define void @loop_multiple_def_uses_partial_write(i32* noalias %p) { ; CHECK-LABEL: @loop_multiple_def_uses_partial_write( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR_HEADER:%.*]] ; CHECK: for.header: ; CHECK-NEXT: store i32 1239491, i32* [[P:%.*]], align 4 ; CHECK-NEXT: [[C1:%.*]] = call i1 @cond() ; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]] ; CHECK: for.body: ; CHECK-NEXT: [[C:%.*]] = bitcast i32* [[P]] to i8* ; CHECK-NEXT: store i8 1, i8* [[C]], align 4 ; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4 ; CHECK-NEXT: br label [[FOR_HEADER]] ; CHECK: end: ; CHECK-NEXT: store i32 3, i32* [[P]], align 4 ; CHECK-NEXT: ret void ; entry: br label %for.header for.header: store i32 1239491, i32* %p, align 4 %c1 = call i1 @cond() br i1 %c1, label %for.body, label %end for.body: %c = bitcast i32* %p to i8* store i8 1, i8* %c, align 4 %lv = load i32, i32* %p br label %for.header end: store i32 3, i32* %p, align 4 ret void } ; We cannot eliminate the store in for.header, as the location is not overwritten ; in for.body and read afterwards. define void @loop_multiple_def_uses_mayalias_write(i32* %p, i32* %q) { ; CHECK-LABEL: @loop_multiple_def_uses_mayalias_write( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[FOR_HEADER:%.*]] ; CHECK: for.header: ; CHECK-NEXT: store i32 1239491, i32* [[P:%.*]], align 4 ; CHECK-NEXT: [[C1:%.*]] = call i1 @cond() ; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]] ; CHECK: for.body: ; CHECK-NEXT: store i32 1, i32* [[Q:%.*]], align 4 ; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4 ; CHECK-NEXT: br label [[FOR_HEADER]] ; CHECK: end: ; CHECK-NEXT: store i32 3, i32* [[P]], align 4 ; CHECK-NEXT: ret void ; entry: br label %for.header for.header: store i32 1239491, i32* %p, align 4 %c1 = call i1 @cond() br i1 %c1, label %for.body, label %end for.body: store i32 1, i32* %q, align 4 %lv = load i32, i32* %p br label %for.header end: store i32 3, i32* %p, align 4 ret void } %struct.hoge = type { i32, i32 } @global = external local_unnamed_addr global %struct.hoge*, align 8 define void @widget(i8* %tmp) { ; CHECK-LABEL: @widget( ; CHECK-NEXT: bb: ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 [[TMP:%.*]], i8* nonnull align 16 undef, i64 64, i1 false) ; CHECK-NEXT: br label [[BB1:%.*]] ; CHECK: bb1: ; CHECK-NEXT: [[TMP2:%.*]] = load %struct.hoge*, %struct.hoge** @global, align 8 ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[STRUCT_HOGE:%.*]], %struct.hoge* [[TMP2]], i64 undef, i32 1 ; CHECK-NEXT: store i32 0, i32* [[TMP3]], align 4 ; CHECK-NEXT: [[TMP4:%.*]] = load %struct.hoge*, %struct.hoge** @global, align 8 ; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds [[STRUCT_HOGE]], %struct.hoge* [[TMP4]], i64 undef, i32 1 ; CHECK-NEXT: store i32 10, i32* [[TMP5]], align 4 ; CHECK-NEXT: br label [[BB1]] ; bb: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %tmp, i8* nonnull align 16 undef, i64 64, i1 false) br label %bb1 bb1: ; preds = %bb1, %bb %tmp2 = load %struct.hoge*, %struct.hoge** @global, align 8 %tmp3 = getelementptr inbounds %struct.hoge, %struct.hoge* %tmp2, i64 undef, i32 1 store i32 0, i32* %tmp3, align 4 %tmp4 = load %struct.hoge*, %struct.hoge** @global, align 8 %tmp5 = getelementptr inbounds %struct.hoge, %struct.hoge* %tmp4, i64 undef, i32 1 store i32 10, i32* %tmp5, align 4 br label %bb1 } declare void @llvm.memcpy.p0i8.p0i8.i64(i8* noalias nocapture writeonly, i8* noalias nocapture readonly, i64, i1 immarg) @x = global [10 x i16] zeroinitializer, align 1 ; Make sure we do not eliminate the store in %do.body, because it writes to ; multiple locations in the loop and the store in %if.end10 only stores to ; the last one. define i16 @test_loop_carried_dep() { ; CHECK-LABEL: @test_loop_carried_dep( ; CHECK-NEXT: entry: ; CHECK-NEXT: br label [[DO_BODY:%.*]] ; CHECK: do.body: ; CHECK-NEXT: [[I_0:%.*]] = phi i16 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[IF_END:%.*]] ] ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [10 x i16], [10 x i16]* @x, i16 0, i16 [[I_0]] ; CHECK-NEXT: store i16 2, i16* [[ARRAYIDX2]], align 1 ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i16 [[I_0]], 4 ; CHECK-NEXT: br i1 [[EXITCOND]], label [[IF_END10:%.*]], label [[IF_END]] ; CHECK: if.end: ; CHECK-NEXT: [[INC]] = add nuw nsw i16 [[I_0]], 1 ; CHECK-NEXT: br label [[DO_BODY]] ; CHECK: if.end10: ; CHECK-NEXT: store i16 1, i16* [[ARRAYIDX2]], align 1 ; CHECK-NEXT: ret i16 0 ; entry: br label %do.body do.body: ; preds = %if.end, %entry %i.0 = phi i16 [ 0, %entry ], [ %inc, %if.end ] %arrayidx2 = getelementptr inbounds [10 x i16], [10 x i16]* @x, i16 0, i16 %i.0 store i16 2, i16* %arrayidx2, align 1 %exitcond = icmp eq i16 %i.0, 4 br i1 %exitcond, label %if.end10, label %if.end if.end: ; preds = %do.body %inc = add nuw nsw i16 %i.0, 1 br label %do.body if.end10: ; preds = %do.body store i16 1, i16* %arrayidx2, align 1 ret i16 0 }