359 lines
13 KiB
LLVM
359 lines
13 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
|
; RUN: opt < %s -basic-aa -dse -S | FileCheck %s
|
|
|
|
target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
|
|
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind
|
|
|
|
define void @test13(i32* noalias %P) {
|
|
; CHECK-LABEL: @test13(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[FOR:%.*]]
|
|
; CHECK: for:
|
|
; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4
|
|
; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %for
|
|
for:
|
|
store i32 0, i32* %P
|
|
br i1 false, label %for, label %end
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
|
|
define void @test14(i32* noalias %P) {
|
|
; CHECK-LABEL: @test14(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[FOR:%.*]]
|
|
; CHECK: for:
|
|
; CHECK-NEXT: store i32 0, i32* [[P:%.*]], align 4
|
|
; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
store i32 1, i32* %P
|
|
br label %for
|
|
for:
|
|
store i32 0, i32* %P
|
|
br i1 false, label %for, label %end
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
define void @test18(i32* noalias %P) {
|
|
; CHECK-LABEL: @test18(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[P2:%.*]] = bitcast i32* [[P:%.*]] to i8*
|
|
; CHECK-NEXT: store i32 0, i32* [[P]], align 4
|
|
; CHECK-NEXT: br label [[FOR:%.*]]
|
|
; CHECK: for:
|
|
; CHECK-NEXT: store i8 1, i8* [[P2]], align 1
|
|
; CHECK-NEXT: [[X:%.*]] = load i32, i32* [[P]], align 4
|
|
; CHECK-NEXT: store i8 2, i8* [[P2]], align 1
|
|
; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
%P2 = bitcast i32* %P to i8*
|
|
store i32 0, i32* %P
|
|
br label %for
|
|
for:
|
|
store i8 1, i8* %P2
|
|
%x = load i32, i32* %P
|
|
store i8 2, i8* %P2
|
|
br i1 false, label %for, label %end
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
define void @test21(i32* noalias %P) {
|
|
; CHECK-LABEL: @test21(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[ARRAYIDX0:%.*]] = getelementptr inbounds i32, i32* [[P:%.*]], i64 1
|
|
; CHECK-NEXT: [[P3:%.*]] = bitcast i32* [[ARRAYIDX0]] to i8*
|
|
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds i8, i8* [[P3]], i64 4
|
|
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 4 [[TMP0]], i8 0, i64 24, i1 false)
|
|
; CHECK-NEXT: br label [[FOR:%.*]]
|
|
; CHECK: for:
|
|
; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[P]], i64 1
|
|
; CHECK-NEXT: store i32 1, i32* [[ARRAYIDX1]], align 4
|
|
; CHECK-NEXT: br i1 false, label [[FOR]], label [[END:%.*]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
%arrayidx0 = getelementptr inbounds i32, i32* %P, i64 1
|
|
%p3 = bitcast i32* %arrayidx0 to i8*
|
|
call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 28, i32 4, i1 false)
|
|
br label %for
|
|
for:
|
|
%arrayidx1 = getelementptr inbounds i32, i32* %P, i64 1
|
|
store i32 1, i32* %arrayidx1, align 4
|
|
br i1 false, label %for, label %end
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
define void @test_loop(i32 %N, i32* noalias nocapture readonly %A, i32* noalias nocapture readonly %x, i32* noalias nocapture %b) local_unnamed_addr {
|
|
; CHECK-LABEL: @test_loop(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CMP27:%.*]] = icmp sgt i32 [[N:%.*]], 0
|
|
; CHECK-NEXT: br i1 [[CMP27]], label [[FOR_BODY4_LR_PH_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]]
|
|
; CHECK: for.body4.lr.ph.preheader:
|
|
; CHECK-NEXT: br label [[FOR_BODY4_LR_PH:%.*]]
|
|
; CHECK: for.cond.cleanup:
|
|
; CHECK-NEXT: ret void
|
|
; CHECK: for.body4.lr.ph:
|
|
; CHECK-NEXT: [[I_028:%.*]] = phi i32 [ [[INC11:%.*]], [[FOR_COND_CLEANUP3:%.*]] ], [ 0, [[FOR_BODY4_LR_PH_PREHEADER]] ]
|
|
; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[B:%.*]], i32 [[I_028]]
|
|
; CHECK-NEXT: store i32 0, i32* [[ARRAYIDX]], align 4
|
|
; CHECK-NEXT: [[MUL:%.*]] = mul nsw i32 [[I_028]], [[N]]
|
|
; CHECK-NEXT: br label [[FOR_BODY4:%.*]]
|
|
; CHECK: for.body4:
|
|
; CHECK-NEXT: [[TMP0:%.*]] = phi i32 [ 0, [[FOR_BODY4_LR_PH]] ], [ [[ADD9:%.*]], [[FOR_BODY4]] ]
|
|
; CHECK-NEXT: [[J_026:%.*]] = phi i32 [ 0, [[FOR_BODY4_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY4]] ]
|
|
; CHECK-NEXT: [[ADD:%.*]] = add nsw i32 [[J_026]], [[MUL]]
|
|
; CHECK-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i32, i32* [[A:%.*]], i32 [[ADD]]
|
|
; CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4
|
|
; CHECK-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[X:%.*]], i32 [[J_026]]
|
|
; CHECK-NEXT: [[TMP2:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4
|
|
; CHECK-NEXT: [[MUL7:%.*]] = mul nsw i32 [[TMP2]], [[TMP1]]
|
|
; CHECK-NEXT: [[ADD9]] = add nsw i32 [[MUL7]], [[TMP0]]
|
|
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[J_026]], 1
|
|
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N]]
|
|
; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_COND_CLEANUP3]], label [[FOR_BODY4]]
|
|
; CHECK: for.cond.cleanup3:
|
|
; CHECK-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX]], align 4
|
|
; CHECK-NEXT: [[INC11]] = add nuw nsw i32 [[I_028]], 1
|
|
; CHECK-NEXT: [[EXITCOND29:%.*]] = icmp eq i32 [[INC11]], [[N]]
|
|
; CHECK-NEXT: br i1 [[EXITCOND29]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY4_LR_PH]]
|
|
;
|
|
entry:
|
|
%cmp27 = icmp sgt i32 %N, 0
|
|
br i1 %cmp27, label %for.body4.lr.ph.preheader, label %for.cond.cleanup
|
|
|
|
for.body4.lr.ph.preheader: ; preds = %entry
|
|
br label %for.body4.lr.ph
|
|
|
|
for.cond.cleanup: ; preds = %for.cond.cleanup3, %entry
|
|
ret void
|
|
|
|
for.body4.lr.ph: ; preds = %for.body4.lr.ph.preheader, %for.cond.cleanup3
|
|
%i.028 = phi i32 [ %inc11, %for.cond.cleanup3 ], [ 0, %for.body4.lr.ph.preheader ]
|
|
%arrayidx = getelementptr inbounds i32, i32* %b, i32 %i.028
|
|
store i32 0, i32* %arrayidx, align 4
|
|
%mul = mul nsw i32 %i.028, %N
|
|
br label %for.body4
|
|
|
|
for.body4: ; preds = %for.body4, %for.body4.lr.ph
|
|
%0 = phi i32 [ 0, %for.body4.lr.ph ], [ %add9, %for.body4 ]
|
|
%j.026 = phi i32 [ 0, %for.body4.lr.ph ], [ %inc, %for.body4 ]
|
|
%add = add nsw i32 %j.026, %mul
|
|
%arrayidx5 = getelementptr inbounds i32, i32* %A, i32 %add
|
|
%1 = load i32, i32* %arrayidx5, align 4
|
|
%arrayidx6 = getelementptr inbounds i32, i32* %x, i32 %j.026
|
|
%2 = load i32, i32* %arrayidx6, align 4
|
|
%mul7 = mul nsw i32 %2, %1
|
|
%add9 = add nsw i32 %mul7, %0
|
|
%inc = add nuw nsw i32 %j.026, 1
|
|
%exitcond = icmp eq i32 %inc, %N
|
|
br i1 %exitcond, label %for.cond.cleanup3, label %for.body4
|
|
|
|
for.cond.cleanup3: ; preds = %for.body4
|
|
store i32 %add9, i32* %arrayidx, align 4
|
|
%inc11 = add nuw nsw i32 %i.028, 1
|
|
%exitcond29 = icmp eq i32 %inc11, %N
|
|
br i1 %exitcond29, label %for.cond.cleanup, label %for.body4.lr.ph
|
|
}
|
|
|
|
declare i1 @cond() readnone
|
|
|
|
; TODO: We can eliminate the store in for.header, but we currently hit a MemoryPhi.
|
|
define void @loop_multiple_def_uses(i32* noalias %P) {
|
|
; CHECK-LABEL: @loop_multiple_def_uses(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[FOR_HEADER:%.*]]
|
|
; CHECK: for.header:
|
|
; CHECK-NEXT: store i32 1, i32* [[P:%.*]], align 4
|
|
; CHECK-NEXT: [[C1:%.*]] = call i1 @cond()
|
|
; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]]
|
|
; CHECK: for.body:
|
|
; CHECK-NEXT: store i32 2, i32* [[P]], align 4
|
|
; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4
|
|
; CHECK-NEXT: br label [[FOR_HEADER]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: store i32 3, i32* [[P]], align 4
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %for.header
|
|
|
|
for.header:
|
|
store i32 1, i32* %P, align 4
|
|
%c1 = call i1 @cond()
|
|
br i1 %c1, label %for.body, label %end
|
|
|
|
for.body:
|
|
store i32 2, i32* %P, align 4
|
|
%lv = load i32, i32* %P
|
|
br label %for.header
|
|
|
|
end:
|
|
store i32 3, i32* %P, align 4
|
|
ret void
|
|
}
|
|
|
|
; We cannot eliminate the store in for.header, as it is only partially
|
|
; overwritten in for.body and read afterwards.
|
|
define void @loop_multiple_def_uses_partial_write(i32* noalias %p) {
|
|
; CHECK-LABEL: @loop_multiple_def_uses_partial_write(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[FOR_HEADER:%.*]]
|
|
; CHECK: for.header:
|
|
; CHECK-NEXT: store i32 1239491, i32* [[P:%.*]], align 4
|
|
; CHECK-NEXT: [[C1:%.*]] = call i1 @cond()
|
|
; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]]
|
|
; CHECK: for.body:
|
|
; CHECK-NEXT: [[C:%.*]] = bitcast i32* [[P]] to i8*
|
|
; CHECK-NEXT: store i8 1, i8* [[C]], align 4
|
|
; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4
|
|
; CHECK-NEXT: br label [[FOR_HEADER]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: store i32 3, i32* [[P]], align 4
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %for.header
|
|
|
|
for.header:
|
|
store i32 1239491, i32* %p, align 4
|
|
%c1 = call i1 @cond()
|
|
br i1 %c1, label %for.body, label %end
|
|
|
|
for.body:
|
|
%c = bitcast i32* %p to i8*
|
|
store i8 1, i8* %c, align 4
|
|
%lv = load i32, i32* %p
|
|
br label %for.header
|
|
|
|
end:
|
|
store i32 3, i32* %p, align 4
|
|
ret void
|
|
}
|
|
|
|
; We cannot eliminate the store in for.header, as the location is not overwritten
|
|
; in for.body and read afterwards.
|
|
define void @loop_multiple_def_uses_mayalias_write(i32* %p, i32* %q) {
|
|
; CHECK-LABEL: @loop_multiple_def_uses_mayalias_write(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[FOR_HEADER:%.*]]
|
|
; CHECK: for.header:
|
|
; CHECK-NEXT: store i32 1239491, i32* [[P:%.*]], align 4
|
|
; CHECK-NEXT: [[C1:%.*]] = call i1 @cond()
|
|
; CHECK-NEXT: br i1 [[C1]], label [[FOR_BODY:%.*]], label [[END:%.*]]
|
|
; CHECK: for.body:
|
|
; CHECK-NEXT: store i32 1, i32* [[Q:%.*]], align 4
|
|
; CHECK-NEXT: [[LV:%.*]] = load i32, i32* [[P]], align 4
|
|
; CHECK-NEXT: br label [[FOR_HEADER]]
|
|
; CHECK: end:
|
|
; CHECK-NEXT: store i32 3, i32* [[P]], align 4
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %for.header
|
|
|
|
for.header:
|
|
store i32 1239491, i32* %p, align 4
|
|
%c1 = call i1 @cond()
|
|
br i1 %c1, label %for.body, label %end
|
|
|
|
for.body:
|
|
store i32 1, i32* %q, align 4
|
|
%lv = load i32, i32* %p
|
|
br label %for.header
|
|
|
|
end:
|
|
store i32 3, i32* %p, align 4
|
|
ret void
|
|
}
|
|
|
|
%struct.hoge = type { i32, i32 }
|
|
|
|
@global = external local_unnamed_addr global %struct.hoge*, align 8
|
|
|
|
define void @widget(i8* %tmp) {
|
|
; CHECK-LABEL: @widget(
|
|
; CHECK-NEXT: bb:
|
|
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 [[TMP:%.*]], i8* nonnull align 16 undef, i64 64, i1 false)
|
|
; CHECK-NEXT: br label [[BB1:%.*]]
|
|
; CHECK: bb1:
|
|
; CHECK-NEXT: [[TMP2:%.*]] = load %struct.hoge*, %struct.hoge** @global, align 8
|
|
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[STRUCT_HOGE:%.*]], %struct.hoge* [[TMP2]], i64 undef, i32 1
|
|
; CHECK-NEXT: store i32 0, i32* [[TMP3]], align 4
|
|
; CHECK-NEXT: [[TMP4:%.*]] = load %struct.hoge*, %struct.hoge** @global, align 8
|
|
; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds [[STRUCT_HOGE]], %struct.hoge* [[TMP4]], i64 undef, i32 1
|
|
; CHECK-NEXT: store i32 10, i32* [[TMP5]], align 4
|
|
; CHECK-NEXT: br label [[BB1]]
|
|
;
|
|
bb:
|
|
call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %tmp, i8* nonnull align 16 undef, i64 64, i1 false)
|
|
br label %bb1
|
|
|
|
bb1: ; preds = %bb1, %bb
|
|
%tmp2 = load %struct.hoge*, %struct.hoge** @global, align 8
|
|
%tmp3 = getelementptr inbounds %struct.hoge, %struct.hoge* %tmp2, i64 undef, i32 1
|
|
store i32 0, i32* %tmp3, align 4
|
|
%tmp4 = load %struct.hoge*, %struct.hoge** @global, align 8
|
|
%tmp5 = getelementptr inbounds %struct.hoge, %struct.hoge* %tmp4, i64 undef, i32 1
|
|
store i32 10, i32* %tmp5, align 4
|
|
br label %bb1
|
|
}
|
|
|
|
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* noalias nocapture writeonly, i8* noalias nocapture readonly, i64, i1 immarg)
|
|
|
|
@x = global [10 x i16] zeroinitializer, align 1
|
|
|
|
; Make sure we do not eliminate the store in %do.body, because it writes to
|
|
; multiple locations in the loop and the store in %if.end10 only stores to
|
|
; the last one.
|
|
define i16 @test_loop_carried_dep() {
|
|
; CHECK-LABEL: @test_loop_carried_dep(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[DO_BODY:%.*]]
|
|
; CHECK: do.body:
|
|
; CHECK-NEXT: [[I_0:%.*]] = phi i16 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[IF_END:%.*]] ]
|
|
; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [10 x i16], [10 x i16]* @x, i16 0, i16 [[I_0]]
|
|
; CHECK-NEXT: store i16 2, i16* [[ARRAYIDX2]], align 1
|
|
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i16 [[I_0]], 4
|
|
; CHECK-NEXT: br i1 [[EXITCOND]], label [[IF_END10:%.*]], label [[IF_END]]
|
|
; CHECK: if.end:
|
|
; CHECK-NEXT: [[INC]] = add nuw nsw i16 [[I_0]], 1
|
|
; CHECK-NEXT: br label [[DO_BODY]]
|
|
; CHECK: if.end10:
|
|
; CHECK-NEXT: store i16 1, i16* [[ARRAYIDX2]], align 1
|
|
; CHECK-NEXT: ret i16 0
|
|
;
|
|
entry:
|
|
br label %do.body
|
|
|
|
do.body: ; preds = %if.end, %entry
|
|
%i.0 = phi i16 [ 0, %entry ], [ %inc, %if.end ]
|
|
%arrayidx2 = getelementptr inbounds [10 x i16], [10 x i16]* @x, i16 0, i16 %i.0
|
|
store i16 2, i16* %arrayidx2, align 1
|
|
%exitcond = icmp eq i16 %i.0, 4
|
|
br i1 %exitcond, label %if.end10, label %if.end
|
|
|
|
if.end: ; preds = %do.body
|
|
%inc = add nuw nsw i16 %i.0, 1
|
|
br label %do.body
|
|
|
|
if.end10: ; preds = %do.body
|
|
store i16 1, i16* %arrayidx2, align 1
|
|
ret i16 0
|
|
}
|