; Source path: llvm-for-llvmta/test/CodeGen/ARM/t2-shrink-ldrpost.ll
; (File-viewer residue from extraction: 77 lines, 2.7 KiB, LLVM.)

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s | FileCheck %s
target datalayout = "e-m:e-p:32:32-i1:8:32-i8:8:32-i16:16:32-f64:32:64-v64:32:64-v128:32:128-a:0:32-n32-S32"
target triple = "thumbv7m--linux-gnu"
; NOTE: When optimising for minimum size, an LDM is expected to be generated
; @f: when %n is greater than zero, runs %n loop iterations; each iteration
; loads one i32 through the read cursor (initially %b), adds 3, and stores the
; sum through the write cursor (initially %a), then advances both cursors by
; one i32 element. When %n is zero or negative the loop body never executes.
; The function carries both the optsize and minsize attributes, and the
; autogenerated assertions below expect the load and store to be emitted in
; the writeback forms "ldm r2!, {r3}" and "stm r1!, {r3}".
define void @f(i32 %n, i32* nocapture %a, i32* nocapture readonly %b) optsize minsize {
; CHECK-LABEL: f:
; CHECK: @ %bb.0:
; CHECK-NEXT: cmp r0, #1
; CHECK-NEXT: blt .LBB0_2
; CHECK-NEXT: .LBB0_1: @ %.lr.ph
; CHECK-NEXT: @ =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldm r2!, {r3}
; CHECK-NEXT: adds r3, #3
; CHECK-NEXT: stm r1!, {r3}
; CHECK-NEXT: subs r0, #1
; CHECK-NEXT: bne .LBB0_1
; CHECK-NEXT: .LBB0_2: @ %._crit_edge
; CHECK-NEXT: bx lr
; Entry block: signed test for n > 0; skip straight to the exit block otherwise.
%1 = icmp sgt i32 %n, 0
br i1 %1, label %.lr.ph, label %._crit_edge
.lr.ph: ; preds = %.lr.ph, %0
; Loop-carried values: iteration counter (starts at 0), read cursor (starts at
; %b) and write cursor (starts at %a).
%i.04 = phi i32 [ %6, %.lr.ph ], [ 0, %0 ]
%.03 = phi i32* [ %2, %.lr.ph ], [ %b, %0 ]
%.012 = phi i32* [ %5, %.lr.ph ], [ %a, %0 ]
; The next read cursor is computed before the load, but the load still uses
; the current cursor %.03.
%2 = getelementptr inbounds i32, i32* %.03, i32 1
%3 = load i32, i32* %.03, align 4
%4 = add nsw i32 %3, 3
; Same pattern on the store side: %5 is the next write cursor, while the store
; goes through the current cursor %.012.
%5 = getelementptr inbounds i32, i32* %.012, i32 1
store i32 %4, i32* %.012, align 4
; Bump the counter and leave the loop once it equals %n.
%6 = add nsw i32 %i.04, 1
%exitcond = icmp eq i32 %6, %n
br i1 %exitcond, label %._crit_edge, label %.lr.ph
._crit_edge: ; preds = %.lr.ph, %0
ret void
}
; NOTE: When not optimising for minimum size, an LDM is expected not to be generated
; @f_nominsize: same loop as the minsize variant of this test, but the function
; carries only the optsize attribute. When %n is greater than zero it runs %n
; iterations, each loading one i32 through the read cursor (initially %b),
; adding 3, storing the sum through the write cursor (initially %a), and
; advancing both cursors by one i32 element. When %n is zero or negative the
; loop body never executes.
; The autogenerated assertions below expect post-indexed "ldr r3, [r2], #4" and
; "str r3, [r1], #4" rather than ldm/stm, and a predicated early return
; ("it lt" / "bxlt lr") for the skip-the-loop case.
define void @f_nominsize(i32 %n, i32* nocapture %a, i32* nocapture readonly %b) optsize {
; CHECK-LABEL: f_nominsize:
; CHECK: @ %bb.0:
; CHECK-NEXT: cmp r0, #1
; CHECK-NEXT: it lt
; CHECK-NEXT: bxlt lr
; CHECK-NEXT: .LBB1_1: @ %.lr.ph
; CHECK-NEXT: @ =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr r3, [r2], #4
; CHECK-NEXT: subs r0, #1
; CHECK-NEXT: add.w r3, r3, #3
; CHECK-NEXT: str r3, [r1], #4
; CHECK-NEXT: bne .LBB1_1
; CHECK-NEXT: @ %bb.2: @ %._crit_edge
; CHECK-NEXT: bx lr
; Entry block: signed test for n > 0; skip straight to the exit block otherwise.
%1 = icmp sgt i32 %n, 0
br i1 %1, label %.lr.ph, label %._crit_edge
.lr.ph: ; preds = %.lr.ph, %0
; Loop-carried values: iteration counter (starts at 0), read cursor (starts at
; %b) and write cursor (starts at %a).
%i.04 = phi i32 [ %6, %.lr.ph ], [ 0, %0 ]
%.03 = phi i32* [ %2, %.lr.ph ], [ %b, %0 ]
%.012 = phi i32* [ %5, %.lr.ph ], [ %a, %0 ]
; The next read cursor is computed before the load, but the load still uses
; the current cursor %.03.
%2 = getelementptr inbounds i32, i32* %.03, i32 1
%3 = load i32, i32* %.03, align 4
%4 = add nsw i32 %3, 3
; Same pattern on the store side: %5 is the next write cursor, while the store
; goes through the current cursor %.012.
%5 = getelementptr inbounds i32, i32* %.012, i32 1
store i32 %4, i32* %.012, align 4
; Bump the counter and leave the loop once it equals %n.
%6 = add nsw i32 %i.04, 1
%exitcond = icmp eq i32 %6, %n
br i1 %exitcond, label %._crit_edge, label %.lr.ph
._crit_edge: ; preds = %.lr.ph, %0
ret void
}