; llvm-for-llvmta/test/CodeGen/Hexagon/tc_sched.ll

; 83 lines
; 2.5 KiB
; LLVM

; RUN: llc -march=hexagon -mcpu=hexagonv67t < %s | FileCheck %s
; A simple test case for the tiny core instruction latency information.
; @test: loads four consecutive i32 values starting at %p and returns
; (p[1] + p[0]) * (p[3] + p[2]).
;
; The FileCheck directives below expect two memw loads from the same base
; register at offsets +#0 and +#4 (matched in either order), with a closing
; brace on the very next output line. After that, two further opening braces
; must appear, and the line directly after the second one must be an add of
; the two loaded registers.
; NOTE(review): presumably this verifies that the add is kept out of the packet
; right after the loads because of the tiny core load latency -- confirm
; against the Hexagon v67t scheduling model.
; CHECK-LABEL: test
; CHECK-DAG: [[REG1:r([0-9]+)]] = memw([[REG0:r[0-9]+]]+#0)
; CHECK-DAG: [[REG2:r([0-9]+)]] = memw([[REG0]]+#4)
; CHECK-NEXT: }
; CHECK: {
; CHECK: {
; CHECK-NEXT: = add([[REG2]],[[REG1]])
define i32 @test(i32* nocapture readonly %p) local_unnamed_addr #0 {
entry:
; Address of p[1].
%incdec.ptr = getelementptr inbounds i32, i32* %p, i32 1
; %0 = p[0]
%0 = load i32, i32* %p, align 4
; Address of p[2].
%incdec.ptr1 = getelementptr inbounds i32, i32* %p, i32 2
; %1 = p[1]
%1 = load i32, i32* %incdec.ptr, align 4
; Address of p[3].
%incdec.ptr2 = getelementptr inbounds i32, i32* %p, i32 3
; %2 = p[2]
%2 = load i32, i32* %incdec.ptr1, align 4
; %3 = p[3]
%3 = load i32, i32* %incdec.ptr2, align 4
; This sum of p[1] and p[0] is the add that the directives above look for
; (offsets +#0 and +#4 from the base register).
%add = add nsw i32 %1, %0
; Sum of p[3] and p[2].
%add4 = add nsw i32 %3, %2
; The product of the two sums is the return value.
%mul = mul nsw i32 %add4, %add
ret i32 %mul
}
; @test1: loads four consecutive i32 values starting at %p and returns
; ((p[1] + p[0]) - p[2]) - p[3].
;
; The FileCheck directives below expect the same load pattern as in @test
; (two memw loads from one base register at +#0 and +#4, then a closing brace
; on the next line), later an add of the two loaded registers as the first
; line after an opening brace, and its result captured as REG7. After a
; subsequent closing brace, the next line must be an opening brace and the
; line after that a sub whose first operand is REG7.
; NOTE(review): presumably this checks that the dependent sub is issued in the
; packet immediately following the add -- confirm against the scheduling model.
; CHECK-LABEL: test1
; CHECK-DAG: [[REG4:r([0-9]+)]] = memw([[REG3:r[0-9]+]]+#0)
; CHECK-DAG: [[REG5:r([0-9]+)]] = memw([[REG3]]+#4)
; CHECK-NEXT: }
; CHECK: {
; CHECK: {
; CHECK-NEXT: [[REG7:r([0-9]+)]] = add([[REG5]],[[REG4]])
; CHECK: }
; CHECK-NEXT: {
; CHECK-NEXT: = sub([[REG7]]
define i32 @test1(i32* nocapture readonly %p) local_unnamed_addr #0 {
entry:
; Address of p[1].
%incdec.ptr = getelementptr inbounds i32, i32* %p, i32 1
; %0 = p[0]
%0 = load i32, i32* %p, align 4
; Address of p[2].
%incdec.ptr1 = getelementptr inbounds i32, i32* %p, i32 2
; %1 = p[1]
%1 = load i32, i32* %incdec.ptr, align 4
; Address of p[3].
%incdec.ptr2 = getelementptr inbounds i32, i32* %p, i32 3
; %2 = p[2]
%2 = load i32, i32* %incdec.ptr1, align 4
; %3 = p[3]
%3 = load i32, i32* %incdec.ptr2, align 4
; p[1] + p[0]; note that no nsw flag is present on the arithmetic in this
; function, unlike in @test.
%add4.neg = add i32 %1, %0
; Despite its name, %add is the result of a subtraction: (p[1] + p[0]) - p[2].
%add = sub i32 %add4.neg, %2
; Final result: ((p[1] + p[0]) - p[2]) - p[3].
%sub = sub i32 %add, %3
ret i32 %sub
}
; Test that multiplies are not placed in the same packet.
;
; @test2: loads four consecutive i32 values starting at %p, forms four
; products from them, and tail-calls @foo with those products, returning
; whatever @foo returns.
;
; The FileCheck directives below require a closing brace to appear between
; each pair of successive mpyi instructions in the output.
; This function uses attribute group #1 and the call site uses #3; neither
; group definition is visible in this part of the file.
; CHECK-LABEL: test2
; CHECK: = mpyi
; CHECK: }
; CHECK: = mpyi
; CHECK: }
; CHECK: = mpyi
; CHECK: }
; CHECK: = mpyi
define i32 @test2(i32* nocapture readonly %p) local_unnamed_addr #1 {
entry:
; Address of p[1].
%incdec.ptr = getelementptr inbounds i32, i32* %p, i32 1
; %0 = p[0]
%0 = load i32, i32* %p, align 4
; Address of p[2].
%incdec.ptr1 = getelementptr inbounds i32, i32* %p, i32 2
; %1 = p[1]
%1 = load i32, i32* %incdec.ptr, align 4
; Address of p[3].
%incdec.ptr2 = getelementptr inbounds i32, i32* %p, i32 3
; %2 = p[2]
%2 = load i32, i32* %incdec.ptr1, align 4
; %3 = p[3]
%3 = load i32, i32* %incdec.ptr2, align 4
; Four multiplies: p[1]*p[0], p[3]*p[2], p[3]*p[0], p[2]*p[1]. No product
; is an operand of another multiply.
%mul = mul nsw i32 %1, %0
%mul4 = mul nsw i32 %3, %2
%mul5 = mul nsw i32 %3, %0
%mul6 = mul nsw i32 %2, %1
; All four products are passed to @foo, so each one is used.
%call = tail call i32 @foo(i32 %mul, i32 %mul4, i32 %mul5, i32 %mul6) #3
ret i32 %call
}
; External function taking four i32 arguments and returning i32. It is only
; declared here (no body); @test2 tail-calls it with its four products.
; The definition of attribute group #2 is not visible in this part of the file.
declare i32 @foo(i32, i32, i32, i32) local_unnamed_addr #2