245 lines
5.5 KiB
LLVM
245 lines
5.5 KiB
LLVM
; RUN: llc -march=r600 -mcpu=redwood -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG64 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=sumo -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG64 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=barts -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG64 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=turks -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG64 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=caicos -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG64 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=cedar -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=BUG32 %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=juniper -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=NOBUG %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=cypress -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=NOBUG %s < %t
|
|
|
|
; RUN: llc -march=r600 -mcpu=cayman -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
|
|
; RUN: FileCheck --check-prefix=NOBUG %s < %t
|
|
|
|
; REQUIRES: asserts
|
|
|
|
; We are currently allocating 2 extra sub-entries on Evergreen / NI for
; non-WQM push instructions. If we change this to 1, then we will need to
; add one level of depth to each of these tests.
|
|
|
|
; @nested3 - three levels of nested conditional branches on %cond.
; Level N compares %cond against a threshold (0, 10, 20) and either descends
; to the next level or stores its depth number to %out and jumps to %end.
; At this depth none of the three debug-output prefixes expects the
; work-around message.
; BUG64-NOT: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested3:
define amdgpu_kernel void @nested3(i32 addrspace(1)* %out, i32 %cond) {
entry:
  %cond.gt.0 = icmp sgt i32 %cond, 0
  br i1 %cond.gt.0, label %if.1, label %end

if.1:
  %cond.gt.10 = icmp sgt i32 %cond, 10
  br i1 %cond.gt.10, label %if.2, label %if.1.store

; Label follows the if.N.store naming used by the other levels and tests.
if.1.store:
  store i32 1, i32 addrspace(1)* %out
  br label %end

if.2:
  %cond.gt.20 = icmp sgt i32 %cond, 20
  br i1 %cond.gt.20, label %if.3, label %if.2.store

if.2.store:
  store i32 2, i32 addrspace(1)* %out
  br label %end

; Innermost level: no further compare, just record depth 3.
if.3:
  store i32 3, i32 addrspace(1)* %out
  br label %end

end:
  ret void
}
|
|
|
|
; @nested4 - four levels of nested conditional branches on %cond.
; Level N compares %cond against a threshold (0, 10, 20, 30) and either
; descends to the next level or stores its depth number to %out and jumps to
; %end. The directives below expect the work-around message under the BUG64
; prefix only.
; BUG64: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested4:
define amdgpu_kernel void @nested4(i32 addrspace(1)* %out, i32 %cond) {
entry:
  %cond.gt.0 = icmp sgt i32 %cond, 0
  br i1 %cond.gt.0, label %if.1, label %end

if.1:
  %cond.gt.10 = icmp sgt i32 %cond, 10
  br i1 %cond.gt.10, label %if.2, label %if.1.store

if.1.store:
  store i32 1, i32 addrspace(1)* %out
  br label %end

if.2:
  %cond.gt.20 = icmp sgt i32 %cond, 20
  br i1 %cond.gt.20, label %if.3, label %if.2.store

if.2.store:
  store i32 2, i32 addrspace(1)* %out
  br label %end

if.3:
  %cond.gt.30 = icmp sgt i32 %cond, 30
  br i1 %cond.gt.30, label %if.4, label %if.3.store

if.3.store:
  store i32 3, i32 addrspace(1)* %out
  br label %end

; Innermost level: no further compare, just record depth 4.
if.4:
  store i32 4, i32 addrspace(1)* %out
  br label %end

end:
  ret void
}
|
|
|
|
; @nested7 - seven levels of nested conditional branches on %cond.
; Level N compares %cond against a threshold (0, 10, ..., 60) and either
; descends to the next level or stores its depth number to %out and jumps to
; %end. The directives below expect the work-around message under the BUG64
; prefix only.
; BUG64: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested7:
define amdgpu_kernel void @nested7(i32 addrspace(1)* %out, i32 %cond) {
entry:
  %cond.gt.0 = icmp sgt i32 %cond, 0
  br i1 %cond.gt.0, label %if.1, label %end

if.1:
  %cond.gt.10 = icmp sgt i32 %cond, 10
  br i1 %cond.gt.10, label %if.2, label %if.1.store

if.1.store:
  store i32 1, i32 addrspace(1)* %out
  br label %end

if.2:
  %cond.gt.20 = icmp sgt i32 %cond, 20
  br i1 %cond.gt.20, label %if.3, label %if.2.store

if.2.store:
  store i32 2, i32 addrspace(1)* %out
  br label %end

if.3:
  %cond.gt.30 = icmp sgt i32 %cond, 30
  br i1 %cond.gt.30, label %if.4, label %if.3.store

if.3.store:
  store i32 3, i32 addrspace(1)* %out
  br label %end

if.4:
  %cond.gt.40 = icmp sgt i32 %cond, 40
  br i1 %cond.gt.40, label %if.5, label %if.4.store

if.4.store:
  store i32 4, i32 addrspace(1)* %out
  br label %end

if.5:
  %cond.gt.50 = icmp sgt i32 %cond, 50
  br i1 %cond.gt.50, label %if.6, label %if.5.store

if.5.store:
  store i32 5, i32 addrspace(1)* %out
  br label %end

if.6:
  %cond.gt.60 = icmp sgt i32 %cond, 60
  br i1 %cond.gt.60, label %if.7, label %if.6.store

if.6.store:
  store i32 6, i32 addrspace(1)* %out
  br label %end

; Innermost level: no further compare, just record depth 7.
if.7:
  store i32 7, i32 addrspace(1)* %out
  br label %end

end:
  ret void
}
|
|
|
|
; @nested8 - eight levels of nested conditional branches on %cond.
; Level N compares %cond against a threshold (0, 10, ..., 70) and either
; descends to the next level or stores its depth number to %out and jumps to
; %end. The directives below expect the work-around message under both the
; BUG64 and BUG32 prefixes, and not under NOBUG.
; BUG64: Applying bug work-around
; BUG32: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested8:
define amdgpu_kernel void @nested8(i32 addrspace(1)* %out, i32 %cond) {
entry:
  %cond.gt.0 = icmp sgt i32 %cond, 0
  br i1 %cond.gt.0, label %if.1, label %end

if.1:
  %cond.gt.10 = icmp sgt i32 %cond, 10
  br i1 %cond.gt.10, label %if.2, label %if.1.store

if.1.store:
  store i32 1, i32 addrspace(1)* %out
  br label %end

if.2:
  %cond.gt.20 = icmp sgt i32 %cond, 20
  br i1 %cond.gt.20, label %if.3, label %if.2.store

if.2.store:
  store i32 2, i32 addrspace(1)* %out
  br label %end

if.3:
  %cond.gt.30 = icmp sgt i32 %cond, 30
  br i1 %cond.gt.30, label %if.4, label %if.3.store

if.3.store:
  store i32 3, i32 addrspace(1)* %out
  br label %end

if.4:
  %cond.gt.40 = icmp sgt i32 %cond, 40
  br i1 %cond.gt.40, label %if.5, label %if.4.store

if.4.store:
  store i32 4, i32 addrspace(1)* %out
  br label %end

if.5:
  %cond.gt.50 = icmp sgt i32 %cond, 50
  br i1 %cond.gt.50, label %if.6, label %if.5.store

if.5.store:
  store i32 5, i32 addrspace(1)* %out
  br label %end

if.6:
  %cond.gt.60 = icmp sgt i32 %cond, 60
  br i1 %cond.gt.60, label %if.7, label %if.6.store

if.6.store:
  store i32 6, i32 addrspace(1)* %out
  br label %end

if.7:
  %cond.gt.70 = icmp sgt i32 %cond, 70
  br i1 %cond.gt.70, label %if.8, label %if.7.store

if.7.store:
  store i32 7, i32 addrspace(1)* %out
  br label %end

; Innermost level: no further compare, just record depth 8.
if.8:
  store i32 8, i32 addrspace(1)* %out
  br label %end

end:
  ret void
}
|