; LLVM IR test file (listing metadata: 32 lines, 1.1 KiB).
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -infer-address-spaces -o - %s | FileCheck %s

; Global in addrspace(4) whose value is a pointer in the default address
; space; the first test function loads that pointer and dereferences it.
@c0 = addrspace(4) global float* undef

; A pointer %p in the default address space is loaded from the addrspace(4)
; global @c0 and then dereferenced. The directives below expect the pass to
; cast %p to addrspace(1) and, on the very next line, to load the float
; through an addrspace(1) pointer.
; CHECK-LABEL: @generic_ptr_from_constant
; CHECK: addrspacecast float* %p to float addrspace(1)*
; CHECK-NEXT: load float, float addrspace(1)*
define float @generic_ptr_from_constant() {
  %p = load float*, float* addrspace(4)* @c0
  %v = load float, float* %p
  ret float %v
}

; Aggregate holding two default-address-space pointers; passed byref to the
; kernel in the second test.
%struct.S = type { i32*, float* }

; The kernel receives a %struct.S by reference in addrspace(4), loads both
; pointer fields (%p0, %p1), reads an i32 through %p0, converts it to float,
; and stores the result through %p1. The directives below expect both loaded
; pointers to be cast to addrspace(1), and the i32 load and the float store
; to go through addrspace(1) pointers.
; CHECK-LABEL: @generic_ptr_from_aggregate_argument
; CHECK: addrspacecast i32* %p0 to i32 addrspace(1)*
; CHECK: addrspacecast float* %p1 to float addrspace(1)*
; CHECK: load i32, i32 addrspace(1)*
; CHECK: store float %v1, float addrspace(1)*
; CHECK: ret
define amdgpu_kernel void @generic_ptr_from_aggregate_argument(%struct.S addrspace(4)* byref(%struct.S) align 8 %0) {
  ; Field 0: the i32* member.
  %f0 = getelementptr inbounds %struct.S, %struct.S addrspace(4)* %0, i64 0, i32 0
  %p0 = load i32*, i32* addrspace(4)* %f0
  ; Field 1: the float* member.
  %f1 = getelementptr inbounds %struct.S, %struct.S addrspace(4)* %0, i64 0, i32 1
  %p1 = load float*, float* addrspace(4)* %f1
  ; Read through the first pointer, convert, write through the second.
  %v0 = load i32, i32* %p0
  %v1 = sitofp i32 %v0 to float
  store float %v1, float* %p1
  ret void
}