By default clang emits complete contructors as alias of base constructors if they are the same. The backend is supposed to emit symbols for the alias, otherwise it causes undefined symbols. @yaxunl observed that this issue is related to the llvm options `-amdgpu-early-inline-all=true` and `-amdgpu-function-calls=false`. This issue is resolved by only inlining global values with internal linkage. The `getCalleeFunction()` in AMDGPUResourceUsageAnalysis also had to be extended to support aliases to functions. inline-calls.ll was corrected appropriately. Reviewed By: yaxunl, #amdgpu Differential Revision: https://reviews.llvm.org/D109707
34 lines
956 B
LLVM
34 lines
956 B
LLVM
; RUN: llc -mtriple amdgcn-unknown-linux-gnu -mcpu=tahiti -verify-machineinstrs < %s | FileCheck %s
|
|
; RUN: llc -mtriple amdgcn-unknown-linux-gnu -mcpu=tonga -verify-machineinstrs < %s | FileCheck %s
|
|
; RUN: llc -mtriple r600-unknown-linux-gnu -mcpu=redwood -verify-machineinstrs < %s | FileCheck %s --check-prefix=R600
|
|
|
|
; ALL-NOT: {{^}}func:
|
|
define internal i32 @func(i32 %a) {
|
|
entry:
|
|
%tmp0 = add i32 %a, 1
|
|
ret i32 %tmp0
|
|
}
|
|
|
|
; CHECK: {{^}}kernel:
|
|
; GCN-NOT: s_swappc_b64
|
|
define amdgpu_kernel void @kernel(i32 addrspace(1)* %out) {
|
|
entry:
|
|
%tmp0 = call i32 @func(i32 1)
|
|
store i32 %tmp0, i32 addrspace(1)* %out
|
|
ret void
|
|
}
|
|
|
|
; CHECK: func_alias
|
|
; R600-NOT: func_alias
|
|
@func_alias = alias i32 (i32), i32 (i32)* @func
|
|
|
|
; CHECK-NOT: {{^}}kernel3:
|
|
; GCN-NOT: s_swappc_b64
|
|
; R600: {{^}}kernel3:
|
|
define amdgpu_kernel void @kernel3(i32 addrspace(1)* %out) {
|
|
entry:
|
|
%tmp0 = call i32 @func_alias(i32 1)
|
|
store i32 %tmp0, i32 addrspace(1)* %out
|
|
ret void
|
|
}
|