24 lines
1.2 KiB
LLVM
24 lines
1.2 KiB
LLVM
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx940 -amdgpu-kernarg-preload-count=1 -asm-verbose=0 < %s | FileCheck -check-prefixes=GCN,HSA,ASM %s
|
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx940 -amdgpu-kernarg-preload-count=1 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx940 --disassemble - | FileCheck -check-prefixes=GCN,HSA,OBJ %s
|
|
; RUN: llc -mtriple=amdgcn -mcpu=gfx940 -amdgpu-kernarg-preload-count=1 -filetype=obj < %s | llvm-objdump --arch=amdgcn --mcpu=gfx940 --disassemble - | FileCheck -check-prefixes=GCN,NON-HSA,OBJ %s
|
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx940 -amdgpu-kernarg-preload-count=1 -asm-verbose=0 < %s | llvm-mc -triple amdgcn-amd-amdhsa -mcpu=gfx940 -filetype=obj | llvm-objdump --arch=amdgcn --mcpu=gfx940 --disassemble - | FileCheck -check-prefixes=GCN,HSA,OBJ %s
|
|
|
|
; GCN: preload_kernarg_header
|
|
; HSA: s_trap 2
|
|
; NON-HSA: s_endpgm
|
|
; ASM: .fill 63, 4, 0xbf800000 ; s_nop 0
|
|
; OBJ-COUNT-63: s_nop 0
|
|
define amdgpu_kernel void @preload_kernarg_header(ptr %arg) {
|
|
store ptr %arg, ptr %arg
|
|
ret void
|
|
}
|
|
|
|
; GCN: non_kernel_function
|
|
; GCN-NOT: s_trap 2
|
|
; GCN-NOT: s_nop 0
|
|
; GCN: flat_store
|
|
define void @non_kernel_function(ptr %arg) {
|
|
store ptr %arg, ptr %arg
|
|
ret void
|
|
}
|