ptxas is a proprietary compiler from Nvidia that compiles PTX to machine code (SASS). It has many diagnostics for catching errors in PTX, which can be used to verify the PTX output from llc. Set the -DPXTAS_EXECUTABLE=/path/to/ptxas CMake option to enable it. If this option is not set, ptxas is replaced with `true`, which effectively disables all ptxas RUN lines. The LLVM_PTXAS_EXECUTABLE environment variable takes precedence over the CMake option and allows overriding the ptxas executable used by LIT without a complete re-configuration. Differential Revision: https://reviews.llvm.org/D121727
15 lines
620 B
LLVM
15 lines
620 B
LLVM
; RUN: llc < %s -O0 -march=nvptx64 -mcpu=sm_20 | FileCheck %s
|
|
; RUN: %if ptxas %{ llc < %s -O0 -march=nvptx64 -mcpu=sm_20 | %ptxas-verify %}
|
|
|
|
; CHECK-LABEL: .visible .func (.param .align 16 .b8 func_retval0[32]) foo(
|
|
; Returns a { i128, i128 } aggregate built from the sign-extended arguments.
; The CHECK lines below expect the return value to be written to func_retval0
; as two st.param.v2.b64 stores, at byte offsets 0 and 16.
define { i128, i128 } @foo(i64 %a, i32 %b) {
  ; Widen both arguments to i128 with sign extension.
  %a.ext = sext i64 %a to i128
  %b.ext = sext i32 %b to i128

  ; Assemble the aggregate. The seed value is poison rather than the
  ; deprecated undef; both fields are overwritten before the value is used.
  %agg.lo = insertvalue { i128, i128 } poison, i128 %a.ext, 0
  %agg.full = insertvalue { i128, i128 } %agg.lo, i128 %b.ext, 1

; CHECK: st.param.v2.b64 [func_retval0+0], {%[[REG1:rd[0-9]+]], %[[REG2:rd[0-9]+]]};
; CHECK: st.param.v2.b64 [func_retval0+16], {%[[REG3:rd[0-9]+]], %[[REG4:rd[0-9]+]]};
  ret { i128, i128 } %agg.full
}
|