ptxas is a proprietary compiler from Nvidia that compiles PTX to machine code (SASS). It has extensive diagnostics for catching errors in PTX, which can be used to verify the PTX output of llc. Set the -DPTXAS_EXECUTABLE=/path/to/ptxas CMake option to enable it. If this option is not set, ptxas is substituted with `true`, which effectively disables all ptxas RUN lines. The LLVM_PTXAS_EXECUTABLE environment variable takes precedence over the CMake option and allows overriding the ptxas executable used by LIT without a complete re-configuration. Differential Revision: https://reviews.llvm.org/D121727
20 lines
765 B
LLVM
20 lines
765 B
LLVM
; RUN: llc < %s -march=nvptx -mcpu=sm_20 %if ptxas %{ | %ptxas-verify %}
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 %if ptxas %{ | %ptxas-verify %}

; This test makes sure that the results of vector compares are properly
; scalarized. If codegen fails, then the type legalizer incorrectly
; tried to promote <2 x i1> to <2 x i8> and instruction selection failed.

; foo: loads two <2 x i32> vectors from %a and %b, compares them lane-wise
; with a signed less-than, and stores each lane's i1 result, zero-extended to
; i32, through %r1 (lane 0) and %r2 (lane 1).
define void @foo(<2 x i32>* %a, <2 x i32>* %b, i32* %r1, i32* %r2) {
  %aval = load <2 x i32>, <2 x i32>* %a
  %bval = load <2 x i32>, <2 x i32>* %b

  ; Vector compare: the result type is <2 x i1>.
  %res = icmp slt <2 x i32> %aval, %bval

  ; Extract each i1 lane individually, then widen it to i32 for the store.
  %t1 = extractelement <2 x i1> %res, i32 0
  %t2 = extractelement <2 x i1> %res, i32 1
  %t1a = zext i1 %t1 to i32
  %t2a = zext i1 %t2 to i32

  store i32 %t1a, i32* %r1
  store i32 %t2a, i32* %r2
  ret void
}