Similar to 806761a762.
For IR files without a target triple, -mtriple= specifies the full
target triple while -march= merely sets the architecture part of the
default target triple, leaving a target triple which may not make sense,
e.g. amdgpu-apple-darwin.
Therefore, -march= is error-prone and not recommended for tests without
a target triple. The issue has been benign as we recognize
$unknown-apple-darwin as ELF instead of rejecting it outright.
This patch changes AMDGPU tests to not rely on the default
OS/environment components. Tests that would need further fixes are left unchanged:
```
LLVM :: CodeGen/AMDGPU/fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fabs.ll
LLVM :: CodeGen/AMDGPU/floor.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.ll
LLVM :: CodeGen/AMDGPU/r600-infinite-loop-bug-while-reorganizing-vector.ll
LLVM :: CodeGen/AMDGPU/schedule-if-2.ll
```
51 lines
2.4 KiB
LLVM
51 lines
2.4 KiB
LLVM
; Exercises amdgpu-remove-incompatible-functions with the module built for
; wave64 (-mattr=+wavefrontsize64) while one function asks for
; +wavefrontsize32. On gfx906 and gfx90a the function is expected to be
; removed and a remark emitted; on gfx1011 and gfx1100 it is expected to stay.
; Every subtarget is run twice: once stopping right after the pass so the IR
; can be inspected, and once through the full backend with the machine
; verifier enabled. For gfx1011/gfx1100 stderr is captured in %t but not
; checked.

; RUN: llc -mtriple=amdgcn -mcpu=gfx906 -mattr=+wavefrontsize64 -stop-after=amdgpu-remove-incompatible-functions\
; RUN:   -pass-remarks=amdgpu-remove-incompatible-functions < %s 2>%t | FileCheck -check-prefixes=GFX906 %s
; RUN: FileCheck --check-prefix=WARN-GFX906 %s < %t
; RUN: llc -mtriple=amdgcn -mcpu=gfx906 -mattr=+wavefrontsize64 -verify-machineinstrs < %s

; RUN: llc -mtriple=amdgcn -mcpu=gfx90a -mattr=+wavefrontsize64 -stop-after=amdgpu-remove-incompatible-functions\
; RUN:   -pass-remarks=amdgpu-remove-incompatible-functions < %s 2>%t | FileCheck -check-prefixes=GFX90A %s
; RUN: FileCheck --check-prefix=WARN-GFX90A %s < %t
; RUN: llc -mtriple=amdgcn -mcpu=gfx90a -mattr=+wavefrontsize64 -verify-machineinstrs < %s

; RUN: llc -mtriple=amdgcn -mcpu=gfx1011 -mattr=+wavefrontsize64 -stop-after=amdgpu-remove-incompatible-functions\
; RUN:   -pass-remarks=amdgpu-remove-incompatible-functions < %s 2>%t | FileCheck -check-prefixes=GFX10 %s
; RUN: llc -mtriple=amdgcn -mcpu=gfx1011 -mattr=+wavefrontsize64 -verify-machineinstrs < %s

; RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=+wavefrontsize64 -stop-after=amdgpu-remove-incompatible-functions\
; RUN:   -pass-remarks=amdgpu-remove-incompatible-functions < %s 2>%t | FileCheck -check-prefixes=GFX11 %s
; RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=+wavefrontsize64 -verify-machineinstrs < %s

; Exactly one removal remark is expected per wave64-only subtarget.
; WARN-GFX906: removing function 'needs_wavefrontsize32': +wavefrontsize32 is not supported on the current target
; WARN-GFX906-NOT: not supported

; WARN-GFX90A: removing function 'needs_wavefrontsize32': +wavefrontsize32 is not supported on the current target
; WARN-GFX90A-NOT: not supported

; Carries attribute group #0 (+wavefrontsize32). The checks expect this
; definition to be absent from the gfx906/gfx90a output and present in the
; gfx1011/gfx1100 output.
define void @needs_wavefrontsize32(ptr %out) #0 {
; GFX906-NOT: @needs_wavefrontsize32
; GFX90A-NOT: @needs_wavefrontsize32
; GFX10: define void @needs_wavefrontsize32(
; GFX11: define void @needs_wavefrontsize32(
  ; Read the register named by !0, count its set bits, and store the count
  ; through %out.
  %1 = tail call i32 @llvm.read_register.i32(metadata !0)
  %2 = tail call i32 @llvm.ctpop.i32(i32 %1)
  store i32 %2, ptr %out, align 4
  ret void
}

; Direct caller of @needs_wavefrontsize32. For the subtargets where the callee
; is removed, the checks expect the call target to have become null; otherwise
; the original call must survive.
define void @caller(ptr %out) {
; GFX906: call void null(
; GFX90A: call void null(
; GFX10: call void @needs_wavefrontsize32(
; GFX11: call void @needs_wavefrontsize32(
  call void @needs_wavefrontsize32(ptr %out)
  ret void
}

; Intrinsics called from @needs_wavefrontsize32.
declare i32 @llvm.read_register.i32(metadata)
declare i32 @llvm.ctpop.i32(i32)

; Register name handed to llvm.read_register.
!0 = !{!"exec_lo"}

; Feature string attached to @needs_wavefrontsize32.
attributes #0 = { "target-features"="+wavefrontsize32" }