Similar to 806761a762.
For IR files without a target triple, -mtriple= specifies the full
target triple while -march= merely sets the architecture part of the
default target triple, leaving a target triple which may not make sense,
e.g. amdgpu-apple-darwin.
Therefore, -march= is error-prone and not recommended for tests without
a target triple. The issue has been benign as we recognize
$unknown-apple-darwin as ELF instead of rejecting it outrightly.
This patch changes AMDGPU tests to not rely on the default
OS/environment components. Tests that need fixes are not changed:
```
LLVM :: CodeGen/AMDGPU/fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fabs.ll
LLVM :: CodeGen/AMDGPU/floor.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.ll
LLVM :: CodeGen/AMDGPU/r600-infinite-loop-bug-while-reorganizing-vector.ll
LLVM :: CodeGen/AMDGPU/schedule-if-2.ll
```
188 lines
3.5 KiB
YAML
188 lines
3.5 KiB
YAML
# RUN: llc -mtriple=amdgcn -mcpu=fiji -run-pass si-insert-waitcnts %s -o - | FileCheck %s
|
|
|
|
--- |
|
|
define amdgpu_kernel void @basic_insert_dcache_wb() {
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_kernel void @explicit_flush_after() {
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_kernel void @explicit_flush_before() {
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_kernel void @no_scalar_store() {
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_kernel void @multi_block_store() {
|
|
bb0:
|
|
br i1 undef, label %bb1, label %bb2
|
|
|
|
bb1:
|
|
ret void
|
|
|
|
bb2:
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_kernel void @one_block_store() {
|
|
bb0:
|
|
br i1 undef, label %bb1, label %bb2
|
|
|
|
bb1:
|
|
ret void
|
|
|
|
bb2:
|
|
ret void
|
|
}
|
|
|
|
define amdgpu_ps float @si_return() {
|
|
ret float undef
|
|
}
|
|
|
|
...
|
|
---
|
|
# CHECK-LABEL: name: basic_insert_dcache_wb
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
name: basic_insert_dcache_wb
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_STORE_DWORD_SGPR undef $sgpr2, undef $sgpr0_sgpr1, undef $m0, 0
|
|
S_ENDPGM 0
|
|
...
|
|
---
|
|
# Already has an explicitly requested flush after the last store.
|
|
# CHECK-LABEL: name: explicit_flush_after
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
name: explicit_flush_after
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_STORE_DWORD_SGPR undef $sgpr2, undef $sgpr0_sgpr1, undef $m0, 0
|
|
S_DCACHE_WB
|
|
S_ENDPGM 0
|
|
...
|
|
---
|
|
# Already has an explicitly requested flush before the last store.
|
|
# CHECK-LABEL: name: explicit_flush_before
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
name: explicit_flush_before
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_DCACHE_WB
|
|
S_STORE_DWORD_SGPR undef $sgpr2, undef $sgpr0_sgpr1, undef $m0, 0
|
|
S_ENDPGM 0
|
|
...
|
|
---
|
|
# CHECK-LABEL: no_scalar_store
|
|
# CHECK: bb.0
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
name: no_scalar_store
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_ENDPGM 0
|
|
...
|
|
|
|
# CHECK-LABEL: name: multi_block_store
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
# CHECK: bb.1:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
name: multi_block_store
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_STORE_DWORD_SGPR undef $sgpr2, undef $sgpr0_sgpr1, undef $m0, 0
|
|
S_ENDPGM 0
|
|
|
|
bb.1:
|
|
S_STORE_DWORD_SGPR undef $sgpr4, undef $sgpr6_sgpr7, undef $m0, 0
|
|
S_ENDPGM 0
|
|
...
|
|
...
|
|
|
|
# This one should be able to omit the flush in the storeless block but
|
|
# this isn't handled now.
|
|
|
|
# CHECK-LABEL: name: one_block_store
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
# CHECK: bb.1:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: S_ENDPGM 0
|
|
|
|
name: one_block_store
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_ENDPGM 0
|
|
|
|
bb.1:
|
|
S_STORE_DWORD_SGPR undef $sgpr4, undef $sgpr6_sgpr7, undef $m0, 0
|
|
S_ENDPGM 0
|
|
...
|
|
---
|
|
# CHECK-LABEL: name: si_return
|
|
# CHECK: bb.0:
|
|
# CHECK-NEXT: S_STORE_DWORD
|
|
# CHECK-NEXT: S_WAITCNT
|
|
# CHECK-NEXT: S_DCACHE_WB
|
|
# CHECK-NEXT: SI_RETURN
|
|
|
|
name: si_return
|
|
tracksRegLiveness: false
|
|
machineFunctionInfo:
|
|
isEntryFunction: true
|
|
|
|
body: |
|
|
bb.0:
|
|
S_STORE_DWORD_SGPR undef $sgpr2, undef $sgpr0_sgpr1, undef $m0, 0
|
|
SI_RETURN_TO_EPILOG undef $vgpr0
|
|
...
|