Similar to 806761a762.
For IR files without a target triple, -mtriple= specifies the full
target triple while -march= merely sets the architecture part of the
default target triple, leaving a target triple which may not make sense,
e.g. amdgpu-apple-darwin.
Therefore, -march= is error-prone and not recommended for tests without
a target triple. The issue has been benign as we recognize
$unknown-apple-darwin as ELF instead of rejecting it outrightly.
This patch changes AMDGPU tests to not rely on the default
OS/environment components. Tests that need fixes are not changed:
```
LLVM :: CodeGen/AMDGPU/fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fabs.ll
LLVM :: CodeGen/AMDGPU/floor.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.f64.ll
LLVM :: CodeGen/AMDGPU/fneg-fabs.ll
LLVM :: CodeGen/AMDGPU/r600-infinite-loop-bug-while-reorganizing-vector.ll
LLVM :: CodeGen/AMDGPU/schedule-if-2.ll
```
70 lines
2.5 KiB
YAML
70 lines
2.5 KiB
YAML
# RUN: llc -mtriple=amdgcn -mcpu=gfx1010 -run-pass=si-fold-operands,dead-mi-elimination -verify-machineinstrs %s -o - | FileCheck -check-prefix=GCN %s
|
|
# RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -run-pass=si-fold-operands,dead-mi-elimination -verify-machineinstrs %s -o - | FileCheck -check-prefix=GCN %s
|
|
|
|
# GCN-LABEL: name: fold_vgpr_to_vgpr_copy
|
|
# GCN: %0:vreg_64 = IMPLICIT_DEF
|
|
# GCN-NEXT: %1:vgpr_32 = IMPLICIT_DEF
|
|
# GCN-NEXT: %2:vgpr_32 = IMPLICIT_DEF
|
|
# GCN-NEXT: DS_WRITE2_B32_gfx9 %0.sub0, killed %1, killed %2, 0, 1, 0, implicit $exec
|
|
|
|
---
|
|
name: fold_vgpr_to_vgpr_copy
|
|
body: |
|
|
bb.0:
|
|
|
|
%0:vreg_64 = IMPLICIT_DEF
|
|
%4:vgpr_32 = IMPLICIT_DEF
|
|
%3:vgpr_32 = IMPLICIT_DEF
|
|
%1:vgpr_32 = COPY %0.sub0
|
|
%2:vgpr_32 = COPY %1
|
|
DS_WRITE2_B32_gfx9 %2, killed %4, killed %3, 0, 1, 0, implicit $exec
|
|
...
|
|
|
|
# GCN-LABEL: name: fold_sgpr_to_vgpr_copy
|
|
# GCN: %0:sreg_64 = IMPLICIT_DEF
|
|
# GCN-NEXT: %1:vgpr_32 = IMPLICIT_DEF
|
|
# GCN-NEXT: %2:vgpr_32 = IMPLICIT_DEF
|
|
# GCN-NEXT: %4:vgpr_32 = COPY %0.sub0
|
|
# GCN-NEXT: DS_WRITE2_B32_gfx9 %4, killed %1, killed %2, 0, 1, 0, implicit $exec
|
|
name: fold_sgpr_to_vgpr_copy
|
|
body: |
|
|
bb.0:
|
|
|
|
%0:sreg_64 = IMPLICIT_DEF
|
|
%4:vgpr_32 = IMPLICIT_DEF
|
|
%3:vgpr_32 = IMPLICIT_DEF
|
|
%1:sgpr_32 = COPY %0.sub0
|
|
%2:vgpr_32 = COPY %1
|
|
DS_WRITE2_B32_gfx9 %2, killed %4, killed %3, 0, 1, 0, implicit $exec
|
|
...
|
|
|
|
# GCN-LABEL: name: fma_sgpr_use
|
|
# GCN: %0:sreg_64_xexec = IMPLICIT_DEF
|
|
# GCN-NEXT: %4:vgpr_32 = nnan ninf nsz arcp contract afn reassoc V_FMA_F32_e64 2, %0.sub0, 0, 1073741824, 0, %0.sub1, 0, 0, implicit $mode, implicit $exec
|
|
---
|
|
name: fma_sgpr_use
|
|
body: |
|
|
bb.0:
|
|
%0:sreg_64_xexec = IMPLICIT_DEF
|
|
%1:sgpr_32 = COPY %0.sub0
|
|
%2:sgpr_32 = COPY %0.sub1
|
|
%3:vgpr_32 = COPY %2
|
|
%4:vgpr_32 = nnan ninf nsz arcp contract afn reassoc V_FMAC_F32_e64 2, %1, 0, 1073741824, 0, %3, 0, 0, implicit $mode, implicit $exec
|
|
DS_WRITE2_B32_gfx9 undef %5:vgpr_32, killed %4, undef %6:vgpr_32, 0, 1, 0, implicit $exec
|
|
...
|
|
|
|
# GCN-LABEL: name: fma_sgpr_sgpr_use
|
|
# GCN: %0:sgpr_32 = IMPLICIT_DEF
|
|
# GCN-NEXT: %2:vgpr_32 = V_MOV_B32_e32 1234567, implicit $exec
|
|
# GCN-NEXT: %3:vgpr_32 = V_FMAC_F32_e64 0, %0, 0, 1234567, 0, %2, 0, 0, implicit $mode, implicit $exec
|
|
---
|
|
name: fma_sgpr_sgpr_use
|
|
body: |
|
|
bb.0:
|
|
%0:sgpr_32 = IMPLICIT_DEF
|
|
%1:sgpr_32 = S_MOV_B32 1234567
|
|
%2:vgpr_32 = COPY %1
|
|
%3:vgpr_32 = V_FMAC_F32_e64 0, %0, 0, %1, 0, %2, 0, 0, implicit $mode, implicit $exec
|
|
S_ENDPGM 0, implicit %3
|
|
...
|