The motivation is that the update script has at least two deviations (`<...>@GOT`/`<...>@PLT`/ and not hiding pointer arithmetics) from what pretty much all the checklines were generated with, and most of the tests are still not updated, so each time one of the non-up-to-date tests is updated to see the effect of the code change, there is a lot of noise. Instead of having to deal with that each time, let's just deal with everything at once. This has been done via: ``` cd llvm-project/llvm/test/CodeGen/X86 grep -rl "; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py" | xargs -L1 <...>/llvm-project/llvm/utils/update_llc_test_checks.py --llc-binary <...>/llvm-project/build/bin/llc ``` Not all tests were regenerated, however.
227 lines
7.1 KiB
LLVM
227 lines
7.1 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s
|
|
|
|
define <8 x i32> @cmp00(<8 x float> %a, <8 x float> %b) nounwind {
|
|
; CHECK-LABEL: cmp00:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vcmpltps %ymm1, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = fcmp olt <8 x float> %a, %b
|
|
%s = sext <8 x i1> %bincmp to <8 x i32>
|
|
ret <8 x i32> %s
|
|
}
|
|
|
|
define <4 x i64> @cmp01(<4 x double> %a, <4 x double> %b) nounwind {
|
|
; CHECK-LABEL: cmp01:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vcmpltpd %ymm1, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = fcmp olt <4 x double> %a, %b
|
|
%s = sext <4 x i1> %bincmp to <4 x i64>
|
|
ret <4 x i64> %s
|
|
}
|
|
|
|
declare void @scale() nounwind
|
|
|
|
define void @render(double %a0) nounwind {
|
|
; CHECK-LABEL: render:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: pushq %rbp
|
|
; CHECK-NEXT: pushq %rbx
|
|
; CHECK-NEXT: pushq %rax
|
|
; CHECK-NEXT: vmovsd %xmm0, (%rsp) # 8-byte Spill
|
|
; CHECK-NEXT: xorl %eax, %eax
|
|
; CHECK-NEXT: testb %al, %al
|
|
; CHECK-NEXT: jne .LBB2_6
|
|
; CHECK-NEXT: # %bb.1: # %for.cond5.preheader
|
|
; CHECK-NEXT: xorl %ebx, %ebx
|
|
; CHECK-NEXT: movb $1, %bpl
|
|
; CHECK-NEXT: .p2align 4, 0x90
|
|
; CHECK-NEXT: .LBB2_2: # %for.cond5
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: testb %bl, %bl
|
|
; CHECK-NEXT: jne .LBB2_2
|
|
; CHECK-NEXT: # %bb.3: # %for.cond5
|
|
; CHECK-NEXT: # in Loop: Header=BB2_2 Depth=1
|
|
; CHECK-NEXT: testb %bpl, %bpl
|
|
; CHECK-NEXT: jne .LBB2_2
|
|
; CHECK-NEXT: # %bb.4: # %for.body33.preheader
|
|
; CHECK-NEXT: # in Loop: Header=BB2_2 Depth=1
|
|
; CHECK-NEXT: vmovsd (%rsp), %xmm0 # 8-byte Reload
|
|
; CHECK-NEXT: # xmm0 = mem[0],zero
|
|
; CHECK-NEXT: vucomisd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
|
|
; CHECK-NEXT: jne .LBB2_5
|
|
; CHECK-NEXT: jnp .LBB2_2
|
|
; CHECK-NEXT: .LBB2_5: # %if.then
|
|
; CHECK-NEXT: # in Loop: Header=BB2_2 Depth=1
|
|
; CHECK-NEXT: callq scale@PLT
|
|
; CHECK-NEXT: jmp .LBB2_2
|
|
; CHECK-NEXT: .LBB2_6: # %for.end52
|
|
; CHECK-NEXT: addq $8, %rsp
|
|
; CHECK-NEXT: popq %rbx
|
|
; CHECK-NEXT: popq %rbp
|
|
; CHECK-NEXT: retq
|
|
entry:
|
|
br i1 undef, label %for.cond5, label %for.end52
|
|
|
|
for.cond5:
|
|
%or.cond = and i1 undef, false
|
|
br i1 %or.cond, label %for.body33, label %for.cond5
|
|
|
|
for.cond30:
|
|
br i1 false, label %for.body33, label %for.cond5
|
|
|
|
for.body33:
|
|
%tobool = fcmp une double %a0, 0.000000e+00
|
|
br i1 %tobool, label %if.then, label %for.cond30
|
|
|
|
if.then:
|
|
call void @scale()
|
|
br label %for.cond30
|
|
|
|
for.end52:
|
|
ret void
|
|
}
|
|
|
|
define <8 x i32> @int256_cmp(<8 x i32> %i, <8 x i32> %j) nounwind {
|
|
; CHECK-LABEL: int256_cmp:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm3
|
|
; CHECK-NEXT: vpcmpgtd %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpgtd %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp slt <8 x i32> %i, %j
|
|
%x = sext <8 x i1> %bincmp to <8 x i32>
|
|
ret <8 x i32> %x
|
|
}
|
|
|
|
define <4 x i64> @v4i64_cmp(<4 x i64> %i, <4 x i64> %j) nounwind {
|
|
; CHECK-LABEL: v4i64_cmp:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm3
|
|
; CHECK-NEXT: vpcmpgtq %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp slt <4 x i64> %i, %j
|
|
%x = sext <4 x i1> %bincmp to <4 x i64>
|
|
ret <4 x i64> %x
|
|
}
|
|
|
|
define <16 x i16> @v16i16_cmp(<16 x i16> %i, <16 x i16> %j) nounwind {
|
|
; CHECK-LABEL: v16i16_cmp:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm3
|
|
; CHECK-NEXT: vpcmpgtw %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpgtw %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp slt <16 x i16> %i, %j
|
|
%x = sext <16 x i1> %bincmp to <16 x i16>
|
|
ret <16 x i16> %x
|
|
}
|
|
|
|
define <32 x i8> @v32i8_cmp(<32 x i8> %i, <32 x i8> %j) nounwind {
|
|
; CHECK-LABEL: v32i8_cmp:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm3
|
|
; CHECK-NEXT: vpcmpgtb %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpgtb %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp slt <32 x i8> %i, %j
|
|
%x = sext <32 x i1> %bincmp to <32 x i8>
|
|
ret <32 x i8> %x
|
|
}
|
|
|
|
define <8 x i32> @int256_cmpeq(<8 x i32> %i, <8 x i32> %j) nounwind {
|
|
; CHECK-LABEL: int256_cmpeq:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm3
|
|
; CHECK-NEXT: vpcmpeqd %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpeqd %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp eq <8 x i32> %i, %j
|
|
%x = sext <8 x i1> %bincmp to <8 x i32>
|
|
ret <8 x i32> %x
|
|
}
|
|
|
|
define <4 x i64> @v4i64_cmpeq(<4 x i64> %i, <4 x i64> %j) nounwind {
|
|
; CHECK-LABEL: v4i64_cmpeq:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm3
|
|
; CHECK-NEXT: vpcmpeqq %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpeqq %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp eq <4 x i64> %i, %j
|
|
%x = sext <4 x i1> %bincmp to <4 x i64>
|
|
ret <4 x i64> %x
|
|
}
|
|
|
|
define <16 x i16> @v16i16_cmpeq(<16 x i16> %i, <16 x i16> %j) nounwind {
|
|
; CHECK-LABEL: v16i16_cmpeq:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm3
|
|
; CHECK-NEXT: vpcmpeqw %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpeqw %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp eq <16 x i16> %i, %j
|
|
%x = sext <16 x i1> %bincmp to <16 x i16>
|
|
ret <16 x i16> %x
|
|
}
|
|
|
|
define <32 x i8> @v32i8_cmpeq(<32 x i8> %i, <32 x i8> %j) nounwind {
|
|
; CHECK-LABEL: v32i8_cmpeq:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vextractf128 $1, %ymm1, %xmm2
|
|
; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm3
|
|
; CHECK-NEXT: vpcmpeqb %xmm2, %xmm3, %xmm2
|
|
; CHECK-NEXT: vpcmpeqb %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm0, %ymm0
|
|
; CHECK-NEXT: retq
|
|
%bincmp = icmp eq <32 x i8> %i, %j
|
|
%x = sext <32 x i1> %bincmp to <32 x i8>
|
|
ret <32 x i8> %x
|
|
}
|
|
|
|
;; Scalar comparison
|
|
|
|
define i32 @scalarcmpA(double %a0) uwtable ssp {
|
|
; CHECK-LABEL: scalarcmpA:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vxorpd %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vcmpeqsd %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vmovq %xmm0, %rax
|
|
; CHECK-NEXT: andl $1, %eax
|
|
; CHECK-NEXT: # kill: def $eax killed $eax killed $rax
|
|
; CHECK-NEXT: retq
|
|
%cmp29 = fcmp oeq double %a0, 0.000000e+00
|
|
%res = zext i1 %cmp29 to i32
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @scalarcmpB(float %a0) uwtable ssp {
|
|
; CHECK-LABEL: scalarcmpB:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vxorps %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vcmpeqss %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: vmovd %xmm0, %eax
|
|
; CHECK-NEXT: andl $1, %eax
|
|
; CHECK-NEXT: retq
|
|
%cmp29 = fcmp oeq float %a0, 0.000000e+00
|
|
%res = zext i1 %cmp29 to i32
|
|
ret i32 %res
|
|
}
|
|
|