Files
clang-p2996/clang/test/CodeGenOpenCL/builtins-amdgcn-gfx1250-load-tr.cl

131 lines
5.3 KiB
Common Lisp

// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py
// REQUIRES: amdgpu-registered-target
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx1250 -target-feature +wavefrontsize32 -emit-llvm -o - %s | FileCheck %s --check-prefix=CHECK-GFX1250
typedef int v2i __attribute__((ext_vector_type(2)));
typedef int v3i __attribute__((ext_vector_type(3)));
typedef int v4i __attribute__((ext_vector_type(4)));
typedef short v8s __attribute__((ext_vector_type(8)));
typedef half v8h __attribute__((ext_vector_type(8)));
typedef __bf16 v8y __attribute__((ext_vector_type(8)));
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr4_b64_v2i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <2 x i32> @llvm.amdgcn.global.load.tr4.b64.v2i32(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <2 x i32> [[TMP0]]
//
v2i test_amdgcn_global_load_tr4_b64_v2i32(global v2i* inptr)
{
return __builtin_amdgcn_global_load_tr4_b64_v2i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr8_b64_v2i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <2 x i32> @llvm.amdgcn.global.load.tr.b64.v2i32(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <2 x i32> [[TMP0]]
//
v2i test_amdgcn_global_load_tr8_b64_v2i32(global v2i* inptr)
{
return __builtin_amdgcn_global_load_tr8_b64_v2i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr6_b96_v3i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <3 x i32> @llvm.amdgcn.global.load.tr6.b96.v3i32(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <3 x i32> [[TMP0]]
//
v3i test_amdgcn_global_load_tr6_b96_v3i32(global v3i* inptr)
{
return __builtin_amdgcn_global_load_tr6_b96_v3i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr16_b128_v8i16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x i16> @llvm.amdgcn.global.load.tr.b128.v8i16(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x i16> [[TMP0]]
//
v8s test_amdgcn_global_load_tr16_b128_v8i16(global v8s* inptr)
{
return __builtin_amdgcn_global_load_tr16_b128_v8i16(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr16_b128_v8f16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x half> @llvm.amdgcn.global.load.tr.b128.v8f16(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x half> [[TMP0]]
//
v8h test_amdgcn_global_load_tr16_b128_v8f16(global v8h* inptr)
{
return __builtin_amdgcn_global_load_tr16_b128_v8f16(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_global_load_tr16_b128_v8bf16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x bfloat> @llvm.amdgcn.global.load.tr.b128.v8bf16(ptr addrspace(1) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x bfloat> [[TMP0]]
//
v8y test_amdgcn_global_load_tr16_b128_v8bf16(global v8y* inptr)
{
return __builtin_amdgcn_global_load_tr16_b128_v8bf16(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr4_b64_v2i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <2 x i32> @llvm.amdgcn.ds.load.tr4.b64.v2i32(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <2 x i32> [[TMP0]]
//
v2i test_amdgcn_ds_load_tr4_b64_v2i32(local v2i* inptr)
{
return __builtin_amdgcn_ds_load_tr4_b64_v2i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr8_b64_v2i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <2 x i32> @llvm.amdgcn.ds.load.tr8.b64.v2i32(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <2 x i32> [[TMP0]]
//
v2i test_amdgcn_ds_load_tr8_b64_v2i32(local v2i* inptr)
{
return __builtin_amdgcn_ds_load_tr8_b64_v2i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr6_b96_v3i32(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <3 x i32> @llvm.amdgcn.ds.load.tr6.b96.v3i32(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <3 x i32> [[TMP0]]
//
v3i test_amdgcn_ds_load_tr6_b96_v3i32(local v3i* inptr)
{
return __builtin_amdgcn_ds_load_tr6_b96_v3i32(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr16_b128_v8i16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x i16> @llvm.amdgcn.ds.load.tr16.b128.v8i16(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x i16> [[TMP0]]
//
v8s test_amdgcn_ds_load_tr16_b128_v8i16(local v8s* inptr)
{
return __builtin_amdgcn_ds_load_tr16_b128_v8i16(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr16_b128_v8f16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x half> @llvm.amdgcn.ds.load.tr16.b128.v8f16(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x half> [[TMP0]]
//
v8h test_amdgcn_ds_load_tr16_b128_v8f16(local v8h* inptr)
{
return __builtin_amdgcn_ds_load_tr16_b128_v8f16(inptr);
}
// CHECK-GFX1250-LABEL: @test_amdgcn_ds_load_tr16_b128_v8bf16(
// CHECK-GFX1250-NEXT: entry:
// CHECK-GFX1250-NEXT: [[TMP0:%.*]] = tail call <8 x bfloat> @llvm.amdgcn.ds.load.tr16.b128.v8bf16(ptr addrspace(3) [[INPTR:%.*]])
// CHECK-GFX1250-NEXT: ret <8 x bfloat> [[TMP0]]
//
v8y test_amdgcn_ds_load_tr16_b128_v8bf16(local v8y* inptr)
{
return __builtin_amdgcn_ds_load_tr16_b128_v8bf16(inptr);
}