Files
clang-p2996/clang/test/OpenMP/target_num_teams_num_threads_attributes.cpp
Johannes Doerfert 31b91213bd [OpenMP] Unify the min/max thread/teams pathways
We used to pass the min/max threads/teams values through different paths
from the frontend to the middle end. This simplifies the situation by
passing the values once, only when we will create the KernelEnvironment,
which contains the values. At that point we also manifest the metadata,
as appropriate. Some footguns have also been removed, e.g., our target
check is now triple-based, not calling convention-based, as the latter
is dependent on the ordering of operations. The types of the values have
been unified to int32_t.
2023-10-29 10:53:20 -07:00

92 lines
2.8 KiB
C++

// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm-bc %s -o %t-ppc-host.bc
// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple amdgcn-amd-amdhsa -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -fopenmp-is-target-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
// RUN: %clang_cc1 -target-cpu gfx900 -fopenmp -x c++ -std=c++11 -triple amdgcn-amd-amdhsa -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -fopenmp-is-target-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -fopenmp-targets=nvptx64 -emit-llvm-bc %s -o %t-ppc-host.bc
// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple nvptx64 -fopenmp-targets=nvptx64 -emit-llvm %s -fopenmp-is-target-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
// RUN: %clang_cc1 -target-cpu sm_80 -fopenmp -x c++ -std=c++11 -triple nvptx64 -fopenmp-targets=nvptx64 -emit-llvm %s -fopenmp-is-target-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
// expected-no-diagnostics
#ifndef HEADER
#define HEADER
void default_val_num_teams() {
#pragma omp target simd
for (int i = 0; i < 22; i++)
int a_var;
}
void foo1() {
#pragma omp target teams num_teams(22)
{ int a_var; }
}
void foo2() {
#pragma omp target teams distribute num_teams(22)
for (int i = 0; i < 22; i++)
int a_var;
}
void foo3() {
#pragma omp target teams distribute parallel for num_teams(22)
for (int i = 0; i < 22; i++)
int a_var;
}
void bar1() {
#pragma omp target teams num_teams(22)
{ int a_var; }
}
void bar2() {
#pragma omp target teams distribute num_teams(33)
for (int i = 0; i < 22; i++)
int a_var;
}
void bar3() {
#pragma omp target teams distribute parallel for num_teams(44)
for (int i = 0; i < 22; i++)
int a_var;
}
void const_int() {
const int NT = 22;
#pragma omp target teams num_teams(NT)
{ int a_var; }
}
void thread_limit() {
#pragma omp target teams thread_limit(22)
{ int a_var; }
}
void num_threads() {
#pragma omp target teams distribute parallel for thread_limit(22) num_threads(11)
for (int i = 0; i < 22; i++)
int a_var;
}
void threads_and_teams() {
#pragma omp target teams distribute parallel for thread_limit(22) num_teams(33)
for (int i = 0; i < 22; i++)
int a_var;
}
#endif
// CHECK: "omp_target_num_teams"="1"
// CHECK: "omp_target_num_teams"="22"
// CHECK: "omp_target_num_teams"="33"
// CHECK: "omp_target_num_teams"="44"
// CHECK: "omp_target_thread_limit"="22"
// CHECK: "omp_target_thread_limit"="11"
// CHECK: "omp_target_num_teams"="33"
// CHECK-SAME: "omp_target_thread_limit"="22"