Many tests in the `offload` project have requirements defined by which targets are not supported rather than which platforms are supported. This patch aims to streamline the requirement definitions by adding four new feature tags: `host`, `gpu`, `amdgpu`, and `nvidiagpu`.
41 lines
1.5 KiB
C
41 lines
1.5 KiB
C
// clang-format off
|
|
// RUN: %libomptarget-compile-generic
|
|
// RUN: env LIBOMPTARGET_INFO=16 \
|
|
// RUN: %libomptarget-run-generic 2>&1 | %fcheck-generic --check-prefix=DEFAULT
|
|
// RUN: env LIBOMPTARGET_INFO=16 LIBOMPTARGET_MIN_THREADS_FOR_LOW_TRIP_COUNT=8 \
|
|
// RUN: %libomptarget-run-generic 2>&1 | %fcheck-generic --check-prefix=EIGHT
|
|
|
|
// REQUIRES: gpu
|
|
|
|
#define N 128
|
|
|
|
__attribute__((optnone)) void optnone() {}
|
|
|
|
int main() {
|
|
// DEFAULT: Launching kernel {{.+_main_.+}} with 4 blocks and 32 threads in SPMD mode
|
|
// EIGHT: Launching kernel {{.+_main_.+}} with 16 blocks and 8 threads in SPMD mode
|
|
#pragma omp target teams distribute parallel for simd
|
|
for (int i = 0; i < N; ++i) {
|
|
optnone();
|
|
}
|
|
// DEFAULT: Launching kernel {{.+_main_.+}} with 4 blocks and 32 threads in SPMD mode
|
|
// EIGHT: Launching kernel {{.+_main_.+}} with 16 blocks and 8 threads in SPMD mode
|
|
#pragma omp target teams distribute parallel for simd
|
|
for (int i = 0; i < N - 1; ++i) {
|
|
optnone();
|
|
}
|
|
// DEFAULT: Launching kernel {{.+_main_.+}} with 5 blocks and 32 threads in SPMD mode
|
|
// EIGHT: Launching kernel {{.+_main_.+}} with 17 blocks and 8 threads in SPMD mode
|
|
#pragma omp target teams distribute parallel for simd
|
|
for (int i = 0; i < N + 1; ++i) {
|
|
optnone();
|
|
}
|
|
// DEFAULT: Launching kernel {{.+_main_.+}} with 32 blocks and 4 threads in SPMD mode
|
|
// EIGHT: Launching kernel {{.+_main_.+}} with 32 blocks and 4 threads in SPMD mode
|
|
#pragma omp target teams distribute parallel for simd thread_limit(4)
|
|
for (int i = 0; i < N; ++i) {
|
|
optnone();
|
|
}
|
|
}
|
|
|