Files
clang-p2996/offload/test/offloading/barrier_fence.c
Ethan Luis McDonough 8823448807 [Offload] Refactor offload test requirements (#95196)
Many tests in the `offload` project have requirements defined by which
targets are not supported rather than which platforms are supported.
This patch aims to streamline the requirement definitions by adding four
new feature tags: `host`, `gpu`, `amdgpu`, and `nvidiagpu`.
2024-06-29 00:56:18 -05:00

80 lines
2.4 KiB
C

// RUN: %libomptarget-compile-generic -fopenmp-offload-mandatory -O3
// RUN: %libomptarget-run-generic
// RUN: %libomptarget-compileopt-generic -fopenmp-offload-mandatory -O3
// RUN: %libomptarget-run-generic
// REQUIRES: gpu
#include <omp.h>
#include <stdio.h>
struct IdentTy;
void __kmpc_barrier_simple_spmd(struct IdentTy *Loc, int32_t TId);
void __kmpc_barrier_simple_generic(struct IdentTy *Loc, int32_t TId);
#pragma omp begin declare target device_type(nohost)
static int A[512] __attribute__((address_space(3), loader_uninitialized));
static int B[512 * 32] __attribute__((loader_uninitialized));
#pragma omp end declare target
int main() {
printf("Testing simple spmd barrier\n");
for (int r = 0; r < 50; r++) {
#pragma omp target teams distribute thread_limit(512) num_teams(440)
for (int j = 0; j < 512 * 32; ++j) {
#pragma omp parallel firstprivate(j)
{
int TId = omp_get_thread_num();
int TeamId = omp_get_team_num();
int NT = omp_get_num_threads();
// Sequential
for (int i = 0; i < NT; ++i) {
// Test shared memory globals
if (TId == i)
A[i] = i + j;
__kmpc_barrier_simple_spmd(0, TId);
if (A[i] != i + j)
__builtin_trap();
__kmpc_barrier_simple_spmd(0, TId);
// Test generic globals
if (TId == i)
B[TeamId] = i;
__kmpc_barrier_simple_spmd(0, TId);
if (B[TeamId] != i)
__builtin_trap();
__kmpc_barrier_simple_spmd(0, TId);
}
}
}
}
printf("Testing simple generic barrier\n");
for (int r = 0; r < 50; r++) {
#pragma omp target teams distribute thread_limit(512) num_teams(440)
for (int j = 0; j < 512 * 32; ++j) {
#pragma omp parallel firstprivate(j)
{
int TId = omp_get_thread_num();
int TeamId = omp_get_team_num();
int NT = omp_get_num_threads();
// Sequential
for (int i = 0; i < NT; ++i) {
if (TId == i)
A[i] = i + j;
__kmpc_barrier_simple_generic(0, TId);
if (A[i] != i + j)
__builtin_trap();
__kmpc_barrier_simple_generic(0, TId);
if (TId == i)
B[TeamId] = i;
__kmpc_barrier_simple_generic(0, TId);
if (B[TeamId] != i)
__builtin_trap();
__kmpc_barrier_simple_generic(0, TId);
}
}
}
}
return 0;
}