// clang-p2996/offload/test/mapping/target_uses_allocator.c

// RUN: %libomptarget-compile-run-and-check-generic

// FIXME: https://github.com/llvm/llvm-project/issues/77841
// UNSUPPORTED: amdgcn-amd-amdhsa
// UNSUPPORTED: nvptx64-nvidia-cuda
// UNSUPPORTED: nvptx64-nvidia-cuda-LTO

#include <omp.h>
#include <stdio.h>

#define N 1024

int test_omp_aligned_alloc_on_device() {
  int errors = 0;

  omp_memspace_handle_t memspace = omp_default_mem_space;
  omp_alloctrait_t traits[2] = {{omp_atk_alignment, 64}, {omp_atk_access, 64}};
  omp_allocator_handle_t alloc =
      omp_init_allocator(omp_default_mem_space, 1, traits);

#pragma omp target map(tofrom : errors) uses_allocators(alloc(traits))
  {
    int *x;
    int not_correct_array_values = 0;

    x = (int *)omp_aligned_alloc(64, N * sizeof(int), alloc);
    if (x == NULL) {
      errors++;
    } else {
#pragma omp parallel for simd simdlen(16) aligned(x : 64)
      for (int i = 0; i < N; i++) {
        x[i] = i;
      }

#pragma omp parallel for simd simdlen(16) aligned(x : 64)
      for (int i = 0; i < N; i++) {
        if (x[i] != i) {
#pragma omp atomic write
          not_correct_array_values = 1;
        }
      }
      if (not_correct_array_values) {
        errors++;
      }
      omp_free(x, alloc);
    }
  }

  omp_destroy_allocator(alloc);

  return errors;
}

// Runs the aligned-allocation test and prints the verdict that the test
// harness matches against. The exit status mirrors the verdict: 0 when the
// test passed, 1 when it reported any error.
int main() {
  if (test_omp_aligned_alloc_on_device()) {
    printf("FAILED\n");
    return 1;
  }

  // CHECK: PASSED
  printf("PASSED\n");
  return 0;
}