//===--------- Misc.cpp - OpenMP device misc interfaces ----------- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // //===----------------------------------------------------------------------===// #include "Allocator.h" #include "Configuration.h" #include "Types.h" #include "Debug.h" #pragma omp begin declare target device_type(nohost) namespace ompx { namespace impl { double getWTick(); double getWTime(); /// AMDGCN Implementation /// ///{ #pragma omp begin declare variant match(device = {arch(amdgcn)}) double getWTick() { // The number of ticks per second for the AMDGPU clock varies by card and can // only be retrived by querying the driver. We rely on the device environment // to inform us what the proper frequency is. return 1.0 / config::getClockFrequency(); } double getWTime() { uint64_t NumTicks = 0; if constexpr (__has_builtin(__builtin_amdgcn_s_sendmsg_rtnl)) NumTicks = __builtin_amdgcn_s_sendmsg_rtnl(0x83); else if constexpr (__has_builtin(__builtin_amdgcn_s_memrealtime)) NumTicks = __builtin_amdgcn_s_memrealtime(); else if constexpr (__has_builtin(__builtin_amdgcn_s_memtime)) NumTicks = __builtin_amdgcn_s_memtime(); return static_cast(NumTicks) * getWTick(); } #pragma omp end declare variant /// NVPTX Implementation /// ///{ #pragma omp begin declare variant match( \ device = {arch(nvptx, nvptx64)}, \ implementation = {extension(match_any)}) double getWTick() { // Timer precision is 1ns return ((double)1E-9); } double getWTime() { uint64_t nsecs = __nvvm_read_ptx_sreg_globaltimer(); return static_cast(nsecs) * getWTick(); } #pragma omp end declare variant /// Lookup a device-side function using a host pointer /p HstPtr using the table /// provided by the device plugin. The table is an ordered pair of host and /// device pointers sorted on the value of the host pointer. void *indirectCallLookup(void *HstPtr) { if (!HstPtr) return nullptr; struct IndirectCallTable { void *HstPtr; void *DevPtr; }; IndirectCallTable *Table = reinterpret_cast(config::getIndirectCallTablePtr()); uint64_t TableSize = config::getIndirectCallTableSize(); // If the table is empty we assume this is device pointer. if (!Table || !TableSize) return HstPtr; uint32_t Left = 0; uint32_t Right = TableSize; // If the pointer is definitely not contained in the table we exit early. if (HstPtr < Table[Left].HstPtr || HstPtr > Table[Right - 1].HstPtr) return HstPtr; while (Left != Right) { uint32_t Current = Left + (Right - Left) / 2; if (Table[Current].HstPtr == HstPtr) return Table[Current].DevPtr; if (HstPtr < Table[Current].HstPtr) Right = Current; else Left = Current; } // If we searched the whole table and found nothing this is a device pointer. return HstPtr; } } // namespace impl } // namespace ompx /// Interfaces /// ///{ extern "C" { int32_t __kmpc_cancellationpoint(IdentTy *, int32_t, int32_t) { return 0; } int32_t __kmpc_cancel(IdentTy *, int32_t, int32_t) { return 0; } double omp_get_wtick(void) { return ompx::impl::getWTick(); } double omp_get_wtime(void) { return ompx::impl::getWTime(); } void *__llvm_omp_indirect_call_lookup(void *HstPtr) { return ompx::impl::indirectCallLookup(HstPtr); } void *omp_alloc(size_t size, omp_allocator_handle_t allocator) { switch (allocator) { case omp_default_mem_alloc: case omp_large_cap_mem_alloc: case omp_const_mem_alloc: case omp_high_bw_mem_alloc: case omp_low_lat_mem_alloc: return malloc(size); default: return nullptr; } } void omp_free(void *ptr, omp_allocator_handle_t allocator) { switch (allocator) { case omp_default_mem_alloc: case omp_large_cap_mem_alloc: case omp_const_mem_alloc: case omp_high_bw_mem_alloc: case omp_low_lat_mem_alloc: free(ptr); case omp_null_allocator: default: return; } } } ///} #pragma omp end declare target