With this PR, if we have customized implementation for scalar or vector length = 2, we don't need to write new macros, e.g. https://github.com/intel/llvm/blob/fb18321705f6/libclc/clc/include/clc/clcmacro.h#L15 Undef __HALF_ONLY, __FLOAT_ONLY and __DOUBLE_ONLY at the end of clc/include/clc/math/gentype.inc llvm-diff shows no change to nvptx64--nvidiacl.bc and amdgcn--amdhsa.bc
54 lines
1.8 KiB
Common Lisp
54 lines
1.8 KiB
Common Lisp
//===----------------------------------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include <clc/clc_convert.h>
|
|
#include <clc/integer/clc_clz.h>
|
|
#include <clc/integer/clc_mul_hi.h>
|
|
#include <clc/internal/clc.h>
|
|
#include <clc/math/clc_fma.h>
|
|
#include <clc/math/clc_mad.h>
|
|
#include <clc/math/clc_native_divide.h>
|
|
#include <clc/math/clc_trunc.h>
|
|
#include <clc/math/math.h>
|
|
|
|
#define bitalign(hi, lo, shift) ((hi) << (32 - (shift))) | ((lo) >> (shift));
|
|
|
|
#define FULL_MUL(A, B, HI, LO) \
|
|
LO = A * B; \
|
|
HI = __clc_mul_hi(A, B)
|
|
|
|
#define FULL_MAD(A, B, C, HI, LO) \
|
|
LO = ((A) * (B) + (C)); \
|
|
HI = __clc_mul_hi(A, B); \
|
|
HI += LO < C ? 1U : 0U;
|
|
|
|
#define __FLOAT_ONLY
|
|
#define __CLC_BODY <clc_sincos_helpers.inc>
|
|
|
|
#include <clc/math/gentype.inc>
|
|
|
|
#ifdef cl_khr_fp64
|
|
|
|
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
|
|
|
|
#include <clc/math/clc_fract.h>
|
|
#include <clc/math/tables.h>
|
|
#include <clc/shared/clc_max.h>
|
|
|
|
#define bytealign(src0, src1, src2) \
|
|
(__CLC_CONVERT_UINTN( \
|
|
((__CLC_CONVERT_LONGN((src0)) << 32) | __CLC_CONVERT_LONGN((src1))) >> \
|
|
(((src2) & 3) * 8)))
|
|
|
|
#define __DOUBLE_ONLY
|
|
#define __CLC_BODY <clc_sincos_helpers_fp64.inc>
|
|
|
|
#include <clc/math/gentype.inc>
|
|
|
|
#endif
|