With this PR, if we have a customized implementation for scalar or vector length = 2, we don't need to write new macros, e.g. https://github.com/intel/llvm/blob/fb18321705f6/libclc/clc/include/clc/clcmacro.h#L15

Undef __HALF_ONLY, __FLOAT_ONLY and __DOUBLE_ONLY at the end of clc/include/clc/math/gentype.inc.

llvm-diff shows no change to nvptx64--nvidiacl.bc and amdgcn--amdhsa.bc.
21 lines
657 B
C
21 lines
657 B
C
//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

// Header for __clc_half_divide. It contains no declarations of its own: it
// sets three configuration macros and then includes <clc/math/gentype.inc>.
// NOTE(review): presumably gentype.inc includes __CLC_BODY once per selected
// type so that binary_decl.inc can declare a two-operand overload of
// __CLC_FUNCTION for each of them -- confirm against those two .inc files.

#ifndef __CLC_MATH_CLC_HALF_DIVIDE_H__
#define __CLC_MATH_CLC_HALF_DIVIDE_H__

// Configuration read by <clc/math/gentype.inc>; all three must be defined
// before the #include below.
//   __FLOAT_ONLY   - type-selection switch (siblings: __HALF_ONLY and
//                    __DOUBLE_ONLY); presumably limits expansion to the
//                    float types -- TODO confirm.
//   __CLC_FUNCTION - name of the function being declared.
//   __CLC_BODY     - the file pulled in as the per-type body.
#define __FLOAT_ONLY
#define __CLC_FUNCTION __clc_half_divide
#define __CLC_BODY <clc/shared/binary_decl.inc>

#include <clc/math/gentype.inc>

// Only __CLC_FUNCTION is cleaned up here.
// NOTE(review): __FLOAT_ONLY is expected to be undefined at the end of
// gentype.inc, and __CLC_BODY presumably is as well -- confirm, otherwise
// both leak into every file that includes this header.
#undef __CLC_FUNCTION

#endif // __CLC_MATH_CLC_HALF_DIVIDE_H__