Headers/openmp_wrappers/math.h

f85ae058SJohannes Doerfert/*===---- openmp_wrappers/math.h ------- OpenMP math.h intercept ------ c++ -===
e62c693cSGheorghe-Teodor Bercea *
e62c693cSGheorghe-Teodor Bercea * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
e62c693cSGheorghe-Teodor Bercea * See https://llvm.org/LICENSE.txt for license information.
e62c693cSGheorghe-Teodor Bercea * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
e62c693cSGheorghe-Teodor Bercea *
e62c693cSGheorghe-Teodor Bercea *===-----------------------------------------------------------------------===
e62c693cSGheorghe-Teodor Bercea */
e62c693cSGheorghe-Teodor Bercea
17d83342SJohannes Doerfert// If we are in C++ mode and include <math.h> (not <cmath>) first, we still need
17d83342SJohannes Doerfert// to make sure <cmath> is read first. The problem otherwise is that we haven't
17d83342SJohannes Doerfert// seen the declarations of the math.h functions when the system math.h includes
17d83342SJohannes Doerfert// our cmath overlay. However, our cmath overlay, or better the underlying
17d83342SJohannes Doerfert// overlay, e.g. CUDA, uses the math.h functions. Since we haven't declared them
17d83342SJohannes Doerfert// yet we get errors. CUDA avoids this by eagerly declaring all math functions
17d83342SJohannes Doerfert// (in the __device__ space) but we cannot do this. Instead we break the
17d83342SJohannes Doerfert// dependence by forcing cmath to go first. While our cmath will in turn include
17d83342SJohannes Doerfert// this file, the cmath guards will prevent recursion.
//
// Note that this block sits ahead of this header's own include guard, so the
// __cplusplus check is evaluated every time the header is entered, not only
// on the first inclusion.
17d83342SJohannes Doerfert#ifdef __cplusplus
17d83342SJohannes Doerfert#include <cmath>
17d83342SJohannes Doerfert#endif // __cplusplus
17d83342SJohannes Doerfert
f85ae058SJohannes Doerfert#ifndef __CLANG_OPENMP_MATH_H__
f85ae058SJohannes Doerfert#define __CLANG_OPENMP_MATH_H__
e62c693cSGheorghe-Teodor Bercea
// Reject use outside of an OpenMP compilation: if _OPENMP is not defined, stop
// with an explicit diagnostic instead of continuing into the OpenMP pragmas
// further down in this header.
f85ae058SJohannes Doerfert#ifndef _OPENMP
f85ae058SJohannes Doerfert#error "This file is for OpenMP compilation only."
e62c693cSGheorghe-Teodor Bercea#endif // _OPENMP
e62c693cSGheorghe-Teodor Bercea
f85ae058SJohannes Doerfert#include_next <math.h>
f85ae058SJohannes Doerfert
f85ae058SJohannes Doerfert// We need limits.h for __clang_cuda_math.h below; since including it should
f85ae058SJohannes Doerfert// not hurt, we include it eagerly here.
f85ae058SJohannes Doerfert#include <limits.h>
f85ae058SJohannes Doerfert
f85ae058SJohannes Doerfert// We need stdlib.h because (for now) __clang_cuda_math.h below declares `abs`
f85ae058SJohannes Doerfert// which should live in stdlib.h.
f85ae058SJohannes Doerfert#include <stdlib.h>
f85ae058SJohannes Doerfert
// NVPTX device overlay: everything pulled in between `begin declare variant`
// and `end declare variant` is registered as a variant for the context named
// in the selector, i.e. device architectures nvptx and nvptx64.
// NOTE(review): `extension(match_any)` is a Clang-specific selector
// extension; presumably it lets the selector match when either listed arch
// applies -- confirm against the Clang OpenMP documentation.
f85ae058SJohannes Doerfert#pragma omp begin declare variant match(                                       \
f85ae058SJohannes Doerfert    device = {arch(nvptx, nvptx64)}, implementation = {extension(match_any)})
f85ae058SJohannes Doerfert
// __CUDA__ and __OPENMP_NVPTX__ are defined only around the include of
// __clang_cuda_math.h and removed again right after it, so neither macro
// stays defined for the code that follows this header.
// NOTE(review): the unconditional #undef also drops any __CUDA__ definition
// that existed before this header was included -- presumably none is expected
// in an OpenMP compilation; confirm.
f85ae058SJohannes Doerfert#define __CUDA__
7f1e6fcfSJohannes Doerfert#define __OPENMP_NVPTX__
f85ae058SJohannes Doerfert#include <__clang_cuda_math.h>
7f1e6fcfSJohannes Doerfert#undef __OPENMP_NVPTX__
f85ae058SJohannes Doerfert#undef __CUDA__
f85ae058SJohannes Doerfert
f85ae058SJohannes Doerfert#pragma omp end declare variant
f85ae058SJohannes Doerfert
// AMDGCN device overlay. Unlike the NVPTX region, this one is additionally
// wrapped in a plain preprocessor check: __clang_hip_math.h is only included
// at all when __AMDGCN__ is defined. Inside that check, the declarations are
// registered as variants for device architecture amdgcn.
*713a5d12SPushpinder Singh#ifdef __AMDGCN__
*713a5d12SPushpinder Singh#pragma omp begin declare variant match(device = {arch(amdgcn)})
*713a5d12SPushpinder Singh
// __OPENMP_AMDGCN__ is defined only for the duration of the include and is
// undefined again immediately afterwards.
*713a5d12SPushpinder Singh#define __OPENMP_AMDGCN__
*713a5d12SPushpinder Singh#include <__clang_hip_math.h>
*713a5d12SPushpinder Singh#undef __OPENMP_AMDGCN__
*713a5d12SPushpinder Singh
*713a5d12SPushpinder Singh#pragma omp end declare variant
*713a5d12SPushpinder Singh#endif // __AMDGCN__
*713a5d12SPushpinder Singh
f85ae058SJohannes Doerfert#endif