// amdgcn_device_function_call.cpp
// 996 Bytes
// REQUIRES: amdgpu-registered-target
// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm-bc %s -o %t-ppc-host.bc
// RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple amdgcn-amd-amdhsa -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
// RUN: llvm-dis < %t-ppc-host.bc | FileCheck %s -check-prefix=HOST
// Device-side declaration: cosf is declared between the declare target
// pragmas, which marks the declaration as usable from OpenMP device code.
#pragma omp declare target
extern "C" float cosf(float __x);
#pragma omp end declare target
// Host-side declaration: the same prototype repeated outside the declare
// target region. Both declarations use C linkage, so they name the same
// unmangled symbol.
extern "C" float cosf(float __x);
// Test driver: calls cosf once in ordinary host code and once inside an
// OpenMP target region. The FileCheck directives below then inspect the IR
// of the host compilation and of the amdgcn device compilation separately.
//
// __x: input value; it is overwritten with the result of each cosf call so
//      that the calls have a use.
void test_amdgcn_openmp_device(float __x) {
// the default case where predefined library functions are treated as
// builtins on the host
// Expectation for the host IR: the cosf call below appears as a call to the
// llvm.cos.f32 intrinsic.
// HOST: call float @llvm.cos.f32(float
__x = cosf(__x);
// Everything inside the following target region is compiled for the device.
#pragma omp target
{
// cosf should not be treated as builtin on device
// Expectation for the device IR: no call to the llvm.cos.f32 intrinsic may
// appear, i.e. the cosf call must not have been turned into the intrinsic.
// CHECK-NOT: call float @llvm.cos.f32(float
__x = cosf(__x);
}
}