blob: 41b8a3bdae07735b7d9490ccfa62b352ec1947a6 [file] [edit]
// REQUIRES: amdgpu-registered-target
// REQUIRES: nvptx-registered-target
// Implicit-H+D functions reached only via an explicit template instantiation
// get a real body if their device codegen is clean, or a trap body if it
// would otherwise raise a target-mismatch diagnostic.
// RUN: %clang_cc1 -triple amdgcn-amd-amdhsa -fcuda-is-device -x hip \
// RUN: -emit-llvm -o - %s | FileCheck %s
// RUN: %clang_cc1 -triple nvptx64-nvidia-cuda -fcuda-is-device -x hip \
// RUN: -emit-llvm -o - %s | FileCheck %s
#include "Inputs/cuda.h"
__host__ int host_only() { return 7; }
// Class-template member, safe body.
template <typename T>
struct ETI_Safe {
constexpr T add_one(T x) { return x + (T)1; }
};
template class ETI_Safe<float>;
// CHECK: define {{.*}} float @_ZN8ETI_SafeIfE7add_oneEf(
// CHECK-NOT: call void @llvm.trap()
// CHECK: ret float
// Class-template member, body calls a __host__-only function.
template <typename T>
struct ETI_BadBody {
constexpr T call_host(T x) { return x + (T)host_only(); }
};
template class ETI_BadBody<float>;
// CHECK-LABEL: define {{.*}} float @_ZN11ETI_BadBodyIfE9call_hostEf(
// CHECK: call void @llvm.trap()
// CHECK-NEXT: ret float poison
// Function-template form, safe body.
template <typename T>
constexpr T ft_safe(T x) { return x + (T)1; }
template float ft_safe<float>(float);
// CHECK: define {{.*}} float @_Z7ft_safeIfET_S0_(
// CHECK-NOT: call void @llvm.trap()
// CHECK: ret float
// Function-template form, body calls a __host__-only function.
template <typename T>
constexpr T ft_bad(T x) { return x + (T)host_only(); }
template float ft_bad<float>(float);
// CHECK-LABEL: define {{.*}} float @_Z6ft_badIfET_S0_(
// CHECK: call void @llvm.trap()
// CHECK-NEXT: ret float poison
__global__ void kernel(float *p) { *p = 1.0f; }
// CHECK-NOT: __clang_hip_unreachable_dtor
// CHECK-NOT: __clang_cuda_unreachable_dtor