// REQUIRES: amdgpu-registered-target // RUN: %clang_cc1 -no-opaque-pointers -include __clang_hip_runtime_wrapper.h \ // RUN: -internal-isystem %S/../../lib/Headers/cuda_wrappers \ // RUN: -internal-isystem %S/Inputs/include \ // RUN: -triple amdgcn-amd-amdhsa -aux-triple x86_64-unknown-unknown \ // RUN: -target-cpu gfx906 -emit-llvm %s -fcuda-is-device -o - \ // RUN: -D__HIPCC_RTC__ | FileCheck -check-prefixes=CHECK,NOMALLOC %s // RUN: %clang_cc1 -no-opaque-pointers -include __clang_hip_runtime_wrapper.h \ // RUN: -internal-isystem %S/../../lib/Headers/cuda_wrappers \ // RUN: -internal-isystem %S/Inputs/include \ // RUN: -include cmath \ // RUN: -triple amdgcn-amd-amdhsa -aux-triple x86_64-unknown-unknown \ // RUN: -target-cpu gfx906 -emit-llvm %s -fcuda-is-device -o - \ // RUN: -D__HIPCC_RTC__ | FileCheck %s -check-prefixes=AMD_BOOL_RETURN // RUN: %clang_cc1 -no-opaque-pointers -include __clang_hip_runtime_wrapper.h \ // RUN: -internal-isystem %S/../../lib/Headers/cuda_wrappers \ // RUN: -internal-isystem %S/Inputs/include \ // RUN: -include cmath \ // RUN: -triple amdgcn-amd-amdhsa -aux-triple x86_64-unknown-unknown \ // RUN: -target-cpu gfx906 -emit-llvm %s -fcuda-is-device -o - \ // RUN: -D__HIPCC_RTC__ -DUSE_ISNAN_WITH_INT_RETURN | FileCheck %s -check-prefixes=AMD_INT_RETURN // RUN: %clang_cc1 -no-opaque-pointers -include __clang_hip_runtime_wrapper.h \ // RUN: -internal-isystem %S/../../lib/Headers/cuda_wrappers \ // RUN: -internal-isystem %S/Inputs/include \ // RUN: -triple amdgcn-amd-amdhsa -aux-triple x86_64-unknown-unknown \ // RUN: -target-cpu gfx906 -emit-llvm %s -fcuda-is-device -o - \ // RUN: -D__HIPCC_RTC__ -std=c++14 | FileCheck -check-prefixes=CHECK,CXX14 %s // RUN: %clang_cc1 -no-opaque-pointers -include __clang_hip_runtime_wrapper.h \ // RUN: -internal-isystem %S/../../lib/Headers/cuda_wrappers \ // RUN: -internal-isystem %S/Inputs/include \ // RUN: -triple amdgcn-amd-amdhsa -aux-triple x86_64-unknown-unknown \ // RUN: -target-cpu gfx906 -emit-llvm %s -fcuda-is-device -o - \ // RUN: -DHIP_VERSION_MAJOR=4 -DHIP_VERSION_MINOR=5 \ // RUN: -D__HIPCC_RTC__ | FileCheck -check-prefixes=CHECK,MALLOC %s // expected-no-diagnostics // Check support for pure and deleted virtual functions struct base { __host__ __device__ virtual void pv() = 0; __host__ __device__ virtual void dv() = delete; }; struct derived:base { __host__ __device__ virtual void pv() override {}; }; __device__ void test_vf() { derived d; } // CHECK: @_ZTV7derived = linkonce_odr unnamed_addr addrspace(1) constant { [4 x i8*] } { [4 x i8*] [i8* null, i8* null, i8* bitcast (void (%struct.derived*)* @_ZN7derived2pvEv to i8*), i8* bitcast (void ()* @__cxa_deleted_virtual to i8*)] }, comdat, align 8 // CHECK: @_ZTV4base = linkonce_odr unnamed_addr addrspace(1) constant { [4 x i8*] } { [4 x i8*] [i8* null, i8* null, i8* bitcast (void ()* @__cxa_pure_virtual to i8*), i8* bitcast (void ()* @__cxa_deleted_virtual to i8*)] }, comdat, align 8 // CHECK: define{{.*}}void @__cxa_pure_virtual() // CHECK: define{{.*}}void @__cxa_deleted_virtual() struct Number { __device__ Number(float _x) : x(_x) {} float x; }; #if __cplusplus >= 201103L // Check __hip::__numeric_type can be used with a class without default ctor. __device__ void test_numeric_type() { int x = __hip::__numeric_type<Number>::value; } // ToDo: Fix __clang_hip_cmake.h to specialize __hip::is_arithmetic<_Float16> // to resolve fma(_Float16, _Float16, int) to fma(double, double, double) // instead of fma(_Float16, _Float16, _Float16). // CXX14-LABEL: define{{.*}}@_Z8test_fma // CXX14: call {{.*}}@__ocml_fma_f16 __device__ double test_fma(_Float16 h, int i) { return fma(h, h, i); } #endif // CHECK-LABEL: amdgpu_kernel void @_Z4kernPff __global__ void kern(float *x, float y) { *x = sin(y); } // CHECK-LABEL: define{{.*}} i64 @_Z11test_size_tv // CHECK: ret i64 8 __device__ size_t test_size_t() { return sizeof(size_t); } // Check there is no ambiguity when calling overloaded math functions. // CHECK-LABEL: define{{.*}}@_Z10test_floorv // CHECK: call {{.*}}double @__ocml_floor_f64(double __device__ float test_floor() { return floor(5); } // CHECK-LABEL: define{{.*}}@_Z8test_maxv // CHECK: call {{.*}}double @__ocml_fmax_f64(double {{.*}}, double __device__ float test_max() { return max(5, 6.0); } // CHECK-LABEL: define{{.*}}@_Z10test_isnanv __device__ double test_isnan() { double r = 0; double d = 5.0; float f = 5.0; // AMD_INT_RETURN: call i32 @__ocml_isnan_f32(float // AMD_BOOL_RETURN: call i32 @__ocml_isnan_f32(float r += isnan(f); // AMD_INT_RETURN: call i32 @__ocml_isnan_f64(double // AMD_BOOL_RETURN: call i32 @__ocml_isnan_f64(double r += isnan(d); return r ; } // Check that device malloc and free do not conflict with std headers. #include <cstdlib> // CHECK-LABEL: define{{.*}}@_Z11test_malloc // CHECK: call {{.*}}i8* @malloc(i64 // CHECK-LABEL: define weak {{.*}}i8* @malloc(i64 // MALLOC: call i64 @__ockl_dm_alloc // NOMALLOC: call void @llvm.trap __device__ void test_malloc(void *a) { a = malloc(42); } // CHECK-LABEL: define{{.*}}@_Z9test_free // CHECK: call {{.*}}void @free(i8* // CHECK-LABEL: define weak {{.*}}void @free(i8* // MALLOC: call void @__ockl_dm_dealloc // NOMALLOC: call void @llvm.trap __device__ void test_free(void *a) { free(a); }