| 1 | // RUN: %clang_cc1 -triple amdgcn -fcuda-is-device -emit-llvm %s -o - | FileCheck %s |
| 2 | #include "Inputs/cuda.h" |
| 3 | |
| 4 | // CHECK: define amdgpu_kernel void @_ZN1A6kernelEv |
| 5 | class A { |
| 6 | public: |
| 7 | static __global__ void kernel(){} |
| 8 | }; |
| 9 | |
| 10 | // CHECK: define void @_Z10non_kernelv |
| 11 | __device__ void non_kernel(){} |
| 12 | |
| 13 | // CHECK: define amdgpu_kernel void @_Z6kerneli |
| 14 | __global__ void kernel(int x) { |
| 15 | non_kernel(); |
| 16 | } |
| 17 | |
| 18 | // CHECK: define amdgpu_kernel void @_Z11EmptyKernelIvEvv |
| 19 | template <typename T> |
| 20 | __global__ void EmptyKernel(void) {} |
| 21 | |
| 22 | struct Dummy { |
| 23 | /// Type definition of the EmptyKernel kernel entry point |
| 24 | typedef void (*EmptyKernelPtr)(); |
| 25 | EmptyKernelPtr Empty() { return EmptyKernel<void>; } |
| 26 | }; |
| 27 | |
| 28 | // CHECK: define amdgpu_kernel void @_Z15template_kernelI1AEvT_ |
| 29 | template<class T> |
| 30 | __global__ void template_kernel(T x) {} |
| 31 | |
| 32 | void launch(void *f); |
| 33 | |
| 34 | int main() { |
| 35 | Dummy D; |
| 36 | launch((void*)A::kernel); |
| 37 | launch((void*)kernel); |
| 38 | launch((void*)template_kernel<A>); |
| 39 | launch((void*)D.Empty()); |
| 40 | return 0; |
| 41 | } |
| 42 | |