
This patch is part of the upstreaming effort for supporting the SYCL language front end. It makes the following changes: 1. Adds the sycl_external attribute for functions with external linkage, which is intended to be used to implement the SYCL_EXTERNAL macro as specified by the SYCL 2020 specification; 2. Adds checks to avoid emitting device code when sycl_external and sycl_kernel_entry_point attributes are not enabled; 3. Fixes test failures caused by the above changes. This patch does not yet implement the following diagnostics listed in the SYCL 2020 specification's section 5.10.1, which will be addressed in a subsequent PR: Functions that are declared using SYCL_EXTERNAL have the following additional restrictions beyond those imposed on other device functions: 1. If the SYCL backend does not support the generic address space then the function cannot use raw pointers as parameter or return types. Explicit pointer classes must be used instead; 2. The function cannot call group::parallel_for_work_item; 3. The function cannot be called from a parallel_for_work_group scope. In addition to that, the subsequent PR will also implement diagnostics for inline functions, including virtual functions defined as inline. --------- Co-authored-by: Mariya Podchishchaeva <mariya.podchishchaeva@intel.com>
61 lines
2.1 KiB
C++
61 lines
2.1 KiB
C++
// RUN: %clang_cc1 %s -o - -O0 -emit-llvm \
// RUN: -triple spir64-unknown-unknown \
// RUN: -aux-triple x86_64-unknown-linux-gnu \
// RUN: -fsycl-is-device \
// RUN: -finclude-default-header \
// RUN: -debug-info-kind=limited -gno-column-info \
// RUN: | FileCheck %s
//
// In spir functions, validate that the #dbg_declare records (the replacement
// for llvm.dbg.declare intrinsics) created for parameters and locals refer to
// the stack allocation in the alloca address space.
//

// Shorthand for Clang's sycl_kernel attribute; used on parallel_for below.
#define KERNEL __attribute__((sycl_kernel))

// Minimal kernel-launch helper: invokes KernelFunc exactly once.
// KernelName is not referenced in the body; callers pass a distinct type for
// it (my_host uses `class K`).
template <typename KernelName, typename KernelType>
KERNEL void parallel_for(const KernelType &KernelFunc) {
  KernelFunc();
}

// Function whose IR and debug info the CHECK lines in this file inspect.
// The function name (mangled as _Z9my_kerneli), the parameter `my_param` and
// the local `my_local` are all matched by name in those CHECK lines, so they
// must not be renamed.
[[clang::sycl_external]] void my_kernel(int my_param) {
  int my_local = 0;
  my_local = my_param;
}

// Host-side driver: wraps a call to my_kernel in a by-copy lambda and hands it
// to parallel_for. Always returns 0.
int my_host() {
  parallel_for<class K>([=]() { my_kernel(42); });
  return 0;
}

// CHECK: define {{.*}}spir_func void @_Z9my_kerneli(
// CHECK-SAME: i32 {{.*}}%my_param
// CHECK-SAME: !dbg [[MY_KERNEL:![0-9]+]]
// CHECK-SAME: {
// CHECK: %my_param.addr = alloca i32, align 4
// CHECK: %my_local = alloca i32, align 4
// CHECK: #dbg_declare(
// CHECK-SAME: ptr %my_param.addr,
// CHECK-SAME: [[MY_PARAM:![0-9]+]],
// CHECK-SAME: !DIExpression(DW_OP_constu, 4, DW_OP_swap, DW_OP_xderef)
// CHECK-SAME: )
// CHECK: #dbg_declare(
// CHECK-SAME: ptr %my_local,
// CHECK-SAME: [[MY_LOCAL:![0-9]+]],
// CHECK-SAME: !DIExpression(DW_OP_constu, 4, DW_OP_swap, DW_OP_xderef)
// CHECK-SAME: )
// CHECK: }

// CHECK: [[MY_KERNEL]] = distinct !DISubprogram(
// CHECK-SAME: name: "my_kernel"
// CHECK-SAME: )
// CHECK: [[MY_PARAM]] = !DILocalVariable(
// CHECK-SAME: name: "my_param"
// CHECK-SAME: arg: 1
// CHECK-SAME: scope: [[MY_KERNEL]]
// CHECK-SAME: )
// CHECK: [[MY_LOCAL]] = !DILocalVariable(
// CHECK-SAME: name: "my_local"
// CHECK-SAME: scope: [[MY_KERNEL]]
// CHECK-SAME: )