| /llvm-project-15.0.7/clang/test/SemaOpenCLCXX/ |
| H A D | invalid-kernel.clcpp | 9 kernel void m(); //expected-error{{kernel functions cannot be class members}} 25 kernel void int_v(int in); 26 kernel void int_p(__global int *in); 27 kernel void int_r(__global int &in); 32 kernel void k_atomic_v(atomic_int in); 40 kernel void k_sampler(sampler_t in); 41 kernel void k_void(__global void *in); 45 kernel void int4_v(int4 in); 46 kernel void int4_p(__global int4 *in); 55 kernel void pod_v(POD in) {} [all …]
|
| /llvm-project-15.0.7/llvm/test/MC/AMDGPU/ |
| H A D | sym_kernel_scope.s | 3 .byte .kernel.sgpr_count 5 .byte .kernel.vgpr_count 9 .byte .kernel.sgpr_count 11 .byte .kernel.vgpr_count 16 .byte .kernel.sgpr_count 18 .byte .kernel.vgpr_count 22 .byte .kernel.sgpr_count 24 .byte .kernel.vgpr_count 44 A = .kernel.vgpr_count 46 B = .kernel.vgpr_count [all …]
|
| H A D | sym_kernel_scope_agpr.s | 5 .byte .kernel.agpr_count 7 .byte .kernel.vgpr_count 13 .byte .kernel.agpr_count 16 .byte .kernel.vgpr_count 22 .byte .kernel.agpr_count 24 .byte .kernel.vgpr_count 28 .byte .kernel.agpr_count 31 .byte .kernel.vgpr_count 36 .byte .kernel.agpr_count 38 .byte .kernel.vgpr_count [all …]
|
| /llvm-project-15.0.7/clang/test/SemaOpenCL/ |
| H A D | amdgpu-attrs.cl | 27 …num_sgpr_32() {} // expected-error {{'amdgpu_num_sgpr' attribute only applies to kernel functions}} 56 __attribute__((amdgpu_flat_work_group_size(0, 0))) kernel void kernel_flat_work_group_size_0_0() {} 57 __attribute__((amdgpu_waves_per_eu(0))) kernel void kernel_waves_per_eu_0() {} 58 __attribute__((amdgpu_waves_per_eu(0, 0))) kernel void kernel_waves_per_eu_0_0() {} 59 __attribute__((amdgpu_num_sgpr(0))) kernel void kernel_num_sgpr_0() {} 60 __attribute__((amdgpu_num_vgpr(0))) kernel void kernel_num_vgpr_0() {} 62 kernel __attribute__((amdgpu_flat_work_group_size(32, 64))) void kernel_flat_work_group_size_32_64(… 63 kernel __attribute__((amdgpu_waves_per_eu(2))) void kernel_waves_per_eu_2() {} 64 kernel __attribute__((amdgpu_waves_per_eu(2, 4))) void kernel_waves_per_eu_2_4() {} 65 kernel __attribute__((amdgpu_num_sgpr(32))) void kernel_num_sgpr_32() {} [all …]
|
| H A D | invalid-kernel-parameters.cl | 13 kernel void no_ptrptr(global int * global *i) { } 14 kernel void no_lptrcptr(constant int * local *i) { } 30 kernel void no_genericptr(generic int *ptr) { } 76 kernel void bool_arg(bool x) { } // expected-error{{'__private bool' cannot be used as the type of … 79 kernel void half_arg(half x) { } 98 kernel void image_in_struct_arg(FooImage2D arg) { } // expected-error{{struct kernel parameters may… 105 kernel void pointer_in_struct_arg(Foo arg) { } // expected-error{{struct kernel parameters may not … 112 kernel void pointer_in_union_arg(FooUnion arg) { }// expected-error{{union kernel parameters may no… 123 kernel void pointer_in_nested_struct_arg(NestedPointer arg) { }// expected-error{{struct kernel par… 206 kernel void array_of_ptr(struct ArrayOfPtr arr) {} // expected-error{{struct kernel parameters may … [all …]
|
| H A D | invalid-kernel-attrs.cl | 3 kernel __attribute__((vec_type_hint)) void kernel1() {} //expected-error{{'vec_type_hint' attribute… 5 kernel __attribute__((vec_type_hint(not_type))) void kernel2() {} //expected-error{{unknown type na… 13 kernel __attribute__((work_group_size_hint(8,16,32,4))) void kernel6() {} //expected-error{{'work_g… 17 …(){} // expected-error {{attribute 'reqd_work_group_size' can only be applied to an OpenCL kernel}} 19 …(){} // expected-error {{attribute 'work_group_size_hint' can only be applied to an OpenCL kernel}} 21 …ernel10(){} // expected-error {{attribute 'vec_type_hint' can only be applied to an OpenCL kernel}} 29 void f_kernel_image2d_t( kernel image2d_t image ) { // expected-error {{'kernel' attribute only app… 33 kernel __attribute__((reqd_work_group_size(1,2,0))) void kernel11(){} // expected-error {{'reqd_wor… 34 kernel __attribute__((reqd_work_group_size(1,0,2))) void kernel12(){} // expected-error {{'reqd_wor… 35 kernel __attribute__((reqd_work_group_size(0,1,2))) void kernel13(){} // expected-error {{'reqd_wor… [all …]
|
| H A D | access-qualifier.cl | 43 kernel void k1(img1d_wo img) { 52 kernel void k2(img1d_ro img) { 61 kernel void k3(img1d_wo img) { 66 kernel void k4(img1d_rw img) { 71 kernel void k5(img1d_ro_default img) { 80 kernel void k6(img1d_ro img) { 84 kernel void k7(read_only img1d_wo img){} // expected-error {{multiple access qualifiers}} 86 kernel void k8(write_only img1d_ro_default img){} // expected-error {{multiple access qualifiers}} 92 kernel void k11(read_only write_only image1d_t i){} // expected-error{{multiple access qualifiers}} 113 kernel void k14(read_only pipe int p) { [all …]
|
| /llvm-project-15.0.7/clang/test/SemaCUDA/ |
| H A D | lambda.cu | 13 __global__ void kernel(F f) { f(); } in kernel() function 27 kernel<<<1,1>>>([](){ hd(0); }); in test() 29 kernel<<<1,1>>>([=](){ hd(b); }); in test() 32 kernel<<<1,1>>>([&](){ hd(b); }); in test() 38 kernel<<<1,1>>>([&](){ in test() 46 kernel<<<1,1>>>(lambda1); in test() 59 kernel<<<1,1>>>(global_lambda); in main() 61 kernel<<<1,1>>>([](){ hd(0); }); in main() 63 kernel<<<1,1>>>([=](){ hd(b); }); in main() 65 kernel<<<1,1>>>([b](){ hd(b); }); in main() [all …]
|
| /llvm-project-15.0.7/polly/lib/External/ppcg/ |
| H A D | gpu_tree.c | 324 id = isl_id_alloc(kernel->ctx, name, kernel); in create_sync_domain() 341 return isl_id_get_user(id) == kernel; in gpu_tree_id_is_sync() 348 struct ppcg_kernel *kernel) in domain_is_sync() argument 369 struct ppcg_kernel *kernel) in node_is_sync_filter() argument 393 struct ppcg_kernel *kernel) in has_preceding_sync() argument 418 struct ppcg_kernel *kernel) in has_following_sync() argument 443 struct ppcg_kernel *kernel) in has_sync_before_core() argument 450 node = core_child(node, kernel->core); in has_sync_before_core() 468 struct ppcg_kernel *kernel) in has_sync_after_core() argument 500 domain = create_sync_domain(kernel); in insert_sync_before() [all …]
|
| H A D | cuda.c | 201 struct ppcg_kernel *kernel) in print_grid_size() argument 230 struct ppcg_kernel *kernel) in print_grid() argument 430 struct ppcg_kernel *kernel) in print_kernel_vars() argument 604 struct ppcg_kernel *kernel; in print_host_user() local 630 p = print_reverse_list(p, kernel->n_block, kernel->block_dim); in print_host_user() 634 p = print_grid(p, kernel); in print_host_user() 692 isl_printer *kernel; in print_cuda() local 695 kernel = isl_printer_set_output_format(kernel, ISL_FORMAT_C); in print_cuda() 696 kernel = gpu_print_types(kernel, types, prog); in print_cuda() 697 isl_printer_free(kernel); in print_cuda() [all …]
|
| H A D | gpu.c | 676 kernel->block_dim, kernel->n_block); in read_grid_and_block_sizes() 678 kernel->grid_dim, kernel->n_grid); in read_grid_and_block_sizes() 1156 if (!kernel) in ppcg_kernel_free() 1193 free(kernel); in ppcg_kernel_free() 1865 if (kernel) in create_domain_leaf() 1874 data.kernel = kernel; in create_domain_leaf() 2433 kernel = data->kernel; in after_mark() 3062 kernel->grid_size, kernel->block_ids); in insert_context() 3064 kernel->block_dim, kernel->thread_ids); in insert_context() 3561 if (tile->n > kernel->n_block && kernel->n_block > 0) in add_copies_group_shared() [all …]
|
| H A D | gpu_group.c | 967 p = isl_printer_print_int(p, kernel->id); in report_no_reuse_and_coalesced() 1127 report_no_reuse_and_coalesced(kernel, access); in compute_group_bounds_core() 1505 if (!kernel->options->live_range_reordering) in check_can_be_private_live_ranges() 1508 kernel->any_force_private = 0; in check_can_be_private_live_ranges() 1517 for (i = 0; i < kernel->n_array; ++i) { in check_can_be_private_live_ranges() 1533 kernel->any_force_private = 1; in check_can_be_private_live_ranges() 1562 struct ppcg_kernel *kernel) in compute_privatization() argument 1637 data.scop = kernel->prog->scop; in gpu_group_references() 1678 compute_privatization(&data, kernel); in gpu_group_references() 1680 for (i = 0; i < kernel->n_array; ++i) { in gpu_group_references() [all …]
|
| /llvm-project-15.0.7/llvm/test/CodeGen/AMDGPU/ |
| H A D | lower-kernel-lds-constexpr.ll | 9 ; CHECK: %llvm.amdgcn.kernel.k2.lds.t = type { i32 } 17 ; CHECK: @llvm.amdgcn.kernel.k0.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k0.lds.t und… 18 ; CHECK: @llvm.amdgcn.kernel.k1.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k1.lds.t und… 19 ; CHECK: @llvm.amdgcn.kernel.k2.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k2.lds.t und… 20 ; CHECK: @llvm.amdgcn.kernel.k3.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k3.lds.t und… 21 ; CHECK: @llvm.amdgcn.kernel.k4.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k4.lds.t und… 22 ; CHECK: @llvm.amdgcn.kernel.k5.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k5.lds.t und… 23 ; CHECK: @llvm.amdgcn.kernel.k6.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k6.lds.t und… 53 ; Use constant twice from the same kernel 56 …getelementptr inbounds (%llvm.amdgcn.kernel.k2.lds.t, %llvm.amdgcn.kernel.k2.lds.t addrspace(3)* @… [all …]
|
| H A D | lower-kernel-and-module-lds.ll | 13 ; CHECK: %llvm.amdgcn.kernel..lds.t = type { [2 x i8] } 14 ; CHECK: %llvm.amdgcn.kernel..lds.t.0 = type { [4 x i8] } 19 ; CHECK: @llvm.amdgcn.kernel.k0.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k0.lds.t und… 20 ; CHECK: @llvm.amdgcn.kernel.k1.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k1.lds.t und… 21 ; CHECK: @llvm.amdgcn.kernel..lds = internal addrspace(3) global %llvm.amdgcn.kernel..lds.t undef, … 22 ; CHECK: @llvm.amdgcn.kernel..lds.1 = internal addrspace(3) global %llvm.amdgcn.kernel..lds.t.0 und… 28 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 30 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 53 …getelementptr inbounds (%llvm.amdgcn.kernel.k1.lds.t, %llvm.amdgcn.kernel.k1.lds.t addrspace(3)* @… 55 …getelementptr inbounds (%llvm.amdgcn.kernel.k1.lds.t, %llvm.amdgcn.kernel.k1.lds.t addrspace(3)* @… [all …]
|
| H A D | lower-kernel-lds.ll | 10 ; CHECK: %llvm.amdgcn.kernel.k0.lds.t = type { [16 x i8], [4 x i8], [2 x i8], [1 x i8] } 11 ; CHECK: %llvm.amdgcn.kernel.k1.lds.t = type { [16 x i8], [4 x i8], [2 x i8] } 16 ; CHECK: @llvm.amdgcn.kernel.k0.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k0.lds.t und… 17 ; CHECK: @llvm.amdgcn.kernel.k1.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k1.lds.t und… 21 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 23 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 25 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 27 …getelementptr inbounds (%llvm.amdgcn.kernel.k0.lds.t, %llvm.amdgcn.kernel.k0.lds.t addrspace(3)* @… 48 …getelementptr inbounds (%llvm.amdgcn.kernel.k1.lds.t, %llvm.amdgcn.kernel.k1.lds.t addrspace(3)* @… 50 …getelementptr inbounds (%llvm.amdgcn.kernel.k1.lds.t, %llvm.amdgcn.kernel.k1.lds.t addrspace(3)* @… [all …]
|
| H A D | lower-kernel-lds-super-align.ll | 6 ; CHECK: %llvm.amdgcn.kernel.k1.lds.t = type { [32 x i8] } 18 ; SUPER-ALIGN_ON: @llvm.amdgcn.kernel.k1.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k1.… 19 ; SUPER-ALIGN_OFF: @llvm.amdgcn.kernel.k1.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k1… 21 ; CHECK: @llvm.amdgcn.kernel.k2.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k2.lds.t und… 22 ; SUPER-ALIGN_ON: @llvm.amdgcn.kernel.k3.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k3… 23 ; SUPER-ALIGN_OFF: @llvm.amdgcn.kernel.k3.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k3… 25 ; SUPER-ALIGN_ON: @llvm.amdgcn.kernel.k4.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k4… 26 ; SUPER-ALIGN_OFF: @llvm.amdgcn.kernel.k4.lds = internal addrspace(3) global %llvm.amdgcn.kernel.k4… 29 …getelementptr inbounds (%llvm.amdgcn.kernel.k1.lds.t, %llvm.amdgcn.kernel.k1.lds.t addrspace(3)* @… 45 …getelementptr inbounds (%llvm.amdgcn.kernel.k2.lds.t, %llvm.amdgcn.kernel.k2.lds.t addrspace(3)* @… [all …]
|
| /llvm-project-15.0.7/clang/test/Index/ |
| H A D | opencl-types.cl | 10 void kernel testFloatTypes() { 28 void kernel OCLImage1dROTest(read_only image1d_t scalarOCLImage1dRO); 31 void kernel OCLImage2dROTest(read_only image2d_t scalarOCLImage2dRO); 39 void kernel OCLImage3dROTest(read_only image3d_t scalarOCLImage3dRO); 54 void kernel OCLImage1dWOTest(write_only image1d_t scalarOCLImage1dWO); 57 void kernel OCLImage2dWOTest(write_only image2d_t scalarOCLImage2dWO); 65 void kernel OCLImage3dWOTest(write_only image3d_t scalarOCLImage3dWO); 106 void kernel intPipeTestRO(read_only pipe int scalarPipe); 107 void kernel intPipeTestWO(write_only pipe int scalarPipe); 116 void kernel testMiscOpenCLTypes() { [all …]
|
| /llvm-project-15.0.7/clang/test/CodeGenOpenCL/ |
| H A D | amdgpu-attrs.cl | 6 kernel void flat_work_group_size_0_0() {} 8 kernel void waves_per_eu_0() {} 10 kernel void waves_per_eu_0_0() {} 12 kernel void num_sgpr0() {} 14 kernel void num_vgpr0() {} 33 kernel void num_sgpr_0_num_vgpr_0() {} 54 kernel void waves_per_eu_2() { 58 kernel void waves_per_eu_2_4() { 62 kernel void num_sgpr_32() { 66 kernel void num_vgpr_64() { [all …]
|
| /llvm-project-15.0.7/clang/test/SemaSYCL/ |
| H A D | zero-length-arrays.cpp | 7 __attribute__((sycl_kernel)) void kernel(const Func &kernelFunc) { in kernel() function 51 kernel<class TempContext>([=] { in templatedContext() 58 kernel<class TempContext1>([Var] { in templatedContext() 68 kernel<class Simple>([=]() { in foo() 77 …kernel<class Simple1>([Arr] { // expected-error {{zero-length arrays are not permitted in SYCL dev… in foo() 82 kernel<class SimpleStruct>([=] { in foo() 89 …kernel<class SimpleStruct1>([St] { // expected-error 2{{zero-length arrays are not permitted in SY… in foo() 97 kernel<class UseTemplated>([=] { in foo() 108 …kernel<class UseTemplated1>([Zero] { // expected-error 2{{zero-length arrays are not permitted in … in foo() 118 kernel<class UseFunctor>(K); in foo() [all …]
|
| /llvm-project-15.0.7/lldb/docs/use/ |
| H A D | qemu-testing.rst | 22 Once we have booted our kernel we can run lldb-server in emulation environment. 50 Build QEMU or cross compile Linux kernel from source using setup.sh 53 **Example:** Build QEMU binaries and Arm/AArch64 Linux kernel image 56 $ bash setup.sh --qemu --kernel arm 57 $ bash setup.sh --qemu --kernel arm64 59 **Example:** Build Linux kernel image only 62 $ bash setup.sh --kernel arm 63 $ bash setup.sh --kernel arm64 89 --kernel commandline argument. 92 setup.sh was used to build Linux kernel and QEMU binaries. [all …]
|
| /llvm-project-15.0.7/mlir/test/Conversion/GPUToVulkan/ |
| H A D | lower-gpu-launch-vulkan-launch.mlir | 5 …dex]], %[[index]], %[[index]], %[[resource]]) {spirv_blob = "{{.*}}", spirv_entry_point = "kernel"} 10 spv.func @kernel() "None" attributes {workgroup_attributions = 0 : i64} { 18 spv.EntryPoint "GLCompute" @kernel 19 spv.ExecutionMode @kernel "LocalSize", 1, 1, 1 22 gpu.func @kernel(%arg0: memref<12xf32>) kernel { 29 gpu.launch_func @kernels::@kernel
|
| /llvm-project-15.0.7/llvm/test/Transforms/OpenMP/ |
| H A D | barrier_removal.ll | 232 !0 = !{void ()* @pos_empty_1, !"kernel", i32 1} 233 !1 = !{void ()* @pos_empty_2, !"kernel", i32 1} 234 !2 = !{void ()* @pos_empty_3, !"kernel", i32 1} 235 !3 = !{void ()* @pos_empty_4, !"kernel", i32 1} 236 !4 = !{void ()* @pos_empty_5, !"kernel", i32 1} 237 !5 = !{void ()* @pos_empty_6, !"kernel", i32 1} 238 !6 = !{void ()* @neg_empty_7, !"kernel", i32 1} 240 !8 = !{void ()* @neg_loads, !"kernel", i32 1} 241 !9 = !{void ()* @pos_priv_mem, !"kernel", i32 1} 242 !10 = !{void ()* @neg_mem, !"kernel", i32 1} [all …]
|
| /llvm-project-15.0.7/llvm/test/CodeGen/NVPTX/ |
| H A D | load-with-non-coherent-cache.ll | 218 ; This test captures the case of a non-kernel function. In a 222 ; kernel). For both reasons, we cannot use a cached load here. 248 !1 = !{void (float *, float *)* @foo1, !"kernel", i32 1} 249 !2 = !{void (double *, double *)* @foo2, !"kernel", i32 1} 250 !3 = !{void (i16 *, i16 *)* @foo3, !"kernel", i32 1} 251 !4 = !{void (i32 *, i32 *)* @foo4, !"kernel", i32 1} 252 !5 = !{void (i64 *, i64 *)* @foo5, !"kernel", i32 1} 253 !6 = !{void (i128 *, i128 *)* @foo6, !"kernel", i32 1} 254 !7 = !{void (<2 x i8> *, <2 x i8> *)* @foo7, !"kernel", i32 1} 265 !18 = !{void (float **, float **)* @foo18, !"kernel", i32 1} [all …]
|
| /llvm-project-15.0.7/mlir/test/Conversion/GPUToCUDA/ |
| H A D | lower-nvvm-kernel-to-cubin.mlir | 5 llvm.func @kernel(%arg0 : f32, %arg1 : !llvm.ptr<f32>) 6 // CHECK: attributes {gpu.kernel} 7 attributes { gpu.kernel } { 16 attributes { gpu.kernel } { 22 attributes { gpu.kernel } {
|
| /llvm-project-15.0.7/mlir/test/Conversion/GPUToROCm/ |
| H A D | lower-rocdl-kernel-to-hsaco.mlir | 5 llvm.func @kernel(%arg0 : f32, %arg1 : !llvm.ptr<f32>) 6 // CHECK: attributes {gpu.kernel} 7 attributes { gpu.kernel } { 16 attributes { gpu.kernel } { 22 attributes { gpu.kernel } {
|