Home
last modified time | relevance | path

Searched refs:KERNEL (Results 1 – 25 of 99) sorted by relevance

1234

/external/llvm-project/polly/test/GPGPU/
Dhost-control-flow.ll5 ; RUN: -polly-acc-dump-kernel-ir < %s | FileCheck %s -check-prefix=KERNEL-IR
44 ; KERNEL-IR: define ptx_kernel void @FUNC_foo_SCOP_0_KERNEL_0(i8 addrspace(1)* %MemRef_A, i64 %c0)
45 ; KERNEL-IR-LABEL: entry:
46 ; KERNEL-IR-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x()
47 ; KERNEL-IR-NEXT: %b0 = zext i32 %0 to i64
48 ; KERNEL-IR-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
49 ; KERNEL-IR-NEXT: %t0 = zext i32 %1 to i64
50 ; KERNEL-IR-NEXT: br label %polly.cond
52 ; KERNEL-IR-LABEL: polly.cond: ; preds = %entry
53 ; KERNEL-IR-NEXT: %2 = mul nsw i64 32, %b0
[all …]
Ddouble-parallel-loop.ll15 ; RUN: FileCheck %s -check-prefix=KERNEL-IR
19 ; RUN: FileCheck %s -check-prefix=KERNEL-ASM
139 ; KERNEL-IR-LABEL: define ptx_kernel void @kernel_0(i8* %MemRef_A) #0 {
140 ; KERNEL-IR-NEXT: entry:
141 ; KERNEL-IR-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x()
142 ; KERNEL-IR-NEXT: %b0 = zext i32 %0 to i64
143 ; KERNEL-IR-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.y()
144 ; KERNEL-IR-NEXT: %b1 = zext i32 %1 to i64
145 ; KERNEL-IR-NEXT: %2 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
146 ; KERNEL-IR-NEXT: %t0 = zext i32 %2 to i64
[all …]
Dkernel-params-only-some-arrays.ll3 ; RUN: FileCheck -check-prefix=KERNEL %s
19 ; KERNEL: ; ModuleID = 'FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0'
20 ; KERNEL-NEXT: source_filename = "FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0"
21 ; KERNEL-NEXT: target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-i128:1…
22 ; KERNEL-NEXT: target triple = "nvptx64-nvidia-cuda"
24 ; KERNEL: define ptx_kernel void @FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0(i8 addrspace(…
25 ; KERNEL-NEXT: entry:
26 ; KERNEL-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x()
27 ; KERNEL-NEXT: %b0 = zext i32 %0 to i64
28 ; KERNEL-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
[all …]
Dprivate-memory.ll9 ; RUN: FileCheck -check-prefix=KERNEL %s
27 ; KERNEL: %private_array = alloca [1 x float]
29 ; KERNEL: %polly.access.cast.private_array = bitcast [1 x float]* %private_array to float*
30 ; KERNEL-NEXT: %polly.access.private_array = getelementptr float, float* %polly.access.cast.priva…
31 ; KERNEL-NEXT: %polly.access.cast.MemRef_A = bitcast i8 addrspace(1)* %MemRef_A to float addrspac…
32 ; KERNEL-NEXT: %polly.access.MemRef_A = getelementptr float, float addrspace(1)* %polly.access.ca…
33 ; KERNEL-NEXT: %shared.read = load float, float addrspace(1)* %polly.access.MemRef_A
34 ; KERNEL-NEXT: store float %shared.read, float* %polly.access.private_array
36 ; KERNEL: %polly.access.cast.private_array5 = bitcast [1 x float]* %private_array to float*
37 ; KERNEL-NEXT: %polly.access.private_array6 = getelementptr float, float* %polly.access.cast.priv…
[all …]
Dshared-memory.ll9 ; RUN: FileCheck -check-prefix=KERNEL %s
29 ; KERNEL: @shared_MemRef_A = internal addrspace(3) global [32 x float] zeroinitializer, align 4
31 ; KERNEL: %polly.access.shared_MemRef_A = getelementptr float, float addrspace(3)* getelementptr …
32 ; KERNEL-NEXT: %polly.access.cast.MemRef_A = bitcast i8 addrspace(1)* %MemRef_A to float addrspac…
33 ; KERNEL-NEXT: %polly.access.MemRef_A = getelementptr float, float addrspace(1)* %polly.access.ca…
34 ; KERNEL-NEXT: %shared.read = load float, float addrspace(1)* %polly.access.MemRef_A
35 ; KERNEL-NEXT: store float %shared.read, float addrspace(3)* %polly.access.shared_MemRef_A
37 ; KERNEL: %polly.access.shared_MemRef_A3 = getelementptr float, float addrspace(3)* getelementptr…
38 ; KERNEL-NEXT: %polly.access.cast.MemRef_A4 = bitcast i8 addrspace(1)* %MemRef_A to float addrspa…
39 ; KERNEL-NEXT: %polly.access.MemRef_A5 = getelementptr float, float addrspace(1)* %polly.access.c…
[all …]
Dshared-memory-two-dimensional.ll9 ; RUN: FileCheck -check-prefix=KERNEL %s
35 ; KERNEL: @shared_MemRef_b = internal addrspace(3) global [16 x [8 x float]] zeroinitializer, align…
37 ; KERNEL: %polly.access.mul.MemRef_b = mul nsw i64 %polly.indvar, 8
38 ; KERNEL-NEXT: %polly.access.add.MemRef_b = add nsw i64 %polly.access.mul.MemRef_b, %t0
39 ; KERNEL-NEXT: %polly.access.MemRef_b = getelementptr float, float addrspace(1)* %polly.access.ca…
40 ; KERNEL-NEXT: %shared.read = load float, float addrspace(1)* %polly.access.MemRef_b
41 ; KERNEL-NEXT: store float %shared.read, float addrspace(3)* %polly.access.shared_MemRef_b
Dcuda-annotations.ll3 ; RUN: FileCheck -check-prefix=KERNEL %s
7 ; KERNEL: define ptx_kernel void @FUNC_foo_SCOP_0_KERNEL_0(i8 addrspace(1)* %MemRef_A, i64 %n) #0 {
9 ; KERNEL: !nvvm.annotations = !{!0}
11 ; KERNEL: !0 = !{void (i8 addrspace(1)*, i64)* @FUNC_foo_SCOP_0_KERNEL_0, !"maxntidx", i32 32, !"ma…
Dnon-read-only-scalars.ll7 ; RUN: FileCheck %s -check-prefix=KERNEL-IR
82 ; KERNEL-IR: define ptx_kernel void @FUNC_foo_SCOP_0_KERNEL_1(i8 addrspace(1)* %MemRef_sum_0__phi)
83 ; KERNEL-IR: store float 0.000000e+00, float* %sum.0.phiops
84 ; KERNEL-IR: [[REGA:%.+]] = addrspacecast i8 addrspace(1)* %MemRef_sum_0__phi to float*
85 ; KERNEL-IR: [[REGB:%.+]] = load float, float* %sum.0.phiops
86 ; KERNEL-IR: store float [[REGB]], float* [[REGA]]
88 ; KERNEL-IR: define ptx_kernel void @FUNC_foo_SCOP_0_KERNEL_2(i8 addrspace(1)* %MemRef_A, i8 addrsp…
Dlibdevice-functions-copied-into-kernel.ll6 ; RUN: < %s | FileCheck %s --check-prefix=KERNEL-IR
21 ; KERNEL-IR: %p_expf = tail call float @__nv_expf(float %A.arr.i.val_p_scalar_)
22 ; KERNEL-IR: %p_cosf = tail call float @__nv_cosf(float %p_expf)
23 ; KERNEL-IR: %p_logf = tail call float @__nv_logf(float %p_cosf)
27 ; KERNEL-IR: %p_powi = tail call float @__nv_powif(float %p_logf, i32 2)
28 ; KERNEL-IR: %p_exp = tail call float @__nv_expf(float %p_powi)
Dinvariant-load-of-scalar.ll12 ; RUN: FileCheck -check-prefix=KERNEL-IR %s
39 ; KERNEL-IR: define ptx_kernel void @FUNC_checkPrivatization_SCOP_0_KERNEL_0
40 ; KERNEL-IR-SAME: (i8 addrspace(1)* %MemRef_A, i32 %tmp,
41 ; KERNEL-IR-SAME: i32 %tmp2, i32 %polly.access.begin.load,
42 ; KERNEL-IR-SAME: i32 %polly.access.end.load)
/external/llvm-project/polly/test/ScheduleOptimizer/
Dpattern-matching-based-opts_3.ll16 ; RUN: | FileCheck %s --check-prefix=EXTRACTION-OF-MACRO-KERNEL
80 ; EXTRACTION-OF-MACRO-KERNEL-LABEL: Printing analysis 'Polly - Generate an AST from the SCoP (isl)'…
81 ; EXTRACTION-OF-MACRO-KERNEL: {
82 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: // 1st level tiling - Tiles
83 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: for (int c0 = 0; c0 <= 32; c0 += 1)
84 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: for (int c1 = 0; c1 <= 32; c1 += 1) {
85 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: // 1st level tiling - Points
86 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: for (int c2 = 0; c2 <= 31; c2 += 1)
87 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: for (int c3 = 0; c3 <= 31; c3 += 1)
88 ; EXTRACTION-OF-MACRO-KERNEL-NEXT: Stmt_bb9(32 * c0 + c2, 32 * c1 + c3);
[all …]
/external/OpenCL-CTS/test_conformance/device_execution/
Dexecute_block.cpp951 KERNEL(block_global_scope),
952 KERNEL(block_kernel_scope),
953 KERNEL(block_statement_scope),
954 KERNEL(block_function_scope),
955 KERNEL(block_nested_scope),
958 KERNEL(block_in_for_init),
959 KERNEL(block_in_for_cond),
960 KERNEL(block_in_for_iter),
961 KERNEL(block_in_while_cond),
962 KERNEL(block_in_while_body),
[all …]
Denqueue_block.cpp588 KERNEL(enqueue_simple_block),
590 KERNEL(enqueue_block_with_local_arg1),
591 KERNEL(enqueue_block_with_local_arg2),
592 KERNEL(enqueue_block_with_wait_list),
593 KERNEL(enqueue_block_with_wait_list_and_local_arg),
595 KERNEL(enqueue_block_get_kernel_work_group_size),
596 KERNEL(enqueue_block_get_kernel_preferred_work_group_size_multiple),
598 KERNEL(enqueue_block_capture_event_profiling_info_after_execution),
599 KERNEL(enqueue_block_capture_event_profiling_info_before_execution),
601 KERNEL(enqueue_marker_with_block_event),
[all …]
Denqueue_flags.cpp662 KERNEL(enqueue_flags_wait_kernel_simple),
663 KERNEL(enqueue_flags_wait_kernel_event),
664 KERNEL(enqueue_flags_wait_kernel_local),
665 KERNEL(enqueue_flags_wait_kernel_event_local),
666 KERNEL(enqueue_flags_wait_work_group_simple),
667 KERNEL(enqueue_flags_wait_work_group_event),
668 KERNEL(enqueue_flags_wait_work_group_local),
669 KERNEL(enqueue_flags_wait_work_group_event_local)
Denqueue_wg_size.cpp1597 { KERNEL(enqueue_1D_wg_size_single), check_single },
1598 { KERNEL(enqueue_1D_wg_size_some_eq), check_some_eq_1D },
1599 { KERNEL(enqueue_1D_wg_size_some_diff), check_some_diff_1D },
1600 { KERNEL(enqueue_1D_wg_size_all_eq), check_all_eq_1D },
1601 { KERNEL(enqueue_1D_wg_size_all_diff), check_all_diff_1D },
1603 { KERNEL(enqueue_2D_wg_size_single), check_single },
1604 { KERNEL(enqueue_2D_wg_size_some_eq), check_some_eq_2D },
1605 { KERNEL(enqueue_2D_wg_size_some_diff), check_some_diff_2D },
1606 { KERNEL(enqueue_2D_wg_size_all_eq), check_all_eq_2D },
1607 { KERNEL(enqueue_2D_wg_size_all_diff), check_all_diff_2D },
[all …]
/external/libyuv/files/util/
Dssim.cc35 enum { KERNEL = 3, KERNEL_SIZE = 2 * KERNEL + 1 }; enumerator
43 static const double kiW[KERNEL + 1 + 1] = {
122 org += (yo - KERNEL) * stride; in GetSSIM()
123 org += (xo - KERNEL); in GetSSIM()
124 rec += (yo - KERNEL) * stride; in GetSSIM()
125 rec += (xo - KERNEL); in GetSSIM()
127 if (((yo - KERNEL + y_) < 0) || ((yo - KERNEL + y_) >= H)) { in GetSSIM()
133 if (((xo - KERNEL + x_) >= 0) && ((xo - KERNEL + x_) < W)) { in GetSSIM()
160 for (int y = 1; y <= KERNEL; y++) { in GetSSIMFullKernel()
163 const int Wy = K[KERNEL + y]; in GetSSIMFullKernel()
[all …]
/external/llvm-project/llvm/test/CodeGen/X86/
Dcodemodel.ll2 ; RUN: llc < %s -code-model=kernel | FileCheck -check-prefix CHECK-KERNEL %s
15 ; CHECK-KERNEL-LABEL: foo:
16 ; CHECK-KERNEL: movl data(%rip), %eax
25 ; CHECK-KERNEL-LABEL: foo1:
26 ; CHECK-KERNEL: movl data+16777212(%rip), %eax
35 ; CHECK-KERNEL-LABEL: foo2:
36 ; CHECK-KERNEL: movl data+40(%rip), %eax
45 ; CHECK-KERNEL-LABEL: foo3:
46 ; CHECK-KERNEL: movq $-40, %rax
47 ; CHECK-KERNEL: movl data(%rax), %eax
[all …]
Dstack-protector.ll3 …-model=kernel -mtriple=x86_64-pc-linux-gnu < %s -o - | FileCheck --check-prefix=LINUX-KERNEL-X64 %s
39 ; LINUX-KERNEL-X64-LABEL: test1a:
40 ; LINUX-KERNEL-X64-NOT: callq __stack_chk_fail
41 ; LINUX-KERNEL-X64: .cfi_endproc
80 ; LINUX-KERNEL-X64-LABEL: test1b:
81 ; LINUX-KERNEL-X64: mov{{l|q}} %gs:
82 ; LINUX-KERNEL-X64: callq __stack_chk_fail
125 ; LINUX-KERNEL-X64-LABEL: test1c:
126 ; LINUX-KERNEL-X64: mov{{l|q}} %gs:
127 ; LINUX-KERNEL-X64: callq __stack_chk_fail
[all …]
/external/llvm/test/CodeGen/X86/
Dcodemodel.ll2 ; RUN: llc < %s -code-model=kernel | FileCheck -check-prefix CHECK-KERNEL %s
12 ; CHECK-KERNEL-LABEL: foo:
13 ; CHECK-KERNEL: movl data, %eax
22 ; CHECK-KERNEL-LABEL: foo2:
23 ; CHECK-KERNEL: movl data+40, %eax
32 ; CHECK-KERNEL-LABEL: foo3:
33 ; CHECK-KERNEL: movq $-40, %rax
44 ; CHECK-KERNEL-LABEL: foo4:
45 ; CHECK-KERNEL: movl data+16777216, %eax
54 ; CHECK-KERNEL-LABEL: foo1:
[all …]
Dstack-protector.ll3 …-model=kernel -mtriple=x86_64-pc-linux-gnu < %s -o - | FileCheck --check-prefix=LINUX-KERNEL-X64 %s
37 ; LINUX-KERNEL-X64-LABEL: test1a:
38 ; LINUX-KERNEL-X64-NOT: callq __stack_chk_fail
39 ; LINUX-KERNEL-X64: .cfi_endproc
73 ; LINUX-KERNEL-X64-LABEL: test1b:
74 ; LINUX-KERNEL-X64: mov{{l|q}} %gs:
75 ; LINUX-KERNEL-X64: callq __stack_chk_fail
113 ; LINUX-KERNEL-X64-LABEL: test1c:
114 ; LINUX-KERNEL-X64: mov{{l|q}} %gs:
115 ; LINUX-KERNEL-X64: callq __stack_chk_fail
[all …]
/external/deqp-deps/amber/tests/cases/
Dopencl_set_arg.amber31 BIND BUFFER in_buf KERNEL ARG_NAME in
32 BIND BUFFER out_buf1 KERNEL ARG_NAME out
33 SET KERNEL ARG_NAME offset AS uint32 1
34 SET KERNEL ARG_NAME slope AS int32 2
38 BIND BUFFER out_buf2 KERNEL ARG_NAME out
45 BIND BUFFER out_buf3 KERNEL ARG_NAME out
52 BIND BUFFER out_buf4 KERNEL ARG_NAME out
53 SET KERNEL ARG_NAME slope AS int32 3
61 BIND BUFFER out_buf5 KERNEL ARG_NAME out
62 SET KERNEL ARG_NAME slope AS int32 3
Dopencl_read_and_write_image3d_rgba32i.amber54 BIND BUFFER im3d KERNEL ARG_NAME im
59 BIND BUFFER im3d KERNEL ARG_NAME im
60 BIND SAMPLER sampler KERNEL ARG_NAME sampler
61 BIND BUFFER out_buf KERNEL ARG_NAME out
Dopencl_read_image.amber47 BIND BUFFER out_buf KERNEL ARG_NAME out
48 BIND BUFFER texture KERNEL ARG_NAME image
49 BIND SAMPLER sampler KERNEL ARG_NAME sampler
/external/tensorflow/tensorflow/compiler/jit/
Dxla_device_ops.h56 #define REGISTER_XLA_LAUNCH_KERNEL(DEVICE, KERNEL, TYPES) \ argument
61 KERNEL);
63 #define REGISTER_XLA_COMPILE_KERNEL(DEVICE, KERNEL, TYPES) \ argument
70 KERNEL);
72 #define REGISTER_XLA_RUN_KERNEL(DEVICE, KERNEL, TYPES) \ argument
73 REGISTER_KERNEL_BUILDER(Name("_XlaRun").Device(DEVICE), KERNEL);
/external/ltp/testcases/kernel/sched/sched_stress/
Dsched_stress.sh29 export KERNEL=./sched_datafile
30 touch $KERNEL

1234