Home
last modified time | relevance | path

Searched full:kernel_name (Results 1 – 25 of 361) sorted by relevance

12345678910>>...15

/external/executorch/kernels/portable/
Dfunctions.yaml23 kernel_name: torch::executor::_cdist_forward_out
28 kernel_name: torch::executor::log_softmax_out
33 kernel_name: torch::executor::_native_batch_norm_legit_out
38 kernel_name: torch::executor::_native_batch_norm_legit_no_stats_out
43 kernel_name: torch::executor::_native_batch_norm_legit_no_training_out
48 kernel_name: torch::executor::_pdist_forward_out
53 kernel_name: torch::executor::softmax_out
58 kernel_name: torch::executor::to_copy_out
63 kernel_name: torch::executor::abs_out
68 kernel_name: torch::executor::acos_out
[all …]
/external/executorch/backends/vulkan/runtime/graph/ops/utils/
DStagingUtils.cpp26 std::string kernel_name; in get_nchw_to_tensor_shader() local
27 kernel_name.reserve(kShaderNameReserve); in get_nchw_to_tensor_shader()
31 kernel_name = "nchw_to_bitw8_image_nobitw8buffer"; in get_nchw_to_tensor_shader()
32 add_storage_type_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
33 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
34 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader()
38 kernel_name = "nchw_to_buffer"; in get_nchw_to_tensor_shader()
39 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
40 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader()
43 kernel_name = "nchw_to_image"; in get_nchw_to_tensor_shader()
[all …]
DShaderNameUtils.cpp14 std::string& kernel_name, in add_storage_type_suffix() argument
18 kernel_name += "_buffer"; in add_storage_type_suffix()
21 kernel_name += "_texture3d"; in add_storage_type_suffix()
24 kernel_name += "_texture2d"; in add_storage_type_suffix()
30 std::string& kernel_name, in add_storage_type_suffix() argument
32 return add_storage_type_suffix(kernel_name, tensor.storage_type()); in add_storage_type_suffix()
35 void add_dtype_suffix(std::string& kernel_name, const vkapi::ScalarType dtype) { in add_dtype_suffix() argument
38 kernel_name += "_float"; in add_dtype_suffix()
41 kernel_name += "_half"; in add_dtype_suffix()
44 kernel_name += "_int"; in add_dtype_suffix()
[all …]
DShaderNameUtils.h20 std::string& kernel_name,
23 std::string& kernel_name,
26 void add_dtype_suffix(std::string& kernel_name, const vkapi::ScalarType dtype);
27 void add_dtype_suffix(std::string& kernel_name, const api::vTensor& tensor);
29 void add_ndim_suffix(std::string& kernel_name, const size_t ndim);
30 void add_ndim_suffix(std::string& kernel_name, const api::vTensor& tensor);
32 void add_packed_dim_suffix(std::string& kernel_name, const int32_t packed_dim);
34 std::string& kernel_name,
/external/executorch/backends/cadence/aot/
Dfunctions.yaml18 kernel_name: torch::executor::to_copy_out
23 kernel_name: torch::executor::softmax_out
28 kernel_name: torch::executor::add_out
33 kernel_name: torch::executor::bmm_out
38 kernel_name: torch::executor::cat_out
43 kernel_name: torch::executor::clone_out
48 kernel_name: torch::executor::div_out
53 kernel_name: torch::executor::div_out_mode
58 kernel_name: torch::executor::embedding_out
63 kernel_name: torch::executor::empty_out
[all …]
Dfunctions_hifi.yaml18 kernel_name: torch::executor::to_copy_out
23 kernel_name: torch::executor::softmax_out
28 kernel_name: cadence::impl::HiFi::add_out
33 kernel_name: torch::executor::bmm_out
38 kernel_name: torch::executor::cat_out
43 kernel_name: torch::executor::clone_out
48 kernel_name: cadence::impl::HiFi::div_out
53 kernel_name: cadence::impl::HiFi::div_out_mode
58 kernel_name: torch::executor::embedding_out
63 kernel_name: torch::executor::full_out
[all …]
/external/executorch/kernels/optimized/
Doptimized.yaml8 kernel_name: torch::executor::opt_log_softmax_out
13 kernel_name: torch::executor::opt_add_out
18 kernel_name: torch::executor::opt_add_scalar_out
23 kernel_name: torch::executor::opt_bmm_out
28 kernel_name: torch::executor::opt_div_out
33 kernel_name: torch::executor::opt_div_scalar_out
38 kernel_name: torch::executor::opt_exp_out
43 kernel_name: torch::executor::opt_sigmoid_out
48 kernel_name: torch::executor::opt_gelu_out
53 kernel_name: torch::executor::opt_le_scalar_out
[all …]
Doptimized-oss.yaml11 kernel_name: torch::executor::opt_add_out
16 kernel_name: torch::executor::opt_add_scalar_out
21 kernel_name: torch::executor::opt_bmm_out
26 kernel_name: torch::executor::opt_div_out
31 kernel_name: torch::executor::opt_div_scalar_out
36 kernel_name: torch::executor::opt_exp_out
41 kernel_name: torch::executor::opt_sigmoid_out
46 kernel_name: torch::executor::opt_le_scalar_out
51 kernel_name: torch::executor::opt_le_tensor_out
56 kernel_name: torch::executor::opt_linear_out
[all …]
/external/pytorch/torch/_inductor/codegen/
Dcpp_wrapper_cuda.py36 kernel_name: str,
42 self.kernel_name = kernel_name
47 params = CudaKernelParamCache.get(self.kernel_name)
50 ), f"{self.kernel_name} not found in CudaKernelParamCache"
54 ), f"{key} not found in CudaKernelParamCache[{self.kernel_name}]"
61 return DeferredCudaKernelLine(self.kernel_name, line, self.keys)
71 kernel_name: str,
76 self.kernel_name = kernel_name
97 params = CudaKernelParamCache.get(self.kernel_name)
100 ), f"{self.kernel_name} not found in CudaKernelParamCache"
[all …]
Ddebug_utils.py34 kernel_name: str = "",
42 self.kernel_name = kernel_name
50 self.kernel_name,
55 def __exit__(self, args_to_print_or_save, kernel_name, arg_signatures): argument
58 kernel_name,
66 kernel_name, argument
76 self.kernel_name,
84 self.kernel_name,
101 kernel_name: str,
112 self.kernel_name = kernel_name
[all …]
/external/executorch/kernels/quantized/
Dquantized.yaml5 kernel_name: torch::executor::quantized_add_out
11 kernel_name: torch::executor::choose_qparams_tensor_out
17 kernel_name: torch::executor::dequantize_per_tensor_out
23 kernel_name: torch::executor::dequantize_per_tensor_tensor_args_out
29 kernel_name: torch::executor::quantize_per_channel_out
35 kernel_name: torch::executor::dequantize_per_channel_out
41 kernel_name: torch::executor::quantized_embedding_byte_out
47 kernel_name: torch::executor::quantized_embedding_byte_dtype_out
53 kernel_name: torch::executor::quantized_embedding_2bit_out
59 kernel_name: torch::executor::quantized_embedding_2bit_dtype_out
[all …]
/external/executorch/kernels/quantized/test/
Dtargets.bzl6 op_test("op_quantize_test", kernel_name = "quantized")
7 op_test("op_dequantize_test", kernel_name = "quantized")
8 op_test("op_choose_qparams_test", kernel_name = "quantized")
9 op_test("op_add_test", kernel_name = "quantized", deps = [
18 op_test("op_embedding_test", kernel_name = "quantized", deps = [
28 op_test("op_embedding2b_test", kernel_name = "quantized")
29 op_test("op_embedding4b_test", kernel_name = "quantized")
30 op_test("op_mixed_mm_test", kernel_name = "quantized", deps = [
36 op_test("op_mixed_linear_test", kernel_name = "quantized", deps = [
/external/executorch/shim/xplat/executorch/kernels/test/
Dutil.bzl3 def op_test(name, deps = [], kernel_name = "portable", use_kernel_prefix = False):
13 kernel_name: The name string as in //executorch/kernels/<kernel_name>.
21 if kernel_name == "aten":
31 "//executorch/kernels/{}/cpu:{}".format(kernel_name, op_root),
32 "//executorch/kernels/{}:generated_lib_headers".format(kernel_name),
33 "//executorch/kernels/{}/test:supported_features".format(kernel_name),
38 if kernel_name == "aten":
43 name_prefix = kernel_name + "_"
116 def codegen_function_header_wrapper(kernel_path, kernel_name):
121 Use target "function_header_wrapper_<kernel_name>" in tests.
[all …]
/external/executorch/backends/vulkan/runtime/graph/ops/impl/
DQuantizedLinear.cpp89 std::string kernel_name = "q_8w_linear"; in add_q_8w_linear_node() local
90 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_node()
91 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_node()
92 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(q_mat2)); in add_q_8w_linear_node()
93 add_dtype_suffix(kernel_name, graph.dtype_of(out_W_packed)); in add_q_8w_linear_node()
94 add_storage_type_suffix(kernel_name, graph.storage_type_of(out_W_packed)); in add_q_8w_linear_node()
118 VK_KERNEL_FROM_STR(kernel_name), in add_q_8w_linear_node()
160 std::string kernel_name = "q_8w_linear_optimized"; in add_q_8w_linear_optimized_node() local
161 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_optimized_node()
162 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_optimized_node()
[all …]
DSelect.cpp66 std::string kernel_name; in add_select_int_node() local
75 kernel_name = "select_channel_3d"; in add_select_int_node()
77 kernel_name = "select_height_3d"; in add_select_int_node()
79 kernel_name = "select_width_3d"; in add_select_int_node()
89 kernel_name = "select_batch_4d"; in add_select_int_node()
91 kernel_name = "select_channel_4d"; in add_select_int_node()
93 kernel_name = "select_height_4d"; in add_select_int_node()
95 kernel_name = "select_width_4d"; in add_select_int_node()
102 kernel_name.reserve(kShaderNameReserve); in add_select_int_node()
103 add_dtype_suffix(kernel_name, *t_out); in add_select_int_node()
[all …]
DMatMul.cpp72 std::string kernel_name = "matmul_naive_buffer"; in add_matmul_naive_buffer_node() local
73 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_buffer_node()
87 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_buffer_node()
123 std::string kernel_name = graph.get_bool(mat2_is_transposed) in add_matmul_naive_texture3d_node() local
126 kernel_name.reserve(kShaderNameReserve); in add_matmul_naive_texture3d_node()
127 add_storage_type_suffix(kernel_name, graph.storage_type_of(out)); in add_matmul_naive_texture3d_node()
128 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_texture3d_node()
133 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_texture3d_node()
184 std::string kernel_name = mat2_is_transposed_val in add_matmul_optimized_node() local
191 kernel_name = "batch_" + kernel_name; in add_matmul_optimized_node()
[all …]
DCopy.cpp31 std::string kernel_name = "copy_offset"; in add_copy_offset_node() local
32 kernel_name.reserve(kShaderNameReserve); in add_copy_offset_node()
33 add_dtype_suffix(kernel_name, *t_out); in add_copy_offset_node()
34 add_storage_type_suffix(kernel_name, *t_out); in add_copy_offset_node()
46 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_offset_node()
50 VK_KERNEL_FROM_STR(kernel_name), in add_copy_offset_node()
114 std::string kernel_name = "copy_channel_offset"; in add_copy_channel_offset_node() local
115 kernel_name.reserve(kShaderNameReserve); in add_copy_channel_offset_node()
116 add_dtype_suffix(kernel_name, *t_out); in add_copy_channel_offset_node()
154 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_channel_offset_node()
[all …]
DClone.cpp41 std::string kernel_name = "clone"; in add_clone_node() local
42 add_dtype_suffix(kernel_name, *t_out); in add_clone_node()
46 VK_KERNEL_FROM_STR(kernel_name), in add_clone_node()
63 std::string kernel_name = "clone_image_to_buffer"; in add_image_to_buffer_node() local
64 add_dtype_suffix(kernel_name, graph.dtype_of(image)); in add_image_to_buffer_node()
65 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in add_image_to_buffer_node()
87 std::string kernel_name = "clone_buffer_to_image"; in add_buffer_to_image_node() local
88 add_dtype_suffix(kernel_name, graph.dtype_of(image)); in add_buffer_to_image_node()
89 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in add_buffer_to_image_node()
/external/gemmlowp/meta/generators/
Dcommon.py90 def __init__(self, emitter, kernel_name, output_stream_name): argument
91 self.kernel_name = kernel_name
99 in_type, out_type, self.kernel_name, self.output_stream_name, kernel_m,
105 'const FusedKernelParams<%s, %s>&' % (self.kernel_name,
110 _TemplateName(self.kernel_name + self.output_stream_name,
119 def __init__(self, emitter, kernel_name): argument
120 self.kernel_name = kernel_name
127 in_type, out_type, self.kernel_name, kernel_size, leftovers
132 ['const %s&' % self.kernel_name, 'params'],
135 _TemplateName(self.kernel_name, template_params))
/external/pytorch/torch/_inductor/codegen/cuda/
Dcuda_cpp_scheduling.py52 kernel_name = wrapper.src_to_kernel[src_code]
59 kernel_name = "_".join(["cuda", fused_name, wrapper.next_kernel_suffix()])
61 wrapper.src_to_kernel[src_code] = kernel_name
62 src_code = src_code.replace("KERNEL_NAME", kernel_name)
75 kernel_name, compile_wrapper.getvalue(), metadata_comment
77 return kernel_name
102 kernel_name = self.define_kernel(src_code, node_schedule)
108 call_args, kernel_name, arg_signatures, kernel
111 kernel.call_kernel(kernel_name, ctb)
/external/pytorch/torch/_inductor/codegen/rocm/
Drocm_cpp_scheduling.py47 kernel_name = wrapper.src_to_kernel[src_code]
54 kernel_name = "_".join(["rocm", fused_name, wrapper.next_kernel_suffix()])
56 wrapper.src_to_kernel[src_code] = kernel_name
57 src_code = src_code.replace("KERNEL_NAME", kernel_name)
70 kernel_name, compile_wrapper.getvalue(), metadata_comment
72 return kernel_name
96 kernel_name = self.define_kernel(src_code, node_schedule)
97 kernel.call_kernel(kernel_name, ctb)
Drocm_benchmark_request.py23 kernel_name: str,
29 super().__init__(kernel_name, input_tensor_meta, output_tensor_meta, extra_args)
57 …"make_run_fn: self.kernel_name=%s, self.source_file=%s, self.hash_key=%s, self.DLL=%s, args=%s, se…
58 self.kernel_name,
66 run_method = getattr(self.DLL, self.kernel_name)
94 run_method = getattr(self.DLL, self.kernel_name)
110 …"update_workspace_size called: new workspace size=%d, self.kernel_name=%s, self.source_file=%s, se…
112 self.kernel_name,
133 return f"{self.kernel_name=}, {self.source_file=}, {self.hash_key=}"
/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gemm_sparse/
D8x4c1x4-dq-packedA-sse2.c1 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w32__sse2 macro
4 #undef KERNEL_NAME
7 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w16__sse2 macro
10 #undef KERNEL_NAME
13 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w8__sse2 macro
16 #undef KERNEL_NAME
/external/executorch/backends/vulkan/test/utils/
Dtest_utils.cpp120 std::string kernel_name = "bitw8_image_to_nchw_nobitw8buffer"; in record_bitw8_image_to_nchw_nobitw8buffer_op() local
121 add_storage_type_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op()
122 add_dtype_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op()
125 VK_KERNEL_FROM_STR(kernel_name), in record_bitw8_image_to_nchw_nobitw8buffer_op()
146 std::string kernel_name; in record_conv2d_prepack_weights_op() local
148 kernel_name = "conv_transpose2d"; in record_conv2d_prepack_weights_op()
150 kernel_name = "conv2d"; in record_conv2d_prepack_weights_op()
152 kernel_name += "_prepack_weights"; in record_conv2d_prepack_weights_op()
153 add_dtype_suffix(kernel_name, v_dst); in record_conv2d_prepack_weights_op()
154 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in record_conv2d_prepack_weights_op()
[all …]
/external/OpenCL-CTS/test_conformance/device_execution/
Dutils.cpp23 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, void* results,… in run_single_kernel() argument
25 …return run_single_kernel_args(context, queue, source, num_lines, kernel_name, results, res_size, 0… in run_single_kernel()
28 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, void* results,… in run_single_kernel_args() argument
30 …return run_n_kernel_args(context, queue, source, num_lines, kernel_name, 1, 1, results, res_size, … in run_single_kernel_args()
33 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, size_t local, … in run_n_kernel_args() argument
44 source, kernel_name); in run_n_kernel_args()
51 …d, %d, %p) for kernel: '%s' failed: %d", 0, (int)sizeof(cl_mem), &mem, kernel_name, err_ret)) retu… in run_n_kernel_args()
56 … kernel: '%s' failed: %d", (int)(i+1), (int)args[i].size, args[i].ptr, kernel_name, err_ret)) retu… in run_n_kernel_args()
60 …if(check_error(err_ret, "clEnqueueNDRangeKernel('%s', gws=%d, lws=%d) failed", kernel_name, (int)g… in run_n_kernel_args()

12345678910>>...15