/external/executorch/kernels/portable/ |
D | functions.yaml | 23 kernel_name: torch::executor::_cdist_forward_out 28 kernel_name: torch::executor::log_softmax_out 33 kernel_name: torch::executor::_native_batch_norm_legit_out 38 kernel_name: torch::executor::_native_batch_norm_legit_no_stats_out 43 kernel_name: torch::executor::_native_batch_norm_legit_no_training_out 48 kernel_name: torch::executor::_pdist_forward_out 53 kernel_name: torch::executor::softmax_out 58 kernel_name: torch::executor::to_copy_out 63 kernel_name: torch::executor::abs_out 68 kernel_name: torch::executor::acos_out [all …]
|
/external/executorch/backends/vulkan/runtime/graph/ops/utils/ |
D | StagingUtils.cpp | 26 std::string kernel_name; in get_nchw_to_tensor_shader() local 27 kernel_name.reserve(kShaderNameReserve); in get_nchw_to_tensor_shader() 31 kernel_name = "nchw_to_bitw8_image_nobitw8buffer"; in get_nchw_to_tensor_shader() 32 add_storage_type_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader() 33 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader() 34 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader() 38 kernel_name = "nchw_to_buffer"; in get_nchw_to_tensor_shader() 39 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader() 40 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader() 43 kernel_name = "nchw_to_image"; in get_nchw_to_tensor_shader() [all …]
|
D | ShaderNameUtils.cpp | 14 std::string& kernel_name, in add_storage_type_suffix() argument 18 kernel_name += "_buffer"; in add_storage_type_suffix() 21 kernel_name += "_texture3d"; in add_storage_type_suffix() 24 kernel_name += "_texture2d"; in add_storage_type_suffix() 30 std::string& kernel_name, in add_storage_type_suffix() argument 32 return add_storage_type_suffix(kernel_name, tensor.storage_type()); in add_storage_type_suffix() 35 void add_dtype_suffix(std::string& kernel_name, const vkapi::ScalarType dtype) { in add_dtype_suffix() argument 38 kernel_name += "_float"; in add_dtype_suffix() 41 kernel_name += "_half"; in add_dtype_suffix() 44 kernel_name += "_int"; in add_dtype_suffix() [all …]
|
D | ShaderNameUtils.h | 20 std::string& kernel_name, 23 std::string& kernel_name, 26 void add_dtype_suffix(std::string& kernel_name, const vkapi::ScalarType dtype); 27 void add_dtype_suffix(std::string& kernel_name, const api::vTensor& tensor); 29 void add_ndim_suffix(std::string& kernel_name, const size_t ndim); 30 void add_ndim_suffix(std::string& kernel_name, const api::vTensor& tensor); 32 void add_packed_dim_suffix(std::string& kernel_name, const int32_t packed_dim); 34 std::string& kernel_name,
|
/external/executorch/backends/cadence/aot/ |
D | functions.yaml | 18 kernel_name: torch::executor::to_copy_out 23 kernel_name: torch::executor::softmax_out 28 kernel_name: torch::executor::add_out 33 kernel_name: torch::executor::bmm_out 38 kernel_name: torch::executor::cat_out 43 kernel_name: torch::executor::clone_out 48 kernel_name: torch::executor::div_out 53 kernel_name: torch::executor::div_out_mode 58 kernel_name: torch::executor::embedding_out 63 kernel_name: torch::executor::empty_out [all …]
|
D | functions_hifi.yaml | 18 kernel_name: torch::executor::to_copy_out 23 kernel_name: torch::executor::softmax_out 28 kernel_name: cadence::impl::HiFi::add_out 33 kernel_name: torch::executor::bmm_out 38 kernel_name: torch::executor::cat_out 43 kernel_name: torch::executor::clone_out 48 kernel_name: cadence::impl::HiFi::div_out 53 kernel_name: cadence::impl::HiFi::div_out_mode 58 kernel_name: torch::executor::embedding_out 63 kernel_name: torch::executor::full_out [all …]
|
/external/executorch/kernels/optimized/ |
D | optimized.yaml | 8 kernel_name: torch::executor::opt_log_softmax_out 13 kernel_name: torch::executor::opt_add_out 18 kernel_name: torch::executor::opt_add_scalar_out 23 kernel_name: torch::executor::opt_bmm_out 28 kernel_name: torch::executor::opt_div_out 33 kernel_name: torch::executor::opt_div_scalar_out 38 kernel_name: torch::executor::opt_exp_out 43 kernel_name: torch::executor::opt_sigmoid_out 48 kernel_name: torch::executor::opt_gelu_out 53 kernel_name: torch::executor::opt_le_scalar_out [all …]
|
D | optimized-oss.yaml | 11 kernel_name: torch::executor::opt_add_out 16 kernel_name: torch::executor::opt_add_scalar_out 21 kernel_name: torch::executor::opt_bmm_out 26 kernel_name: torch::executor::opt_div_out 31 kernel_name: torch::executor::opt_div_scalar_out 36 kernel_name: torch::executor::opt_exp_out 41 kernel_name: torch::executor::opt_sigmoid_out 46 kernel_name: torch::executor::opt_le_scalar_out 51 kernel_name: torch::executor::opt_le_tensor_out 56 kernel_name: torch::executor::opt_linear_out [all …]
|
/external/pytorch/torch/_inductor/codegen/ |
D | cpp_wrapper_cuda.py | 36 kernel_name: str, 42 self.kernel_name = kernel_name 47 params = CudaKernelParamCache.get(self.kernel_name) 50 ), f"{self.kernel_name} not found in CudaKernelParamCache" 54 ), f"{key} not found in CudaKernelParamCache[{self.kernel_name}]" 61 return DeferredCudaKernelLine(self.kernel_name, line, self.keys) 71 kernel_name: str, 76 self.kernel_name = kernel_name 97 params = CudaKernelParamCache.get(self.kernel_name) 100 ), f"{self.kernel_name} not found in CudaKernelParamCache" [all …]
|
D | debug_utils.py | 34 kernel_name: str = "", 42 self.kernel_name = kernel_name 50 self.kernel_name, 55 def __exit__(self, args_to_print_or_save, kernel_name, arg_signatures): argument 58 kernel_name, 66 kernel_name, argument 76 self.kernel_name, 84 self.kernel_name, 101 kernel_name: str, 112 self.kernel_name = kernel_name [all …]
|
/external/executorch/kernels/quantized/ |
D | quantized.yaml | 5 kernel_name: torch::executor::quantized_add_out 11 kernel_name: torch::executor::choose_qparams_tensor_out 17 kernel_name: torch::executor::dequantize_per_tensor_out 23 kernel_name: torch::executor::dequantize_per_tensor_tensor_args_out 29 kernel_name: torch::executor::quantize_per_channel_out 35 kernel_name: torch::executor::dequantize_per_channel_out 41 kernel_name: torch::executor::quantized_embedding_byte_out 47 kernel_name: torch::executor::quantized_embedding_byte_dtype_out 53 kernel_name: torch::executor::quantized_embedding_2bit_out 59 kernel_name: torch::executor::quantized_embedding_2bit_dtype_out [all …]
|
/external/executorch/kernels/quantized/test/ |
D | targets.bzl | 6 op_test("op_quantize_test", kernel_name = "quantized") 7 op_test("op_dequantize_test", kernel_name = "quantized") 8 op_test("op_choose_qparams_test", kernel_name = "quantized") 9 op_test("op_add_test", kernel_name = "quantized", deps = [ 18 op_test("op_embedding_test", kernel_name = "quantized", deps = [ 28 op_test("op_embedding2b_test", kernel_name = "quantized") 29 op_test("op_embedding4b_test", kernel_name = "quantized") 30 op_test("op_mixed_mm_test", kernel_name = "quantized", deps = [ 36 op_test("op_mixed_linear_test", kernel_name = "quantized", deps = [
|
/external/executorch/shim/xplat/executorch/kernels/test/ |
D | util.bzl | 3 def op_test(name, deps = [], kernel_name = "portable", use_kernel_prefix = False): 13 kernel_name: The name string as in //executorch/kernels/<kernel_name>. 21 if kernel_name == "aten": 31 "//executorch/kernels/{}/cpu:{}".format(kernel_name, op_root), 32 "//executorch/kernels/{}:generated_lib_headers".format(kernel_name), 33 "//executorch/kernels/{}/test:supported_features".format(kernel_name), 38 if kernel_name == "aten": 43 name_prefix = kernel_name + "_" 116 def codegen_function_header_wrapper(kernel_path, kernel_name): 121 Use target "function_header_wrapper_<kernel_name>" in tests. [all …]
|
/external/executorch/backends/vulkan/runtime/graph/ops/impl/ |
D | QuantizedLinear.cpp | 89 std::string kernel_name = "q_8w_linear"; in add_q_8w_linear_node() local 90 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_node() 91 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_node() 92 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(q_mat2)); in add_q_8w_linear_node() 93 add_dtype_suffix(kernel_name, graph.dtype_of(out_W_packed)); in add_q_8w_linear_node() 94 add_storage_type_suffix(kernel_name, graph.storage_type_of(out_W_packed)); in add_q_8w_linear_node() 118 VK_KERNEL_FROM_STR(kernel_name), in add_q_8w_linear_node() 160 std::string kernel_name = "q_8w_linear_optimized"; in add_q_8w_linear_optimized_node() local 161 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_optimized_node() 162 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_optimized_node() [all …]
|
D | Select.cpp | 66 std::string kernel_name; in add_select_int_node() local 75 kernel_name = "select_channel_3d"; in add_select_int_node() 77 kernel_name = "select_height_3d"; in add_select_int_node() 79 kernel_name = "select_width_3d"; in add_select_int_node() 89 kernel_name = "select_batch_4d"; in add_select_int_node() 91 kernel_name = "select_channel_4d"; in add_select_int_node() 93 kernel_name = "select_height_4d"; in add_select_int_node() 95 kernel_name = "select_width_4d"; in add_select_int_node() 102 kernel_name.reserve(kShaderNameReserve); in add_select_int_node() 103 add_dtype_suffix(kernel_name, *t_out); in add_select_int_node() [all …]
|
D | MatMul.cpp | 72 std::string kernel_name = "matmul_naive_buffer"; in add_matmul_naive_buffer_node() local 73 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_buffer_node() 87 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_buffer_node() 123 std::string kernel_name = graph.get_bool(mat2_is_transposed) in add_matmul_naive_texture3d_node() local 126 kernel_name.reserve(kShaderNameReserve); in add_matmul_naive_texture3d_node() 127 add_storage_type_suffix(kernel_name, graph.storage_type_of(out)); in add_matmul_naive_texture3d_node() 128 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_texture3d_node() 133 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_texture3d_node() 184 std::string kernel_name = mat2_is_transposed_val in add_matmul_optimized_node() local 191 kernel_name = "batch_" + kernel_name; in add_matmul_optimized_node() [all …]
|
D | Copy.cpp | 31 std::string kernel_name = "copy_offset"; in add_copy_offset_node() local 32 kernel_name.reserve(kShaderNameReserve); in add_copy_offset_node() 33 add_dtype_suffix(kernel_name, *t_out); in add_copy_offset_node() 34 add_storage_type_suffix(kernel_name, *t_out); in add_copy_offset_node() 46 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_offset_node() 50 VK_KERNEL_FROM_STR(kernel_name), in add_copy_offset_node() 114 std::string kernel_name = "copy_channel_offset"; in add_copy_channel_offset_node() local 115 kernel_name.reserve(kShaderNameReserve); in add_copy_channel_offset_node() 116 add_dtype_suffix(kernel_name, *t_out); in add_copy_channel_offset_node() 154 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_channel_offset_node() [all …]
|
D | Clone.cpp | 41 std::string kernel_name = "clone"; in add_clone_node() local 42 add_dtype_suffix(kernel_name, *t_out); in add_clone_node() 46 VK_KERNEL_FROM_STR(kernel_name), in add_clone_node() 63 std::string kernel_name = "clone_image_to_buffer"; in add_image_to_buffer_node() local 64 add_dtype_suffix(kernel_name, graph.dtype_of(image)); in add_image_to_buffer_node() 65 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in add_image_to_buffer_node() 87 std::string kernel_name = "clone_buffer_to_image"; in add_buffer_to_image_node() local 88 add_dtype_suffix(kernel_name, graph.dtype_of(image)); in add_buffer_to_image_node() 89 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in add_buffer_to_image_node()
|
/external/gemmlowp/meta/generators/ |
D | common.py | 90 def __init__(self, emitter, kernel_name, output_stream_name): argument 91 self.kernel_name = kernel_name 99 in_type, out_type, self.kernel_name, self.output_stream_name, kernel_m, 105 'const FusedKernelParams<%s, %s>&' % (self.kernel_name, 110 _TemplateName(self.kernel_name + self.output_stream_name, 119 def __init__(self, emitter, kernel_name): argument 120 self.kernel_name = kernel_name 127 in_type, out_type, self.kernel_name, kernel_size, leftovers 132 ['const %s&' % self.kernel_name, 'params'], 135 _TemplateName(self.kernel_name, template_params))
|
/external/pytorch/torch/_inductor/codegen/cuda/ |
D | cuda_cpp_scheduling.py | 52 kernel_name = wrapper.src_to_kernel[src_code] 59 kernel_name = "_".join(["cuda", fused_name, wrapper.next_kernel_suffix()]) 61 wrapper.src_to_kernel[src_code] = kernel_name 62 src_code = src_code.replace("KERNEL_NAME", kernel_name) 75 kernel_name, compile_wrapper.getvalue(), metadata_comment 77 return kernel_name 102 kernel_name = self.define_kernel(src_code, node_schedule) 108 call_args, kernel_name, arg_signatures, kernel 111 kernel.call_kernel(kernel_name, ctb)
|
/external/pytorch/torch/_inductor/codegen/rocm/ |
D | rocm_cpp_scheduling.py | 47 kernel_name = wrapper.src_to_kernel[src_code] 54 kernel_name = "_".join(["rocm", fused_name, wrapper.next_kernel_suffix()]) 56 wrapper.src_to_kernel[src_code] = kernel_name 57 src_code = src_code.replace("KERNEL_NAME", kernel_name) 70 kernel_name, compile_wrapper.getvalue(), metadata_comment 72 return kernel_name 96 kernel_name = self.define_kernel(src_code, node_schedule) 97 kernel.call_kernel(kernel_name, ctb)
|
D | rocm_benchmark_request.py | 23 kernel_name: str, 29 super().__init__(kernel_name, input_tensor_meta, output_tensor_meta, extra_args) 57 …"make_run_fn: self.kernel_name=%s, self.source_file=%s, self.hash_key=%s, self.DLL=%s, args=%s, se… 58 self.kernel_name, 66 run_method = getattr(self.DLL, self.kernel_name) 94 run_method = getattr(self.DLL, self.kernel_name) 110 …"update_workspace_size called: new workspace size=%d, self.kernel_name=%s, self.source_file=%s, se… 112 self.kernel_name, 133 return f"{self.kernel_name=}, {self.source_file=}, {self.hash_key=}"
|
/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gemm_sparse/ |
D | 8x4c1x4-dq-packedA-sse2.c | 1 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w32__sse2 macro 4 #undef KERNEL_NAME 7 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w16__sse2 macro 10 #undef KERNEL_NAME 13 #define KERNEL_NAME pytorch_q8gemm_dq_sparse_1x4_ukernel_8x4_packedA_w8__sse2 macro 16 #undef KERNEL_NAME
|
/external/executorch/backends/vulkan/test/utils/ |
D | test_utils.cpp | 120 std::string kernel_name = "bitw8_image_to_nchw_nobitw8buffer"; in record_bitw8_image_to_nchw_nobitw8buffer_op() local 121 add_storage_type_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op() 122 add_dtype_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op() 125 VK_KERNEL_FROM_STR(kernel_name), in record_bitw8_image_to_nchw_nobitw8buffer_op() 146 std::string kernel_name; in record_conv2d_prepack_weights_op() local 148 kernel_name = "conv_transpose2d"; in record_conv2d_prepack_weights_op() 150 kernel_name = "conv2d"; in record_conv2d_prepack_weights_op() 152 kernel_name += "_prepack_weights"; in record_conv2d_prepack_weights_op() 153 add_dtype_suffix(kernel_name, v_dst); in record_conv2d_prepack_weights_op() 154 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in record_conv2d_prepack_weights_op() [all …]
|
/external/OpenCL-CTS/test_conformance/device_execution/ |
D | utils.cpp | 23 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, void* results,… in run_single_kernel() argument 25 …return run_single_kernel_args(context, queue, source, num_lines, kernel_name, results, res_size, 0… in run_single_kernel() 28 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, void* results,… in run_single_kernel_args() argument 30 …return run_n_kernel_args(context, queue, source, num_lines, kernel_name, 1, 1, results, res_size, … in run_single_kernel_args() 33 …_queue queue, const char** source, unsigned int num_lines, const char* kernel_name, size_t local, … in run_n_kernel_args() argument 44 source, kernel_name); in run_n_kernel_args() 51 …d, %d, %p) for kernel: '%s' failed: %d", 0, (int)sizeof(cl_mem), &mem, kernel_name, err_ret)) retu… in run_n_kernel_args() 56 … kernel: '%s' failed: %d", (int)(i+1), (int)args[i].size, args[i].ptr, kernel_name, err_ret)) retu… in run_n_kernel_args() 60 …if(check_error(err_ret, "clEnqueueNDRangeKernel('%s', gws=%d, lws=%d) failed", kernel_name, (int)g… in run_n_kernel_args()
|