Home
last modified time | relevance | path

Searched full:kernel_name (Results 1 – 25 of 365) sorted by relevance

12345678910>>...15

/aosp_15_r20/external/executorch/kernels/portable/
H A Dfunctions.yaml23 kernel_name: torch::executor::_cdist_forward_out
28 kernel_name: torch::executor::log_softmax_out
33 kernel_name: torch::executor::_native_batch_norm_legit_out
38 kernel_name: torch::executor::_native_batch_norm_legit_no_stats_out
43 kernel_name: torch::executor::_native_batch_norm_legit_no_training_out
48 kernel_name: torch::executor::_pdist_forward_out
53 kernel_name: torch::executor::softmax_out
58 kernel_name: torch::executor::to_copy_out
63 kernel_name: torch::executor::abs_out
68 kernel_name: torch::executor::acos_out
[all …]
/aosp_15_r20/external/executorch/backends/cadence/aot/
H A Dfunctions.yaml18 kernel_name: torch::executor::to_copy_out
23 kernel_name: torch::executor::softmax_out
28 kernel_name: torch::executor::add_out
33 kernel_name: torch::executor::bmm_out
38 kernel_name: torch::executor::cat_out
43 kernel_name: torch::executor::clone_out
48 kernel_name: torch::executor::div_out
53 kernel_name: torch::executor::div_out_mode
58 kernel_name: torch::executor::embedding_out
63 kernel_name: torch::executor::empty_out
[all …]
H A Dfunctions_hifi.yaml18 kernel_name: torch::executor::to_copy_out
23 kernel_name: torch::executor::softmax_out
28 kernel_name: cadence::impl::HiFi::add_out
33 kernel_name: torch::executor::bmm_out
38 kernel_name: torch::executor::cat_out
43 kernel_name: torch::executor::clone_out
48 kernel_name: cadence::impl::HiFi::div_out
53 kernel_name: cadence::impl::HiFi::div_out_mode
58 kernel_name: torch::executor::embedding_out
63 kernel_name: torch::executor::full_out
[all …]
/aosp_15_r20/external/executorch/backends/vulkan/runtime/graph/ops/utils/
H A DStagingUtils.cpp26 std::string kernel_name; in get_nchw_to_tensor_shader() local
27 kernel_name.reserve(kShaderNameReserve); in get_nchw_to_tensor_shader()
31 kernel_name = "nchw_to_bitw8_image_nobitw8buffer"; in get_nchw_to_tensor_shader()
32 add_storage_type_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
33 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
34 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader()
38 kernel_name = "nchw_to_buffer"; in get_nchw_to_tensor_shader()
39 add_dtype_suffix(kernel_name, v_dst); in get_nchw_to_tensor_shader()
40 return VK_KERNEL_FROM_STR(kernel_name); in get_nchw_to_tensor_shader()
43 kernel_name = "nchw_to_image"; in get_nchw_to_tensor_shader()
[all …]
H A DShaderNameUtils.cpp14 std::string& kernel_name, in add_storage_type_suffix() argument
18 kernel_name += "_buffer"; in add_storage_type_suffix()
21 kernel_name += "_texture3d"; in add_storage_type_suffix()
24 kernel_name += "_texture2d"; in add_storage_type_suffix()
30 std::string& kernel_name, in add_storage_type_suffix() argument
32 return add_storage_type_suffix(kernel_name, tensor.storage_type()); in add_storage_type_suffix()
35 void add_dtype_suffix(std::string& kernel_name, const vkapi::ScalarType dtype) { in add_dtype_suffix() argument
38 kernel_name += "_float"; in add_dtype_suffix()
41 kernel_name += "_half"; in add_dtype_suffix()
44 kernel_name += "_int"; in add_dtype_suffix()
[all …]
/aosp_15_r20/external/pytorch/torch/_inductor/codegen/
H A Dcpp_wrapper_cuda.py36 kernel_name: str,
42 self.kernel_name = kernel_name
47 params = CudaKernelParamCache.get(self.kernel_name)
50 ), f"{self.kernel_name} not found in CudaKernelParamCache"
54 ), f"{key} not found in CudaKernelParamCache[{self.kernel_name}]"
61 return DeferredCudaKernelLine(self.kernel_name, line, self.keys)
71 kernel_name: str,
76 self.kernel_name = kernel_name
97 params = CudaKernelParamCache.get(self.kernel_name)
100 ), f"{self.kernel_name} not found in CudaKernelParamCache"
[all …]
H A Ddebug_utils.py34 kernel_name: str = "",
42 self.kernel_name = kernel_name
50 self.kernel_name,
55 def __exit__(self, args_to_print_or_save, kernel_name, arg_signatures): argument
58 kernel_name,
66 kernel_name, argument
76 self.kernel_name,
84 self.kernel_name,
101 kernel_name: str,
112 self.kernel_name = kernel_name
[all …]
H A Dmulti_kernel.py103 kernel_names = tuple(k.kernel_name for k in kernels)
150 self.kernel_name = V.graph.wrapper_code.multi_kernel_state.define_kernel(
158 def call_kernel(self, kernel_name): argument
163 assert kernel_name == self.kernel_name
176 picked_kernel = MultiKernelCall.lookup_choice(kernel_name)
177 kernel_name = self.kernels[picked_kernel].kernel_name
181 kernel_name, call_args, arg_types, grid
184 grid = V.graph.wrapper_code.generate_default_grid(kernel_name, grid)
186 kernel_name,
225 def warn_mix_layout(self, kernel_name: str):
[all …]
/aosp_15_r20/external/executorch/kernels/optimized/
H A Doptimized.yaml8 kernel_name: torch::executor::opt_log_softmax_out
13 kernel_name: torch::executor::opt_add_out
18 kernel_name: torch::executor::opt_add_scalar_out
23 kernel_name: torch::executor::opt_bmm_out
28 kernel_name: torch::executor::opt_div_out
33 kernel_name: torch::executor::opt_div_scalar_out
38 kernel_name: torch::executor::opt_exp_out
43 kernel_name: torch::executor::opt_sigmoid_out
48 kernel_name: torch::executor::opt_gelu_out
53 kernel_name: torch::executor::opt_le_scalar_out
[all …]
H A Doptimized-oss.yaml11 kernel_name: torch::executor::opt_add_out
16 kernel_name: torch::executor::opt_add_scalar_out
21 kernel_name: torch::executor::opt_bmm_out
26 kernel_name: torch::executor::opt_div_out
31 kernel_name: torch::executor::opt_div_scalar_out
36 kernel_name: torch::executor::opt_exp_out
41 kernel_name: torch::executor::opt_sigmoid_out
46 kernel_name: torch::executor::opt_le_scalar_out
51 kernel_name: torch::executor::opt_le_tensor_out
56 kernel_name: torch::executor::opt_linear_out
[all …]
/aosp_15_r20/external/executorch/kernels/quantized/
H A Dquantized.yaml5 kernel_name: torch::executor::quantized_add_out
11 kernel_name: torch::executor::choose_qparams_tensor_out
17 kernel_name: torch::executor::dequantize_per_tensor_out
23 kernel_name: torch::executor::dequantize_per_tensor_tensor_args_out
29 kernel_name: torch::executor::quantize_per_channel_out
35 kernel_name: torch::executor::dequantize_per_channel_out
41 kernel_name: torch::executor::quantized_embedding_byte_out
47 kernel_name: torch::executor::quantized_embedding_byte_dtype_out
53 kernel_name: torch::executor::quantized_embedding_2bit_out
59 kernel_name: torch::executor::quantized_embedding_2bit_dtype_out
[all …]
/aosp_15_r20/external/executorch/backends/vulkan/runtime/graph/ops/impl/
H A DQuantizedLinear.cpp89 std::string kernel_name = "q_8w_linear"; in add_q_8w_linear_node() local
90 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_node()
91 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_node()
92 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(q_mat2)); in add_q_8w_linear_node()
93 add_dtype_suffix(kernel_name, graph.dtype_of(out_W_packed)); in add_q_8w_linear_node()
94 add_storage_type_suffix(kernel_name, graph.storage_type_of(out_W_packed)); in add_q_8w_linear_node()
118 VK_KERNEL_FROM_STR(kernel_name), in add_q_8w_linear_node()
160 std::string kernel_name = "q_8w_linear_optimized"; in add_q_8w_linear_optimized_node() local
161 kernel_name.reserve(kShaderNameReserve); in add_q_8w_linear_optimized_node()
162 add_packed_dim_suffix(kernel_name, graph.packed_dim_of(mat1_W_packed)); in add_q_8w_linear_optimized_node()
[all …]
H A DMatMul.cpp72 std::string kernel_name = "matmul_naive_buffer"; in add_matmul_naive_buffer_node() local
73 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_buffer_node()
87 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_buffer_node()
123 std::string kernel_name = graph.get_bool(mat2_is_transposed) in add_matmul_naive_texture3d_node() local
126 kernel_name.reserve(kShaderNameReserve); in add_matmul_naive_texture3d_node()
127 add_storage_type_suffix(kernel_name, graph.storage_type_of(out)); in add_matmul_naive_texture3d_node()
128 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_matmul_naive_texture3d_node()
133 VK_KERNEL_FROM_STR(kernel_name), in add_matmul_naive_texture3d_node()
184 std::string kernel_name = mat2_is_transposed_val in add_matmul_optimized_node() local
191 kernel_name = "batch_" + kernel_name; in add_matmul_optimized_node()
[all …]
H A DConvolution.cpp130 std::string kernel_name; in get_conv2d_shader() local
131 kernel_name.reserve(kShaderNameReserve); in get_conv2d_shader()
134 kernel_name = "conv2d_dw"; in get_conv2d_shader()
138 kernel_name += "_output_tile_3x3"; in get_conv2d_shader()
141 kernel_name += "_output_tile_5x5"; in get_conv2d_shader()
147 kernel_name = "conv2d"; in get_conv2d_shader()
149 kernel_name = "conv2d_pw"; in get_conv2d_shader()
153 kernel_name = "conv2d"; in get_conv2d_shader()
156 kernel_name = "conv_transpose2d"; in get_conv2d_shader()
160 kernel_name += "_prepack_weights"; in get_conv2d_shader()
[all …]
H A DSelect.cpp66 std::string kernel_name; in add_select_int_node() local
75 kernel_name = "select_channel_3d"; in add_select_int_node()
77 kernel_name = "select_height_3d"; in add_select_int_node()
79 kernel_name = "select_width_3d"; in add_select_int_node()
89 kernel_name = "select_batch_4d"; in add_select_int_node()
91 kernel_name = "select_channel_4d"; in add_select_int_node()
93 kernel_name = "select_height_4d"; in add_select_int_node()
95 kernel_name = "select_width_4d"; in add_select_int_node()
102 kernel_name.reserve(kShaderNameReserve); in add_select_int_node()
103 add_dtype_suffix(kernel_name, *t_out); in add_select_int_node()
[all …]
H A DCopy.cpp31 std::string kernel_name = "copy_offset"; in add_copy_offset_node() local
32 kernel_name.reserve(kShaderNameReserve); in add_copy_offset_node()
33 add_dtype_suffix(kernel_name, *t_out); in add_copy_offset_node()
34 add_storage_type_suffix(kernel_name, *t_out); in add_copy_offset_node()
46 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_offset_node()
50 VK_KERNEL_FROM_STR(kernel_name), in add_copy_offset_node()
114 std::string kernel_name = "copy_channel_offset"; in add_copy_channel_offset_node() local
115 kernel_name.reserve(kShaderNameReserve); in add_copy_channel_offset_node()
116 add_dtype_suffix(kernel_name, *t_out); in add_copy_channel_offset_node()
154 auto shader = VK_KERNEL_FROM_STR(kernel_name); in add_copy_channel_offset_node()
[all …]
H A DLinear.cpp103 std::string kernel_name = in add_addmm_naive_node() local
105 kernel_name.reserve(kShaderNameReserve); in add_addmm_naive_node()
106 add_storage_type_suffix(kernel_name, graph.storage_type_of(out)); in add_addmm_naive_node()
107 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_addmm_naive_node()
112 VK_KERNEL_FROM_STR(kernel_name), in add_addmm_naive_node()
169 std::string kernel_name = graph.get_bool(mat2_is_transposed) in add_addmm_optimized_node() local
176 kernel_name = "batch_" + kernel_name; in add_addmm_optimized_node()
179 kernel_name += "_tile_row_2"; in add_addmm_optimized_node()
181 kernel_name += "_tile_row_4"; in add_addmm_optimized_node()
184 add_dtype_suffix(kernel_name, graph.dtype_of(out)); in add_addmm_optimized_node()
[all …]
/aosp_15_r20/external/executorch/backends/vulkan/test/utils/
H A Dtest_utils.cpp120 std::string kernel_name = "bitw8_image_to_nchw_nobitw8buffer"; in record_bitw8_image_to_nchw_nobitw8buffer_op() local
121 add_storage_type_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op()
122 add_dtype_suffix(kernel_name, v_src); in record_bitw8_image_to_nchw_nobitw8buffer_op()
125 VK_KERNEL_FROM_STR(kernel_name), in record_bitw8_image_to_nchw_nobitw8buffer_op()
146 std::string kernel_name; in record_conv2d_prepack_weights_op() local
148 kernel_name = "conv_transpose2d"; in record_conv2d_prepack_weights_op()
150 kernel_name = "conv2d"; in record_conv2d_prepack_weights_op()
152 kernel_name += "_prepack_weights"; in record_conv2d_prepack_weights_op()
153 add_dtype_suffix(kernel_name, v_dst); in record_conv2d_prepack_weights_op()
154 vkapi::ShaderInfo shader = VK_KERNEL_FROM_STR(kernel_name); in record_conv2d_prepack_weights_op()
[all …]
/aosp_15_r20/external/pytorch/torch/_inductor/
H A Dautotune_process.py481 kernel_name: str,
487 self.kernel_name = kernel_name
609 kernel_name: str,
620 super().__init__(kernel_name, input_tensor_meta, output_tensor_meta, extra_args)
638 run_method = getattr(mod, self.kernel_name).run
674 getattr(mod, self.kernel_name).precompile()
677 return f"{self.kernel_name=}, {self.module_path=}, {self.module_cache_key=}"
686 kernel_name: str,
692 super().__init__(kernel_name, input_tensor_meta, output_tensor_meta, extra_args)
719 …"make_run_fn: self.kernel_name=%s, self.source_file=%s, self.hash_key=%s, self.DLL=%s, args=%s, se…
[all …]
/aosp_15_r20/external/executorch/shim/xplat/executorch/kernels/test/
H A Dutil.bzl3 def op_test(name, deps = [], kernel_name = "portable", use_kernel_prefix = False):
13 kernel_name: The name string as in //executorch/kernels/<kernel_name>.
21 if kernel_name == "aten":
31 "//executorch/kernels/{}/cpu:{}".format(kernel_name, op_root),
32 "//executorch/kernels/{}:generated_lib_headers".format(kernel_name),
33 "//executorch/kernels/{}/test:supported_features".format(kernel_name),
38 if kernel_name == "aten":
43 name_prefix = kernel_name + "_"
116 def codegen_function_header_wrapper(kernel_path, kernel_name):
121 Use target "function_header_wrapper_<kernel_name>" in tests.
[all …]
/aosp_15_r20/external/gemmlowp/meta/generators/
H A Dcommon.py90 def __init__(self, emitter, kernel_name, output_stream_name): argument
91 self.kernel_name = kernel_name
99 in_type, out_type, self.kernel_name, self.output_stream_name, kernel_m,
105 'const FusedKernelParams<%s, %s>&' % (self.kernel_name,
110 _TemplateName(self.kernel_name + self.output_stream_name,
119 def __init__(self, emitter, kernel_name): argument
120 self.kernel_name = kernel_name
127 in_type, out_type, self.kernel_name, kernel_size, leftovers
132 ['const %s&' % self.kernel_name, 'params'],
135 _TemplateName(self.kernel_name, template_params))
/aosp_15_r20/external/OpenCL-CTS/test_conformance/math_brute_force/
H A Dcommon.cpp123 std::string GetUnaryKernel(const std::string &kernel_name, const char *builtin, in GetUnaryKernel() argument
136 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE* out, in GetUnaryKernel()
145 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE_SCALAR* out, in GetUnaryKernel()
197 std::string GetUnaryKernel(const std::string &kernel_name, const char *builtin, in GetUnaryKernel() argument
212 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE1* out1, in GetUnaryKernel()
222 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE1_SCALAR* out1, in GetUnaryKernel()
280 std::string GetBinaryKernel(const std::string &kernel_name, const char *builtin, in GetBinaryKernel() argument
312 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE* out, in GetBinaryKernel()
322 __kernel void )", kernel_name.c_str(), R"((__global RETTYPE_SCALAR* out, in GetBinaryKernel()
379 std::string GetBinaryKernel(const std::string &kernel_name, const char *builtin, in GetBinaryKernel() argument
[all …]
/aosp_15_r20/external/pytorch/torch/_inductor/codegen/cuda/
H A Dcuda_cpp_scheduling.py52 kernel_name = wrapper.src_to_kernel[src_code]
59 kernel_name = "_".join(["cuda", fused_name, wrapper.next_kernel_suffix()])
61 wrapper.src_to_kernel[src_code] = kernel_name
62 src_code = src_code.replace("KERNEL_NAME", kernel_name)
75 kernel_name, compile_wrapper.getvalue(), metadata_comment
77 return kernel_name
102 kernel_name = self.define_kernel(src_code, node_schedule)
108 call_args, kernel_name, arg_signatures, kernel
111 kernel.call_kernel(kernel_name, ctb)
/aosp_15_r20/external/executorch/kernels/quantized/test/
H A Dtargets.bzl6 op_test("op_quantize_test", kernel_name = "quantized")
7 op_test("op_dequantize_test", kernel_name = "quantized")
8 op_test("op_choose_qparams_test", kernel_name = "quantized")
9 op_test("op_add_test", kernel_name = "quantized", deps = [
18 op_test("op_embedding_test", kernel_name = "quantized", deps = [
28 op_test("op_embedding2b_test", kernel_name = "quantized")
29 op_test("op_embedding4b_test", kernel_name = "quantized")
30 op_test("op_mixed_mm_test", kernel_name = "quantized", deps = [
36 op_test("op_mixed_linear_test", kernel_name = "quantized", deps = [
/aosp_15_r20/external/ComputeLibrary/src/gpu/cl/kernels/
H A DClIm2ColKernel.cpp56 std::string kernel_name{}; member
162 std::string kernel_name = "im2col_generic_"; in configure_opencl_kernel() local
197 kernel_name = "im2col3x3_"; in configure_opencl_kernel()
202 kernel_name = "im2col9x9_"; in configure_opencl_kernel()
233 kernel_name = "im2col1x1_stridex1_"; in configure_opencl_kernel()
239 kernel_name = "im2col3x3_"; in configure_opencl_kernel()
244 kernel_name = "im2col5x5_"; in configure_opencl_kernel()
252 kernel_name = "im2col11x11_padx0_pady0_"; in configure_opencl_kernel()
258 kernel_name = "im2col_generic_"; in configure_opencl_kernel()
266 kernel_name = "im2col_generic_padx0_pady0_"; in configure_opencl_kernel()
[all …]

12345678910>>...15