// Copyright 2022 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker
6*4bdc9457SAndroid Build Coastguard Worker #include <assert.h>
7*4bdc9457SAndroid Build Coastguard Worker #include <stddef.h>
8*4bdc9457SAndroid Build Coastguard Worker #include <stdint.h>
9*4bdc9457SAndroid Build Coastguard Worker #include <string.h>
10*4bdc9457SAndroid Build Coastguard Worker
11*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack.h>
12*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/log.h>
13*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/operator.h>
14*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/params.h>
15*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/subgraph.h>
16*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/subgraph-validation.h>
17*4bdc9457SAndroid Build Coastguard Worker
create_transpose_operator(const struct xnn_node * node,const struct xnn_value * values,size_t num_values,struct xnn_operator_data * opdata,const struct xnn_caches * caches)18*4bdc9457SAndroid Build Coastguard Worker static enum xnn_status create_transpose_operator(
19*4bdc9457SAndroid Build Coastguard Worker const struct xnn_node* node,
20*4bdc9457SAndroid Build Coastguard Worker const struct xnn_value* values,
21*4bdc9457SAndroid Build Coastguard Worker size_t num_values,
22*4bdc9457SAndroid Build Coastguard Worker struct xnn_operator_data* opdata,
23*4bdc9457SAndroid Build Coastguard Worker const struct xnn_caches* caches)
24*4bdc9457SAndroid Build Coastguard Worker {
25*4bdc9457SAndroid Build Coastguard Worker assert(node->num_inputs == 1);
26*4bdc9457SAndroid Build Coastguard Worker const uint32_t input_id = node->inputs[0];
27*4bdc9457SAndroid Build Coastguard Worker assert(input_id != XNN_INVALID_VALUE_ID);
28*4bdc9457SAndroid Build Coastguard Worker assert(input_id < num_values);
29*4bdc9457SAndroid Build Coastguard Worker
30*4bdc9457SAndroid Build Coastguard Worker assert(node->num_outputs == 1);
31*4bdc9457SAndroid Build Coastguard Worker const uint32_t output_id = node->outputs[0];
32*4bdc9457SAndroid Build Coastguard Worker assert(output_id != XNN_INVALID_VALUE_ID);
33*4bdc9457SAndroid Build Coastguard Worker assert(output_id < num_values);
34*4bdc9457SAndroid Build Coastguard Worker
35*4bdc9457SAndroid Build Coastguard Worker enum xnn_status status;
36*4bdc9457SAndroid Build Coastguard Worker switch (node->compute_type) {
37*4bdc9457SAndroid Build Coastguard Worker case xnn_compute_type_fp32:
38*4bdc9457SAndroid Build Coastguard Worker status = xnn_create_transpose_nd_x32(node->flags, &opdata->operator_objects[0]);
39*4bdc9457SAndroid Build Coastguard Worker break;
40*4bdc9457SAndroid Build Coastguard Worker #ifndef XNN_NO_F16_OPERATORS
41*4bdc9457SAndroid Build Coastguard Worker case xnn_compute_type_fp16:
42*4bdc9457SAndroid Build Coastguard Worker status = xnn_create_transpose_nd_x16(node->flags, &opdata->operator_objects[0]);
43*4bdc9457SAndroid Build Coastguard Worker break;
44*4bdc9457SAndroid Build Coastguard Worker #endif
45*4bdc9457SAndroid Build Coastguard Worker #if !defined(XNN_NO_QS8_OPERATORS) || !defined(XNN_NO_QU8_OPERATORS)
46*4bdc9457SAndroid Build Coastguard Worker case xnn_compute_type_qs8:
47*4bdc9457SAndroid Build Coastguard Worker case xnn_compute_type_qu8:
48*4bdc9457SAndroid Build Coastguard Worker status = xnn_create_transpose_nd_x8(node->flags, &opdata->operator_objects[0]);
49*4bdc9457SAndroid Build Coastguard Worker break;
50*4bdc9457SAndroid Build Coastguard Worker #endif
51*4bdc9457SAndroid Build Coastguard Worker default:
52*4bdc9457SAndroid Build Coastguard Worker XNN_UNREACHABLE;
53*4bdc9457SAndroid Build Coastguard Worker }
54*4bdc9457SAndroid Build Coastguard Worker
55*4bdc9457SAndroid Build Coastguard Worker if (status == xnn_status_success) {
56*4bdc9457SAndroid Build Coastguard Worker opdata->inputs[0] = input_id;
57*4bdc9457SAndroid Build Coastguard Worker opdata->outputs[0] = output_id;
58*4bdc9457SAndroid Build Coastguard Worker opdata->shape1.num_dims = node->params.transpose.num_dims;
59*4bdc9457SAndroid Build Coastguard Worker opdata->shape2.num_dims = node->params.transpose.num_dims;
60*4bdc9457SAndroid Build Coastguard Worker memcpy(opdata->shape1.dim, values[input_id].shape.dim, opdata->shape1.num_dims * sizeof(size_t));
61*4bdc9457SAndroid Build Coastguard Worker memcpy(opdata->shape2.dim, node->params.transpose.perm, opdata->shape2.num_dims * sizeof(size_t));
62*4bdc9457SAndroid Build Coastguard Worker }
63*4bdc9457SAndroid Build Coastguard Worker
64*4bdc9457SAndroid Build Coastguard Worker return status;
65*4bdc9457SAndroid Build Coastguard Worker }
66*4bdc9457SAndroid Build Coastguard Worker
// Node "setup" callback for static transpose.
//
// Looks up the input and output blobs by the IDs stored in opdata and binds
// their data pointers to the previously created operator, together with the
// input shape (opdata->shape1) and the permutation (opdata->shape2.dim).
// The setup function is chosen from the type of opdata->operator_objects[0].
//
// Returns the status reported by the matching xnn_setup_transpose_nd_* call.
static enum xnn_status setup_transpose_operator(
  const struct xnn_operator_data* opdata,
  const struct xnn_blob* blobs,
  size_t num_blobs,
  pthreadpool_t threadpool)
{
  const uint32_t src_id = opdata->inputs[0];
  assert(src_id != XNN_INVALID_VALUE_ID);
  assert(src_id < num_blobs);

  const uint32_t dst_id = opdata->outputs[0];
  assert(dst_id != XNN_INVALID_VALUE_ID);
  assert(dst_id < num_blobs);

  const void* src_data = blobs[src_id].data;
  assert(src_data != NULL);

  void* dst_data = blobs[dst_id].data;
  assert(dst_data != NULL);

  // Arguments shared by every element-width variant.
  const size_t num_dims = opdata->shape1.num_dims;
  const size_t* src_shape = opdata->shape1.dim;
  const size_t* perm = opdata->shape2.dim;

  enum xnn_status status;
  switch (opdata->operator_objects[0]->type) {
    case xnn_operator_type_transpose_nd_x32:
      status = xnn_setup_transpose_nd_x32(
        opdata->operator_objects[0], src_data, dst_data,
        num_dims, src_shape, perm, threadpool);
      break;
#ifndef XNN_NO_F16_OPERATORS
    case xnn_operator_type_transpose_nd_x16:
      status = xnn_setup_transpose_nd_x16(
        opdata->operator_objects[0], src_data, dst_data,
        num_dims, src_shape, perm, threadpool);
      break;
#endif  // !defined(XNN_NO_F16_OPERATORS)
#if !defined(XNN_NO_QS8_OPERATORS) || !defined(XNN_NO_QU8_OPERATORS)
    case xnn_operator_type_transpose_nd_x8:
      status = xnn_setup_transpose_nd_x8(
        opdata->operator_objects[0], src_data, dst_data,
        num_dims, src_shape, perm, threadpool);
      break;
#endif  // !defined(XNN_NO_QS8_OPERATORS) || !defined(XNN_NO_QU8_OPERATORS)
    default:
      XNN_UNREACHABLE;
  }

  return status;
}
134*4bdc9457SAndroid Build Coastguard Worker
// Adds a static transpose node to `subgraph`.
//
// Parameters:
//   subgraph  - subgraph that receives the new node.
//   num_dims  - number of entries in `perm`; must be in [1, XNN_MAX_TENSOR_DIMS].
//   perm      - permutation of 0..num_dims-1 (each index exactly once); must
//               not be NULL. The array is copied into the node.
//   input_id  - ID of the input value; must be a dense fp32/qint8/quint8 value
//               (the quantized types only when the matching operators are
//               compiled in).
//   output_id - ID of the output value; same datatype rules as the input, and
//               it must pass xnn_subgraph_check_datatype_matches against it.
//   flags     - stored on the node and forwarded to the operator constructor.
//
// Returns:
//   xnn_status_success on success;
//   xnn_status_invalid_parameter for a bad num_dims / perm or an unsupported
//     datatype;
//   xnn_status_out_of_memory if a node cannot be allocated;
//   otherwise the status reported by the failing subgraph validation helper.
//
// Note: this function only ever selects the fp32, qs8 or qu8 compute type
// from the output datatype.
enum xnn_status xnn_define_static_transpose(
  xnn_subgraph_t subgraph,
  size_t num_dims,
  const size_t* perm,
  uint32_t input_id,
  uint32_t output_id,
  uint32_t flags)
{
  enum xnn_status status;
  if ((status = xnn_subgraph_check_xnnpack_initialized(xnn_node_type_static_transpose)) != xnn_status_success) {
    return status;
  }

  if (num_dims == 0) {
    xnn_log_error(
      "failed to create %s operator with %zu num_dims: num_dims must be non-zero",
      xnn_node_type_to_string(xnn_node_type_static_transpose), num_dims);
    return xnn_status_invalid_parameter;
  }

  if (num_dims > XNN_MAX_TENSOR_DIMS) {
    xnn_log_error(
      "failed to create %s operator with %zu num_dims: num_dims must be <= %d",
      xnn_node_type_to_string(xnn_node_type_static_transpose), num_dims, XNN_MAX_TENSOR_DIMS);
    return xnn_status_invalid_parameter;
  }

  // num_dims is non-zero here, so perm is about to be dereferenced; reject a
  // NULL pointer with an error instead of crashing.
  if (perm == NULL) {
    xnn_log_error(
      "failed to create %s operator with NULL perm: perm must point to num_dims (%zu) entries",
      xnn_node_type_to_string(xnn_node_type_static_transpose), num_dims);
    return xnn_status_invalid_parameter;
  }

  // Every permutation entry must name an existing dimension.
  for (size_t i = 0; i < num_dims; ++i) {
    if (perm[i] >= num_dims) {
      xnn_log_error(
        "failed to create %s operator with %zu perm and %zu num_dims: 0 <= perm < num_dims",
        xnn_node_type_to_string(xnn_node_type_static_transpose), perm[i], num_dims);
      return xnn_status_invalid_parameter;
    }
  }

  // Each dimension may appear only once. num_dims >= 1 was established
  // above, so num_dims - 1 cannot wrap around.
  for (size_t i = 0; i < num_dims - 1; ++i) {
    for (size_t j = i + 1; j < num_dims; ++j) {
      if (perm[i] == perm[j]) {
        xnn_log_error(
          "failed to create %s operator with duplicate entries in perm",
          xnn_node_type_to_string(xnn_node_type_static_transpose));
        return xnn_status_invalid_parameter;
      }
    }
  }

  if ((status = xnn_subgraph_check_input_node_id(xnn_node_type_static_transpose, input_id, subgraph->num_values)) !=
      xnn_status_success) {
    return status;
  }

  const struct xnn_value* input_value = &subgraph->values[input_id];
  status = xnn_subgraph_check_input_type_dense(xnn_node_type_static_transpose, input_id, input_value);
  if (status != xnn_status_success) {
    return status;
  }

  status = xnn_subgraph_check_output_node_id(xnn_node_type_static_transpose, output_id, subgraph->num_values);
  if (status != xnn_status_success) {
    return status;
  }

  const struct xnn_value* output_value = &subgraph->values[output_id];
  status = xnn_subgraph_check_output_type_dense(xnn_node_type_static_transpose, output_id, output_value);
  if (status != xnn_status_success) {
    return status;
  }

  // The compute type is derived from the output datatype.
  enum xnn_compute_type compute_type = xnn_compute_type_invalid;
  switch (output_value->datatype) {
    case xnn_datatype_fp32:
      compute_type = xnn_compute_type_fp32;
      break;
#ifndef XNN_NO_QS8_OPERATORS
    case xnn_datatype_qint8:
      compute_type = xnn_compute_type_qs8;
      break;
#endif  // !defined(XNN_NO_QS8_OPERATORS)
#ifndef XNN_NO_QU8_OPERATORS
    case xnn_datatype_quint8:
      compute_type = xnn_compute_type_qu8;
      break;
#endif  // !defined(XNN_NO_QU8_OPERATORS)
    default:
      xnn_log_error(
        "failed to define %s operator with output ID #%" PRIu32 ": unsupported Value datatype %s (%d)",
        xnn_node_type_to_string(xnn_node_type_static_transpose), output_id,
        xnn_datatype_to_string(output_value->datatype), output_value->datatype);
      return xnn_status_invalid_parameter;
  }

  // The input must use one of the supported datatypes as well.
  switch (input_value->datatype) {
    case xnn_datatype_fp32:
#ifndef XNN_NO_QS8_OPERATORS
    case xnn_datatype_qint8:
#endif  // !defined(XNN_NO_QS8_OPERATORS)
#ifndef XNN_NO_QU8_OPERATORS
    case xnn_datatype_quint8:
#endif  // !defined(XNN_NO_QU8_OPERATORS)
      break;
    default:
      xnn_log_error(
        "failed to define %s operator with input ID #%" PRIu32 ": unsupported Value datatype %s (%d)",
        xnn_node_type_to_string(xnn_node_type_static_transpose), input_id,
        xnn_datatype_to_string(input_value->datatype), input_value->datatype);
      return xnn_status_invalid_parameter;
  }

  status = xnn_subgraph_check_datatype_matches(
    xnn_node_type_static_transpose, input_id, input_value, output_id, output_value);
  if (status != xnn_status_success) {
    return status;
  }

  struct xnn_node* node = xnn_subgraph_new_node(subgraph);
  if (node == NULL) {
    return xnn_status_out_of_memory;
  }

  node->type = xnn_node_type_static_transpose;
  node->compute_type = compute_type;
  node->num_inputs = 1;
  node->inputs[0] = input_id;
  node->num_outputs = 1;
  node->outputs[0] = output_id;
  node->flags = flags;

  // The node keeps its own copy of the permutation, so the caller's array
  // does not need to outlive this call.
  node->params.transpose.num_dims = num_dims;
  memcpy(node->params.transpose.perm, perm, num_dims * sizeof(size_t));

  node->create = create_transpose_operator;
  node->setup = setup_transpose_operator;

  return xnn_status_success;
}
271