/aosp_15_r20/external/XNNPACK/src/f32-ibilinear-chw/ |
H A D | sse.c.in | 98 const __m128 valphav = _mm_shuffle_ps(vw0, vw1, _MM_SHUFFLE(3, 1, 3, 1)); variable 129 const __m128 valphav = _mm_shuffle_ps(vw, vw, _MM_SHUFFLE(3, 1, 3, 1)); variable 170 const __m128 valphav = _mm_load_ps1(w + 1); variable
|
H A D | wasmsimd.c.in | 102 const v128_t valphav = wasm_v32x4_shuffle(vw0, vw1, 1, 3, 5, 7); variable 133 const v128_t valphav = wasm_v32x4_shuffle(vw, vw, 1, 3, 1, 3); variable 174 const v128_t valphav = wasm_v128_load32_splat(w + 1); variable
|
H A D | scalar.c.in | 75 const float valphav = w[1]; variable 102 const float valphav = w[1]; variable
|
/aosp_15_r20/external/XNNPACK/src/f16-ibilinear-chw/ |
H A D | neonfp16arith.c.in | 100 const float16x4_t valphav = vw.val[1]; variable 134 const float16x4_t valphav = vwhv.val[1]; variable 186 const float16x4_t valphav = vwhv.val[1]; variable
|
/aosp_15_r20/external/XNNPACK/src/f32-ibilinear-chw/gen/ |
H A D | sse-p4.c | 56 const __m128 valphav = _mm_shuffle_ps(vw0, vw1, _MM_SHUFFLE(3, 1, 3, 1)); in xnn_f32_ibilinear_chw_ukernel__sse_p4() local 88 const __m128 valphav = _mm_shuffle_ps(vw, vw, _MM_SHUFFLE(3, 1, 3, 1)); in xnn_f32_ibilinear_chw_ukernel__sse_p4() local 130 const __m128 valphav = _mm_load_ps1(w + 1); in xnn_f32_ibilinear_chw_ukernel__sse_p4() local
|
H A D | wasmsimd-p4.c | 60 const v128_t valphav = wasm_v32x4_shuffle(vw0, vw1, 1, 3, 5, 7); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p4() local 92 const v128_t valphav = wasm_v32x4_shuffle(vw, vw, 1, 3, 1, 3); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p4() local 134 const v128_t valphav = wasm_v128_load32_splat(w + 1); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p4() local
|
H A D | neonfma-p4.c | 59 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p4() local 93 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p4() local 141 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neonfma_p4() local
|
H A D | neon-p4.c | 59 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p4() local 93 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p4() local 141 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neon_p4() local
|
H A D | sse-p8.c | 134 const __m128 valphav = _mm_shuffle_ps(vw0, vw1, _MM_SHUFFLE(3, 1, 3, 1)); in xnn_f32_ibilinear_chw_ukernel__sse_p8() local 166 const __m128 valphav = _mm_shuffle_ps(vw, vw, _MM_SHUFFLE(3, 1, 3, 1)); in xnn_f32_ibilinear_chw_ukernel__sse_p8() local 208 const __m128 valphav = _mm_load_ps1(w + 1); in xnn_f32_ibilinear_chw_ukernel__sse_p8() local
|
H A D | wasmsimd-p8.c | 146 const v128_t valphav = wasm_v32x4_shuffle(vw0, vw1, 1, 3, 5, 7); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p8() local 178 const v128_t valphav = wasm_v32x4_shuffle(vw, vw, 1, 3, 1, 3); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p8() local 220 const v128_t valphav = wasm_v128_load32_splat(w + 1); in xnn_f32_ibilinear_chw_ukernel__wasmsimd_p8() local
|
H A D | neonfma-p8.c | 147 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p8() local 181 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p8() local 229 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neonfma_p8() local
|
H A D | neon-p8.c | 147 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p8() local 181 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p8() local 229 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neon_p8() local
|
H A D | neonfma-p16.c | 219 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p16() local 253 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neonfma_p16() local 301 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neonfma_p16() local
|
H A D | neon-p16.c | 219 const float32x4_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p16() local 253 const float32x2_t valphav = vw.val[1]; in xnn_f32_ibilinear_chw_ukernel__neon_p16() local 301 const float32x2_t valphav = vld1_dup_f32(w + 1); in xnn_f32_ibilinear_chw_ukernel__neon_p16() local
|
H A D | scalar-p1.c | 40 const float valphav = w[1]; in xnn_f32_ibilinear_chw_ukernel__scalar_p1() local
|
/aosp_15_r20/external/XNNPACK/src/f16-ibilinear-chw/gen/ |
H A D | neonfp16arith-p4.c | 63 const float16x4_t valphav = vw.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p4() local 98 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p4() local 151 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p4() local
|
H A D | neonfp16arith-p8.c | 130 const float16x4_t valphav = vw.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p8() local 165 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p8() local 218 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p8() local
|
H A D | neonfp16arith-p16.c | 183 const float16x4_t valphav = vw.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p16() local 218 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p16() local 271 const float16x4_t valphav = vwhv.val[1]; in xnn_f16_ibilinear_chw_ukernel__neonfp16arith_p16() local
|
/aosp_15_r20/external/XNNPACK/src/f32-ibilinear/gen/ |
H A D | scalar-c1.c | 36 const float valphav = weights[1]; in xnn_f32_ibilinear_ukernel__scalar_c1() local
|
H A D | wasmsimd-c4.c | 38 const v128_t valphav = wasm_v128_load32_splat(weights + 1); in xnn_f32_ibilinear_ukernel__wasmsimd_c4() local
|
H A D | sse-c4.c | 40 const __m128 valphav = _mm_movehl_ps(valphahv, valphahv); in xnn_f32_ibilinear_ukernel__sse_c4() local
|
/aosp_15_r20/external/XNNPACK/src/u8-ibilinear/gen/ |
H A D | scalar-c1.c | 36 const int32_t valphav = (int32_t) (uint32_t) (uint16_t) weights[1]; in xnn_u8_ibilinear_ukernel__scalar_c1() local
|
/aosp_15_r20/external/XNNPACK/src/s8-ibilinear/gen/ |
H A D | scalar-c1.c | 36 const int32_t valphav = (int32_t) (uint32_t) (uint16_t) weights[1]; in xnn_s8_ibilinear_ukernel__scalar_c1() local
|
/aosp_15_r20/external/XNNPACK/src/f16-ibilinear/gen/ |
H A D | fma3-c8.c | 42 const __m256 valphav = _mm256_permute_ps(valphahv, _MM_SHUFFLE(3, 1, 3, 1)); in xnn_f16_ibilinear_ukernel__fma3_c8() local
|
H A D | neonfp16arith-c8.c | 40 const float16x8_t valphav = vld1q_dup_f16(weights); weights = (const __fp16*) weights + 1; in xnn_f16_ibilinear_ukernel__neonfp16arith_c8() local
|