Home
last modified time | relevance | path

Searched defs:vb3 (Results 1 – 25 of 552) sorted by relevance

12345678910>>...23

/aosp_15_r20/external/XNNPACK/src/bf16-gemm/gen/
H A D1x4c8-minmax-neonbf16-bfmlal.c56 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonbf16_bfmlal() local
74 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonbf16_bfmlal() local
H A D1x4c8-minmax-neonbf16-bfdot.c56 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonbf16_bfdot() local
69 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonbf16_bfdot() local
H A D2x4c8-minmax-neonbf16-bfmlal.c67 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonbf16_bfmlal() local
94 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonbf16_bfmlal() local
H A D2x4c8-minmax-neonbf16-bfdot.c67 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonbf16_bfdot() local
85 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonbf16_bfdot() local
H A D1x4c8-minmax-neonfma-shland.c57 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonfma_shland() local
89 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonfma_shland() local
H A D1x4c8-minmax-neonfma-zip.c57 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonfma_zip() local
89 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_1x4c8__neonfma_zip() local
H A D3x4c8-minmax-neonbf16-bfdot.c78 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonbf16_bfdot() local
101 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonbf16_bfdot() local
H A D3x4c8-minmax-neonbf16-bfmlal.c78 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonbf16_bfmlal() local
114 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonbf16_bfmlal() local
H A D4x4c8-minmax-neonbf16-bfdot.c89 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonbf16_bfdot() local
117 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonbf16_bfdot() local
H A D2x4c8-minmax-neonfma-zip.c68 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonfma_zip() local
111 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonfma_zip() local
H A D2x4c8-minmax-neonfma-shland.c68 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonfma_shland() local
111 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_2x4c8__neonfma_shland() local
H A D4x4c8-minmax-neonbf16-bfmlal.c89 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonbf16_bfmlal() local
134 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonbf16_bfmlal() local
H A D5x4c8-minmax-neonbf16-bfdot.c100 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonbf16_bfdot() local
133 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonbf16_bfdot() local
H A D5x4c8-minmax-neonbf16-bfmlal.c100 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonbf16_bfmlal() local
154 const bfloat16x8_t vb3 = vld1q_bf16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonbf16_bfmlal() local
H A D3x4c8-minmax-neonfma-zip.c79 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonfma_zip() local
133 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonfma_zip() local
H A D3x4c8-minmax-neonfma-shland.c79 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonfma_shland() local
133 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_3x4c8__neonfma_shland() local
H A D4x4c8-minmax-neonfma-shland.c90 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonfma_shland() local
155 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonfma_shland() local
H A D4x4c8-minmax-neonfma-zip.c90 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonfma_zip() local
155 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_4x4c8__neonfma_zip() local
H A D5x4c8-minmax-neonfma-zip.c101 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonfma_zip() local
177 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonfma_zip() local
H A D5x4c8-minmax-neonfma-shland.c101 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonfma_shland() local
177 const uint16x8_t vb3 = vld1q_u16(w); w += 8; in xnn_bf16_gemm_minmax_ukernel_5x4c8__neonfma_shland() local
/aosp_15_r20/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8conv/
H A D4x4c2-sse2.c138 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)((uintptr_t)w + 24)); in pytorch_q8conv_ukernel_4x4c2__sse2() local
250 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)w); in pytorch_q8conv_ukernel_4x4c2__sse2() local
/aosp_15_r20/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gemm/
H A D4x4c2-dq-sse2.c146 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)((uintptr_t)w + 24)); in pytorch_q8gemm_dq_ukernel_4x4c2__sse2() local
248 const __m128i vb3 = in pytorch_q8gemm_dq_ukernel_4x4c2__sse2() local
H A D4x4c2-sse2.c140 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)((uintptr_t)w + 24)); in pytorch_q8gemm_ukernel_4x4c2__sse2() local
242 const __m128i vb3 = in pytorch_q8gemm_ukernel_4x4c2__sse2() local
H A D2x4c8-sse2.c122 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)b3); in pytorch_q8gemm_ukernel_2x4c8__sse2() local
162 const __m128i vb3 = _mm_loadl_epi64((const __m128i*)b3); in pytorch_q8gemm_ukernel_2x4c8__sse2() local
/aosp_15_r20/external/XNNPACK/src/f32-vbinary/gen/
H A Dvadd-scalar-x4.c41 const float vb3 = b[3]; in xnn_f32_vadd_ukernel__scalar_x4() local

12345678910>>...23