/aosp_15_r20/external/XNNPACK/src/amalgam/ |
H A D | sse41.c | 427 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->sse4.output_zero_point); in xnn_f32_qs8_vcvt_ukernel__sse41_x32() local 1442 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x25__sse41_mul16() local 1752 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x25__sse41_mul16() local 1875 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse41_mul16() local 1943 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse41_mul16() local 2168 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul16() local 2302 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul16() local 2406 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_1x4c8__sse41_ld64() local 2560 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_3x4c8__sse41_ld64() local 2692 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld64() local [all …]
|
H A D | avx2.c | 1602 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->avx2.output_zero_poi… in xnn_f32_qs8_vcvt_ukernel__avx2_x64() local 1728 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->avx2.output_zero_poi… in xnn_f32_qu8_vcvt_ukernel__avx2_x64() local 2670 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul32() local 2847 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul32() local 2968 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx2_mul32() local 3013 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx2_mul32() local 3218 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local 3299 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local 3421 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_gemm_minmax_fp32_ukernel_1x8c8__avx2() local 3603 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_gemm_minmax_fp32_ukernel_3x8c8__avx2() local [all …]
|
H A D | avx512skx.c | 100 const __m512i voutput_zero_point = _mm512_load_si512(params->avx512.output_zero_point); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x128() local 218 const __m512i voutput_zero_point = _mm512_load_si512(params->avx512.output_zero_point); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x128() local 339 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 945 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x3__avx512skx_mul32() local 1111 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx512skx_mul32() local 1408 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx512.output_z… in xnn_qc8_gemm_minmax_fp32_ukernel_1x16c8__avx512skx() local 1525 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qc8_gemm_minmax_fp32_ukernel_4x16c8__avx512skx() local 1693 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx512.output_z… in xnn_qc8_igemm_minmax_fp32_ukernel_1x16c8__avx512skx() local 1815 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qc8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx() local 1991 const __m512i voutput_zero_point = _mm512_load_si512(params->fp32_avx512.output_zero_point); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local [all …]
|
H A D | ssse3.c | 247 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->ssse3.output_zero_point… in xnn_qs8_vcvt_ukernel__ssse3_x32() local 362 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->sse2.output_zero_point); in xnn_qs8_vlrelu_ukernel__ssse3_x32() local 500 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->ssse3.output_zero_point… in xnn_qu8_vcvt_ukernel__ssse3_x32() local 612 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->sse2.output_zero_point); in xnn_qu8_vlrelu_ukernel__ssse3_x32() local
|
H A D | avx.c | 2295 const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->avx.output_zero_point); in xnn_f32_qs8_vcvt_ukernel__avx_x32() local 2401 const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->avx.output_zero_point); in xnn_f32_qu8_vcvt_ukernel__avx_x32() local 5368 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx_mul16_add16() local 5683 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx_mul16_add16() local 5842 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx_mul16_add16() local 5915 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx_mul16_add16() local 6206 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx_mul16_add16() local 6345 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx_mul16_add16() local 6452 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_1x4c8__avx_ld128() local 6578 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_2x4c8__avx_ld128() local [all …]
|
H A D | sse2.c | 1364 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->sse2.output_zero_point); in xnn_f32_qs8_vcvt_ukernel__sse2_x32() local 1501 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->sse2.output_zero_point); in xnn_f32_qu8_vcvt_ukernel__sse2_x32() local 3181 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x25__sse2_mul16() local 3516 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x25__sse2_mul16() local 3642 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse2_mul16() local 3713 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse2_mul16() local 3947 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse2_mul16() local 4090 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse2_mul16() local 4194 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_1x4c8__sse2_ld64() local 4349 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_gemm_minmax_fp32_ukernel_3x4c8__sse2_ld64() local [all …]
|
/aosp_15_r20/external/XNNPACK/src/qc8-dwconv/gen/ |
H A D | up16x3-minmax-fp32-avx2-mul32.c | 103 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx2_mul32() local 148 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx2_mul32() local
|
H A D | up8x3-minmax-fp32-sse41-mul16.c | 112 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse41_mul16() local 180 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse41_mul16() local
|
H A D | up8x9-minmax-fp32-avx2-mul32.c | 154 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local 223 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local
|
H A D | up8x3-minmax-fp32-sse2-mul16.c | 115 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse2_mul16() local 186 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x3__sse2_mul16() local
|
H A D | up16x3-minmax-fp32-avx-mul16-add16.c | 141 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx_mul16_add16() local 214 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__avx_mul16_add16() local
|
H A D | up16x3-minmax-fp32-xop-mul16-add16.c | 146 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__xop_mul16_add16() local 219 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x3__xop_mul16_add16() local
|
H A D | up8x9-minmax-fp32-avx-mul32.c | 188 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local 259 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local
|
H A D | up8x9-minmax-fp32-sse41-mul32.c | 188 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local 259 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local
|
H A D | up16x9-minmax-fp32-avx2-mul32.c | 187 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local 268 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local
|
H A D | up8x9-minmax-fp32-xop-mul32.c | 193 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local 264 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qc8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local
|
/aosp_15_r20/external/XNNPACK/src/qu8-dwconv/gen/ |
H A D | up8x9-minmax-fp32-avx2-mul32.c | 154 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local 222 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local
|
H A D | up16x9-minmax-fp32-avx2-mul32.c | 186 …const __m256i voutput_zero_point = _mm256_load_si256((const __m256i*) params->fp32_avx2.output_zer… in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local 266 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x9__avx2_mul32() local
|
H A D | up8x9-minmax-fp32-xop-mul32.c | 192 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local 262 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local
|
H A D | up8x9-minmax-fp32-sse41-mul32.c | 187 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local 257 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local
|
H A D | up8x9-minmax-fp32-avx-mul32.c | 187 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local 257 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse2.output_zero_p… in xnn_qu8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local
|
/aosp_15_r20/external/XNNPACK/src/qs8-dwconv/gen/ |
H A D | up8x9-minmax-fp32-avx2-mul32.c | 153 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local 221 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_avx2.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__avx2_mul32() local
|
H A D | up8x9-minmax-fp32-avx-mul32.c | 186 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local 256 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__avx_mul32() local
|
H A D | up8x9-minmax-fp32-sse41-mul32.c | 186 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local 256 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__sse41_mul32() local
|
H A D | up8x9-minmax-fp32-xop-mul32.c | 191 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local 261 …const __m128i voutput_zero_point = _mm_load_si128((const __m128i*) params->fp32_sse4.output_zero_p… in xnn_qs8_dwconv_minmax_fp32_ukernel_up8x9__xop_mul32() local
|