/aosp_15_r20/external/libaom/av1/common/arm/ |
H A D | highbd_convolve_sve2.c | 94 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in convolve12_8_x() local 202 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum[0]), vmovn_s64(sum[2])); in convolve8_8_x() local 271 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in convolve4_4_x() local 533 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_4_y() local 558 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_8_y() local 715 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve4_4_y() local 728 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve4_8_y() local 888 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in convolve12_4_2d_h() local 928 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in convolve12_8_2d_h() local 1037 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum[0]), vmovn_s64(sum[2])); in convolve8_8_2d_h() local [all …]
|
H A D | highbd_compound_convolve_sve2.c | 53 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum[0]), vmovn_s64(sum[2])); in highbd_12_convolve8_8_x() local 119 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum[0]), vmovn_s64(sum[2])); in highbd_convolve8_8_x() local 183 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_12_convolve4_4_x() local 276 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve4_4_x() local 451 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_12_convolve8_4_y() local 472 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_12_convolve8_8_y() local 627 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_4_y() local 648 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_8_y() local 1179 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_4_2d_v() local 1200 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_8_2d_v() local
|
H A D | convolve_neon_i8mm.c | 68 int32x4_t sum0123 = vusmmlaq_s32(horiz_const, perm_samples[0], filter[0]); in convolve12_8_x() local 171 int32x4_t sum0123 = vusdotq_lane_s32(horiz_const, perm_samples[0], filter, 0); in convolve8_8_x() local 244 int32x4_t sum0123 = vusmmlaq_s32(horiz_const, perm_samples[0], filter); in convolve6_8_x() local 423 int32x4_t sum0123 = vusdotq_lane_s32(vdupq_n_s32(0), s0_lo, filters_0_7, 0); in convolve12_8_y() local 613 int32x4_t sum0123 = vusdotq_lane_s32(vdupq_n_s32(0), s0_lo, filters, 0); in convolve8_8_y() local 797 int32x4_t sum0123 = in convolve8_8_2d_h() local 898 int32x4_t sum0123 = in convolve4_8_2d_h() local 1025 int32x4_t sum0123 = vusmmlaq_s32(horiz_const, perm_samples[0], filter); in convolve6_8_2d_h() local
|
H A D | convolve_neon_dotprod.c | 99 int32x4_t sum0123 = vdotq_laneq_s32(acc, perm_samples[0], filter, 0); in convolve12_8_x() local 223 int32x4_t sum0123 = vdotq_lane_s32(acc, perm_samples[0], filters, 0); in convolve4_8_x() local 315 int32x4_t sum0123 = vdotq_lane_s32(acc, perm_samples[0], filter, 0); in convolve8_8_x() local 464 int32x4_t sum0123 = vdotq_lane_s32(acc, s0_lo, filters_0_7, 0); in convolve12_8_y() local 693 int32x4_t sum0123 = vdotq_lane_s32(acc, s0_lo, filters, 0); in convolve8_8_y() local 937 int32x4_t sum0123 = vdotq_laneq_s32(correction, perm_samples[0], filters, 0); in convolve12_8_2d_h() local 1083 int32x4_t sum0123 = vdotq_lane_s32(correction, perm_samples[0], filters, 0); in convolve4_8_2d_h() local 1201 int32x4_t sum0123 = vdotq_lane_s32(correction, perm_samples[0], filters, 0); in convolve8_8_2d_h() local
|
H A D | av1_convolve_scale_neon_i8mm.c | 73 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_8_h() local 208 int32x4_t sum0123 = in convolve8_8_h_scale_2() local
|
H A D | av1_convolve_scale_neon_dotprod.c | 83 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_8_h() local 231 int32x4_t sum0123 = vdotq_lane_s32(horiz_const, perm_samples[0], filters, 0); in convolve8_8_h_scale_2() local
|
H A D | convolve_neon_i8mm.h | 74 int32x4_t sum0123 = vusmmlaq_s32(horiz_const, perm_samples[0], filter[0]); in convolve12_8_2d_h() local
|
H A D | compound_convolve_neon_i8mm.c | 61 int32x4_t sum0123 = vusmmlaq_s32(horiz_const, permuted_samples[0], x_filter); in convolve6_8_2d_h() local 359 int32x4_t sum0123 = vusmmlaq_s32(round_offset, permuted_samples[0], x_filter); in convolve6_8_x() local
|
H A D | resize_neon_i8mm.c | 39 int32x4_t sum0123 = vusmmlaq_s32(vdupq_n_s32(0), perm_samples[0], filters); in scale_2_to_1_filter8_8() local
|
H A D | resize_neon_dotprod.c | 53 int32x4_t sum0123 = vdotq_lane_s32(acc, perm_samples[0], filter, 0); in scale_2_to_1_filter8_8() local
|
/aosp_15_r20/external/libaom/aom_dsp/arm/ |
H A D | aom_scaled_convolve8_neon_i8mm.c | 30 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_4_h() local 53 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_8_h() local 196 int32x4_t sum0123 = vusdotq_lane_s32(vdupq_n_s32(0), s0123[0], filter, 0); in convolve8_8_v() local
|
H A D | aom_scaled_convolve8_neon_dotprod.c | 37 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_4_h() local 69 int32x4_t sum0123 = vpaddq_s32(sum01, sum23); in convolve8_8_h() local 231 int32x4_t sum0123 = vdotq_lane_s32(acc, s0123_128[0], filter, 0); in convolve8_8_v() local
|
H A D | highbd_convolve8_sve.c | 36 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_4_h() local 60 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_8_h() local
|
H A D | aom_convolve8_neon_i8mm.c | 172 int32x4_t sum0123 = vusmmlaq_s32(vdupq_n_s32(0), perm_samples[0], filter); in convolve6_8_h() local
|
/aosp_15_r20/external/libvpx/vpx_dsp/arm/ |
H A D | highbd_vpx_convolve8_sve2.c | 117 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_4_v() local 139 int32x4_t sum0123 = vcombine_s32(vmovn_s64(sum01), vmovn_s64(sum23)); in highbd_convolve8_8_v() local
|
/aosp_15_r20/external/libgav1/src/dsp/arm/ |
H A D | loop_restoration_neon.cc | 806 const uint32x4_t sum0123 = vaddq_u32(sum01, sum23); in Sum5W_32() local 845 const uint16x8_t sum0123 = vaddq_u16(sum01, sum23); in Sum5Horizontal() local
|