Home
last modified time | relevance | path

Searched defs:sum1 (Results 1 – 25 of 138) sorted by relevance

123456

/aosp_15_r20/external/rust/android-crates-io/crates/libz-sys/src/zlib-ng/
Dadler32_p.h15 #define DO1(sum1, sum2, buf, i) {(sum1) += buf[(i)]; (sum2) += (sum1);} argument
16 #define DO2(sum1, sum2, buf, i) {DO1(sum1, sum2, buf, i); DO1(sum1, sum2, buf, i+1);} argument
17 #define DO4(sum1, sum2, buf, i) {DO2(sum1, sum2, buf, i); DO2(sum1, sum2, buf, i+2);} argument
18 #define DO8(sum1, sum2, buf, i) {DO4(sum1, sum2, buf, i); DO4(sum1, sum2, buf, i+4);} argument
19 #define DO16(sum1, sum2, buf) {DO8(sum1, sum2, buf, 0); DO8(sum1, sum2, buf, 8);} argument
/aosp_15_r20/external/libaom/aom_dsp/arm/
H A Daom_convolve8_neon.h84 uint16x8_t sum1 = vmull_u8(s2, f0); in convolve8_horiz_2tap_neon() local
106 uint16x8_t sum1 = vmull_u8(s2, f0); in convolve8_horiz_2tap_neon() local
131 uint16x8_t sum1 = vmull_u8(vget_high_u8(s0), f0); in convolve8_horiz_2tap_neon() local
265 uint16x8_t sum1 = vmull_u8(s2, f0); in convolve8_vert_2tap_neon() local
285 uint16x8_t sum1 = vmull_u8(s1, f0); in convolve8_vert_2tap_neon() local
310 uint16x8_t sum1 = vmull_u8(vget_high_u8(s0), f0); in convolve8_vert_2tap_neon() local
H A Daom_convolve8_neon_dotprod.c90 int32x4_t sum1 = vdotq_lane_s32(acc, perm_samples[1], filters, 0); in convolve8_8_h() local
191 int32x4_t sum1 = vdotq_lane_s32(acc, perm_samples[1], filters, 0); in convolve4_8_h() local
365 int32x4_t sum1 = vdotq_lane_s32(acc, samples1_lo, filters, 0); in convolve8_8_v() local
/aosp_15_r20/external/libaom/aom_dsp/x86/
H A Dhighbd_variance_avx2.c60 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
105 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
154 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
222 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
291 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
343 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
407 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
479 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
556 __m256i sum1 = _mm256_setzero_si256(); in aom_highbd_var_filter_block2d_bil_avx2() local
H A Dsse_sse4.c25 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum_all, 8)); in summary_all_sse4() local
35 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum32, 8)); in summary_32_sse4() local
H A Davg_intrin_sse2.c113 __m128i sum0, sum1, s0, s1, s2, s3, u0; in aom_avg_8x8_sse2() local
138 __m128i sum0, sum1, s0, s1, s2, s3, u0; in calc_avg_8x8_dual_sse2() local
623 const __m128i sum1 = _mm_madd_epi16(abs1, one); in aom_satd_lp_sse2() local
/aosp_15_r20/external/kotlinx.coroutines/kotlinx-coroutines-core/common/test/flow/operators/
H A DDistinctUntilChangedTest.kt26 val sum1 = flow.distinctUntilChanged().map { it.i }.sum() in <lambda>() constant
41 val sum1 = flow.distinctUntilChanged().map { it.i }.sum() in <lambda>() constant
/aosp_15_r20/external/libavc/common/x86/svc/
H A Disvc_resi_trans_quant_sse42.c144 __m128i sum0, sum1, sum2, cmp0, cmp1; in isvc_resi_trans_quant_4x4_sse42() local
444 __m128i sum0, sum1, sum2, cmp0, cmp1; in isvc_resi_trans_quant_4x4_with_res_pred_sse42() local
852 __m128i cmp0, cmp1, sum0, sum1, sum2; in isvc_resi_trans_quant_chroma_4x4_sse42() local
1147 __m128i cmp0, cmp1, sum0, sum1, sum2; in isvc_resi_trans_quant_chroma_4x4_with_res_pred_sse42() local
1528 __m128i cmp0, cmp1, sum0, sum1, sum2; in isvc_hadamard_quant_4x4_sse42() local
1785 __m128i sum0, sum1; in isvc_hadamard_quant_2x2_uv_sse42() local
/aosp_15_r20/external/pytorch/aten/src/ATen/native/cuda/
H A Dgroup_norm_kernel.cu116 T_ACC sum1 = 0; in Compute1dBackwardFusedParamsCUDAKernel() local
162 T_ACC sum1 = 0; in GammaBeta1dBackwardCUDAKernel1() local
243 T_ACC sum1 = g_shared[threadIdx.x][threadIdx.y]; in GammaBeta1dBackwardCUDAKernel2() local
286 T_ACC sum1 = 0; in ComputeInternalGradientsCUDAKernel() local
326 T_ACC sum1 = 0; in ComputeBackwardFusedParamsCUDAKernel() local
372 T_ACC sum1 = 0; in GammaBetaBackwardCUDAKernel1() local
447 T_ACC sum1 = g_shared[threadIdx.x][threadIdx.y]; in GammaBetaBackwardCUDAKernel2() local
/aosp_15_r20/external/libavc/common/x86/
H A Dih264_resi_trans_quant_sse42.c115 __m128i sum0, sum1, sum2, cmp0, cmp1; in ih264_resi_trans_quant_4x4_sse42() local
389 __m128i cmp0, cmp1, sum0, sum1, sum2; in ih264_resi_trans_quant_chroma_4x4_sse42() local
674 __m128i cmp0, cmp1, sum0, sum1, sum2; in ih264_hadamard_quant_4x4_sse42() local
903 __m128i sum0, sum1; in ih264_hadamard_quant_2x2_uv_sse42() local
/aosp_15_r20/external/libaom/av1/common/arm/
H A Dhighbd_convolve_neon.c58 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_0_3, 1); in highbd_convolve6_8_y() local
190 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_0_3, 0); in highbd_convolve8_8_y() local
339 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_0_3, 0); in highbd_convolve12_8_y() local
509 int32x4_t sum1 = offset; in highbd_convolve6_8_x() local
598 int32x4_t sum1 = offset; in highbd_convolve8_8_x() local
734 int32x4_t sum1 = offset; in highbd_convolve12_8_x() local
912 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), y_filter_0_3, 1); in highbd_convolve6_8_2d_v() local
1052 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), y_filter_lo, 0); in highbd_convolve8_8_2d_v() local
1216 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), y_filter_0_3, 0); in highbd_convolve12_8_2d_v() local
1360 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s[0]), x_filter_0_3, 1); in highbd_convolve6_8_2d_h() local
[all …]
H A Dconvolve_neon.h71 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_0_3, 0); in convolve12_8_2d_v() local
240 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_lo, 0); in convolve8_8_2d_v() local
411 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter_lo, 1); in convolve6_8_2d_v() local
559 int32x4_t sum1 = vmull_lane_s16(vget_high_s16(s0), y_filter, 0); in convolve4_8_2d_v() local
H A Dhighbd_compound_convolve_neon.c77 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter_0_3, 1); in highbd_12_convolve6_8() local
103 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter_0_3, 1); in highbd_convolve6_8() local
262 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter_0_3, 0); in highbd_12_convolve8_8() local
292 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter_0_3, 0); in highbd_convolve8_8() local
733 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter, 0); in highbd_12_convolve4_8() local
838 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), filter, 0); in highbd_convolve4_8() local
1296 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), y_filter_0_3, 1); in highbd_convolve6_8_2d_v() local
1423 int32x4_t sum1 = vmlal_lane_s16(offset, vget_high_s16(s0), y_filter_0_3, 0); in highbd_convolve8_8_2d_v() local
H A Dhighbd_convolve_neon.h71 const int32x4_t offset, int32x4_t *sum0, int32x4_t *sum1) { in highbd_convolve8_8_s32()
102 int32x4_t sum1; in highbd_convolve8_8_srsub_s32_s16() local
/aosp_15_r20/external/rust/android-crates-io/crates/libz-sys/src/zlib-ng/arch/x86/
Dadler32_avx512_p.h16 __m128i sum1 = _mm_unpackhi_epi64(c_plus_d, c_plus_d); in _mm512_reduce_add_epu32() local
39 __m128i sum1 = _mm_add_epi32(_mm256_extracti128_si256(non_zero_avx, 1), in partial_hsum() local
/aosp_15_r20/external/webp/src/dsp/
H A Dssim_sse2.c37 const __m128i sum1 = _mm_madd_epi16(C0, C0); in SubtractAndSquare_SSE2() local
52 __m128i sum1; in AccumulateSSE_SSE2() local
/aosp_15_r20/external/tensorflow/tensorflow/lite/kernels/internal/optimized/
H A Ddepthwiseconv_3x3_filter_common.h149 int32x4_t sum1 = vpaddlq_s16(vmull_s8(vget_high_s8(lhs), vget_high_s8(rhs))); in vdotq_s32() local
171 int32x4_t sum1 = vpaddlq_s16(vmull_s8(vget_high_s8(lhs), lane_rhs)); in vdotq_four_lane_s32() local
/aosp_15_r20/external/libvpx/vpx_dsp/x86/
H A Dconvolve_avx2.h61 __m256i sum1, sum2; in convolve8_16_avx2() local
88 __m128i sum1, sum2; in convolve8_8_avx2() local
H A Dsse_sse4.c24 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum_all, 8)); in summary_all_sse4() local
34 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum32, 8)); in summary_32_sse4() local
/aosp_15_r20/external/flatbuffers/tests/FlatBuffers.Test.Swift.Wasm/Tests/FlatBuffers.Test.Swift.WasmTests/
H A DFlatBuffersMonsterWriterTests.swift272 var sum1 = 0 in readFlatbufferMonster() variable
339 var sum1 = 0 in readObjectApi() variable
/aosp_15_r20/external/flatbuffers/tests/FlatBuffers.Test.Swift/Tests/FlatBuffers.Test.SwiftTests/
H A DFlatBuffersMonsterWriterTests.swift298 var sum1 = 0 in readFlatbufferMonster() variable
365 var sum1 = 0 in readObjectApi() variable
/aosp_15_r20/external/libaom/av1/common/x86/
H A Dselfguided_sse4.c147 static __m128i compute_p(__m128i sum1, __m128i sum2, int bit_depth, int n) { in compute_p()
196 __m128i sum1 = boxsum_from_ii(Dij, buf_stride, r); in calc_ab() local
337 __m128i sum1 = boxsum_from_ii(Dij, buf_stride, r); in calc_ab_fast() local
/aosp_15_r20/external/libvpx/vpx_dsp/arm/
H A Dfdct_neon.h110 const int32x4_t sum1 = vmlal_n_s16(a1, vget_high_s16(b), constant); in butterfly_one_coeff_s16_s32() local
400 const int32x4_t sum1 = vmlal_n_s16(a2, vget_high_s16(b), constant2); in butterfly_two_coeff() local
425 const int32x4_t sum1 = vmlaq_n_s32(a2, b_hi, constant2); in butterfly_two_coeff_s32() local
H A Dloopfilter_neon.c186 uint16x8_t *sum1) { in filter_update_16()
208 const uint8x16_t add1, uint16x8_t *sum0, uint16x8_t *sum1) { in calc_7_tap_filter_16_kernel()
224 uint16x8_t *sum0, uint16x8_t *sum1) { in apply_15_tap_filter_16_kernel()
260 uint16x8_t sum0, sum1; in calc_7_tap_filter_16() local
355 uint16x8_t sum0, sum1; in apply_15_tap_filter_16() local
/aosp_15_r20/external/libaom/aom_dsp/flow_estimation/x86/
H A Ddisflow_sse4.c171 __m128i sum1 = _mm_add_epi32(_mm_madd_epi16(px2, h_kernel_01), in compute_flow_vector() local
210 __m128i sum1 = _mm_add_epi32( in compute_flow_vector() local

123456