xref: /aosp_15_r20/external/libvpx/vpx_dsp/x86/quantize_ssse3.h (revision fb1b10ab9aebc7c7068eedab379b749d7e3900be)
/*
 *  Copyright (c) 2017 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10*fb1b10abSAndroid Build Coastguard Worker 
11*fb1b10abSAndroid Build Coastguard Worker #ifndef VPX_VPX_DSP_X86_QUANTIZE_SSSE3_H_
12*fb1b10abSAndroid Build Coastguard Worker #define VPX_VPX_DSP_X86_QUANTIZE_SSSE3_H_
13*fb1b10abSAndroid Build Coastguard Worker 
14*fb1b10abSAndroid Build Coastguard Worker #include <emmintrin.h>
15*fb1b10abSAndroid Build Coastguard Worker 
16*fb1b10abSAndroid Build Coastguard Worker #include "./vpx_config.h"
17*fb1b10abSAndroid Build Coastguard Worker #include "vpx/vpx_integer.h"
18*fb1b10abSAndroid Build Coastguard Worker #include "vpx_dsp/x86/quantize_sse2.h"
19*fb1b10abSAndroid Build Coastguard Worker 
calculate_dqcoeff_and_store_32x32(const __m128i qcoeff,const __m128i dequant,const __m128i zero,tran_low_t * dqcoeff)20*fb1b10abSAndroid Build Coastguard Worker static INLINE void calculate_dqcoeff_and_store_32x32(const __m128i qcoeff,
21*fb1b10abSAndroid Build Coastguard Worker                                                      const __m128i dequant,
22*fb1b10abSAndroid Build Coastguard Worker                                                      const __m128i zero,
23*fb1b10abSAndroid Build Coastguard Worker                                                      tran_low_t *dqcoeff) {
24*fb1b10abSAndroid Build Coastguard Worker   // Un-sign to bias rounding like C.
25*fb1b10abSAndroid Build Coastguard Worker   const __m128i coeff = _mm_abs_epi16(qcoeff);
26*fb1b10abSAndroid Build Coastguard Worker 
27*fb1b10abSAndroid Build Coastguard Worker   const __m128i sign_0 = _mm_unpacklo_epi16(zero, qcoeff);
28*fb1b10abSAndroid Build Coastguard Worker   const __m128i sign_1 = _mm_unpackhi_epi16(zero, qcoeff);
29*fb1b10abSAndroid Build Coastguard Worker 
30*fb1b10abSAndroid Build Coastguard Worker   const __m128i low = _mm_mullo_epi16(coeff, dequant);
31*fb1b10abSAndroid Build Coastguard Worker   const __m128i high = _mm_mulhi_epi16(coeff, dequant);
32*fb1b10abSAndroid Build Coastguard Worker   __m128i dqcoeff32_0 = _mm_unpacklo_epi16(low, high);
33*fb1b10abSAndroid Build Coastguard Worker   __m128i dqcoeff32_1 = _mm_unpackhi_epi16(low, high);
34*fb1b10abSAndroid Build Coastguard Worker 
35*fb1b10abSAndroid Build Coastguard Worker   // "Divide" by 2.
36*fb1b10abSAndroid Build Coastguard Worker   dqcoeff32_0 = _mm_srli_epi32(dqcoeff32_0, 1);
37*fb1b10abSAndroid Build Coastguard Worker   dqcoeff32_1 = _mm_srli_epi32(dqcoeff32_1, 1);
38*fb1b10abSAndroid Build Coastguard Worker 
39*fb1b10abSAndroid Build Coastguard Worker   dqcoeff32_0 = _mm_sign_epi32(dqcoeff32_0, sign_0);
40*fb1b10abSAndroid Build Coastguard Worker   dqcoeff32_1 = _mm_sign_epi32(dqcoeff32_1, sign_1);
41*fb1b10abSAndroid Build Coastguard Worker 
42*fb1b10abSAndroid Build Coastguard Worker #if CONFIG_VP9_HIGHBITDEPTH
43*fb1b10abSAndroid Build Coastguard Worker   _mm_store_si128((__m128i *)(dqcoeff), dqcoeff32_0);
44*fb1b10abSAndroid Build Coastguard Worker   _mm_store_si128((__m128i *)(dqcoeff + 4), dqcoeff32_1);
45*fb1b10abSAndroid Build Coastguard Worker #else
46*fb1b10abSAndroid Build Coastguard Worker   _mm_store_si128((__m128i *)(dqcoeff),
47*fb1b10abSAndroid Build Coastguard Worker                   _mm_packs_epi32(dqcoeff32_0, dqcoeff32_1));
48*fb1b10abSAndroid Build Coastguard Worker #endif  // CONFIG_VP9_HIGHBITDEPTH
49*fb1b10abSAndroid Build Coastguard Worker }
50*fb1b10abSAndroid Build Coastguard Worker 
51*fb1b10abSAndroid Build Coastguard Worker #endif  // VPX_VPX_DSP_X86_QUANTIZE_SSSE3_H_
52