xref: /aosp_15_r20/external/libopus/celt/fixed_generic.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
/* Copyright (C) 2007-2009 Xiph.Org Foundation
   Copyright (C) 2003-2008 Jean-Marc Valin
   Copyright (C) 2007-2008 CSIRO */
/**
   @file fixed_generic.h
   @brief Generic fixed-point operations
*/
/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
32*a58d3d2aSXin Li 
33*a58d3d2aSXin Li #ifndef FIXED_GENERIC_H
34*a58d3d2aSXin Li #define FIXED_GENERIC_H
35*a58d3d2aSXin Li 
/** Multiply a 16-bit signed value by a 16-bit unsigned value.
    a is narrowed to opus_val16 and b to opus_uint16 before each is widened
    to opus_val32, so the product is a 32-bit signed value. */
#define MULT16_16SU(a,b) ((opus_val32)(opus_val16)(a)*(opus_val32)(opus_uint16)(b))
38*a58d3d2aSXin Li 
/** 16x32 multiplication, followed by a 16-bit shift right. Result fits in 32 bits.
    With OPUS_FAST_INT64 the product is formed in 64 bits and shifted once.
    Otherwise b is split into its upper part (b>>16) and its low 16 bits, and
    the two partial products are combined with 32-bit arithmetic. */
#if OPUS_FAST_INT64
#define MULT16_32_Q16(a,b) ((opus_val32)SHR((opus_int64)((opus_val16)(a))*(b),16))
#else
#define MULT16_32_Q16(a,b) ADD32(MULT16_16((a),SHR((b),16)), SHR(MULT16_16SU((a),((b)&0x0000ffff)),16))
#endif
45*a58d3d2aSXin Li 
/** 16x32 multiplication, followed by a 16-bit shift right (round-to-nearest).
    Result fits in 32 bits.
    Same structure as a plain 16-bit-shift multiply, except that the final
    shift goes through PSHR, which adds half of the shifted-out range first. */
#if OPUS_FAST_INT64
#define MULT16_32_P16(a,b) ((opus_val32)PSHR((opus_int64)((opus_val16)(a))*(b),16))
#else
#define MULT16_32_P16(a,b) ADD32(MULT16_16((a),SHR((b),16)), PSHR(MULT16_16SU((a),((b)&0x0000ffff)),16))
#endif
52*a58d3d2aSXin Li 
/** 16x32 multiplication, followed by a 15-bit shift right. Result fits in 32 bits.
    Without OPUS_FAST_INT64, b is split at bit 16: the upper partial product is
    doubled (shift left by 1) and the low-half product is shifted right by 15,
    so both terms land on the same Q15 scale before they are added. */
#if OPUS_FAST_INT64
#define MULT16_32_Q15(a,b) ((opus_val32)SHR((opus_int64)((opus_val16)(a))*(b),15))
#else
#define MULT16_32_Q15(a,b) ADD32(SHL(MULT16_16((a),SHR((b),16)),1), SHR(MULT16_16SU((a),((b)&0x0000ffff)),15))
#endif
59*a58d3d2aSXin Li 
/** 32x32 multiplication, followed by a 16-bit shift right. Result fits in 32 bits.
    Without OPUS_FAST_INT64 the product is assembled from four 16x16 partial
    products: low*low (unsigned, shifted right by 16), the two high*low cross
    terms, and high*high (shifted left by 16). */
#if OPUS_FAST_INT64
#define MULT32_32_Q16(a,b) ((opus_val32)SHR((opus_int64)(a)*(opus_int64)(b),16))
#else
#define MULT32_32_Q16(a,b) (ADD32(ADD32(ADD32( \
      (opus_val32)(SHR32(((opus_uint32)((a)&0x0000ffff)*(opus_uint32)((b)&0x0000ffff)),16)), \
      MULT16_16SU(SHR32(a,16),((b)&0x0000ffff))), \
      MULT16_16SU(SHR32(b,16),((a)&0x0000ffff))), \
      SHL32(MULT16_16(SHR32(a,16),SHR32(b,16)),16)))
#endif
66*a58d3d2aSXin Li 
/** 32x32 multiplication, followed by a 31-bit shift right. Result fits in 32 bits.
    Without OPUS_FAST_INT64 only three partial products are summed (high*high
    and the two high*low cross terms); there is no low*low term and each cross
    term is shifted separately, so this path can differ from the 64-bit one in
    the least significant bits. */
#if OPUS_FAST_INT64
#define MULT32_32_Q31(a,b) ((opus_val32)SHR((opus_int64)(a)*(opus_int64)(b),31))
#else
#define MULT32_32_Q31(a,b) ADD32(ADD32(SHL(MULT16_16(SHR((a),16),SHR((b),16)),1), SHR(MULT16_16SU(SHR((a),16),((b)&0x0000ffff)),15)), SHR(MULT16_16SU(SHR((b),16),((a)&0x0000ffff)),15))
#endif
73*a58d3d2aSXin Li 
/** Compile-time conversion of float constant to 16-bit value.
    x is scaled by 2^bits and .5 is added before the truncating cast, which
    rounds to nearest for non-negative x. For negative x the cast truncates
    toward zero after the .5 has been added. */
#define QCONST16(x,bits) ((opus_val16)(.5+(x)*(((opus_val32)1)<<(bits))))

/** Compile-time conversion of float constant to 32-bit value.
    Same scaling and rounding as QCONST16, with a 32-bit result. */
#define QCONST32(x,bits) ((opus_val32)(.5+(x)*(((opus_val32)1)<<(bits))))
79*a58d3d2aSXin Li 
/** Negate a 16-bit value (plain unary minus, no narrowing cast) */
#define NEG16(x) (-(x))
/** Negate a 32-bit value (plain unary minus) */
#define NEG32(x) (-(x))
84*a58d3d2aSXin Li 
/** Change a 32-bit value into a 16-bit value by a plain cast. The value is
    assumed to fit in 16 bits, otherwise the result is undefined */
#define EXTRACT16(x) ((opus_val16)(x))
/** Change a 16-bit value into a 32-bit value by a plain cast */
#define EXTEND32(x) ((opus_val32)(x))
89*a58d3d2aSXin Li 
/** Arithmetic shift-right of a 16-bit value */
#define SHR16(a,shift) ((a) >> (shift))
/** Arithmetic shift-left of a 16-bit value.
    The shift is done on the value cast to opus_uint16 and the result is cast
    back to opus_int16, so no signed operand is ever left-shifted. */
#define SHL16(a,shift) ((opus_int16)((opus_uint16)(a)<<(shift)))
/** Arithmetic shift-right of a 32-bit value */
#define SHR32(a,shift) ((a) >> (shift))
/** Arithmetic shift-left of a 32-bit value.
    The shift is done on the value cast to opus_uint32 and the result is cast
    back to opus_int32, so no signed operand is ever left-shifted. */
#define SHL32(a,shift) ((opus_int32)((opus_uint32)(a)<<(shift)))
98*a58d3d2aSXin Li 
/** 32-bit arithmetic shift right with rounding-to-nearest instead of rounding down.
    Half of the shifted-out range, (1<<shift)>>1, is added before the shift;
    for shift == 0 that bias is 0 and the value is returned unchanged. */
#define PSHR32(a,shift) (SHR32((a)+((EXTEND32(1)<<((shift))>>1)),shift))
/** 32-bit arithmetic shift right where the shift amount can be negative.
    A positive shift goes right; zero or a negative shift goes left by -shift. */
#define VSHR32(a, shift) (((shift)>0) ? SHR32(a, shift) : SHL32(a, -(shift)))
103*a58d3d2aSXin Li 
/** "RAW" macros, should not be used outside of this header file.
    SHR and PSHR do not cast their operand, so they work at whatever width the
    operand has (the 64-bit multiply paths in this header rely on that).
    SHL forwards to SHL32. */
#define SHR(a,shift) ((a) >> (shift))
#define SHL(a,shift) SHL32(a,shift)
#define PSHR(a,shift) (SHR((a)+((EXTEND32(1)<<((shift))>>1)),shift))
/** Clamp x to the symmetric range [-a, a]. Arguments are evaluated more than once. */
#define SATURATE(x,a) (((x)>(a) ? (a) : (x)<-(a) ? -(a) : (x)))

/** Clamp x to [-32768, 32767] and narrow it to 16 bits. x is evaluated more than once. */
#define SATURATE16(x) (EXTRACT16((x)>32767 ? 32767 : (x)<-32768 ? -32768 : (x)))
111*a58d3d2aSXin Li 
/** Shift by a and round-to-nearest 32-bit value. Result is a 16-bit value */
#define ROUND16(x,a) (EXTRACT16(PSHR32((x),(a))))
/** Shift by a and round-to-nearest 32-bit value. Result is a saturated 16-bit value.
    Saturation is symmetric: the rounded value is clamped to [-32767, 32767].
    The expansion is a single parenthesized expression with no trailing
    semicolon, so it can be used inside larger expressions and before `else`. */
#define SROUND16(x,a) (EXTRACT16(SATURATE(PSHR32(x,a), 32767)))
116*a58d3d2aSXin Li 
/** Divide by two, implemented as a right shift by one bit.
    HALF16 goes through SHR16 and HALF32 through SHR32. */
#define HALF16(x)  (SHR16(x,1))
#define HALF32(x)  (SHR32(x,1))
120*a58d3d2aSXin Li 
/** Add two 16-bit values. The sum is cast back to opus_val16. */
#define ADD16(a,b) ((opus_val16)((opus_val16)(a)+(opus_val16)(b)))
/** Subtract two 16-bit values. Both operands are cast to opus_val16, but
    unlike ADD16 the difference itself is not cast back to 16 bits. */
#define SUB16(a,b) ((opus_val16)(a)-(opus_val16)(b))
/** Add two 32-bit values */
#define ADD32(a,b) ((opus_val32)(a)+(opus_val32)(b))
/** Subtract two 32-bit values */
#define SUB32(a,b) ((opus_val32)(a)-(opus_val32)(b))
129*a58d3d2aSXin Li 
/** Add two 32-bit values, ignore any overflows.
    The addition is done on opus_uint32 and the result is cast back to opus_val32. */
#define ADD32_ovflw(a,b) ((opus_val32)((opus_uint32)(a)+(opus_uint32)(b)))
/** Subtract two 32-bit values, ignore any overflows.
    The subtraction is done on opus_uint32 and the result is cast back to opus_val32. */
#define SUB32_ovflw(a,b) ((opus_val32)((opus_uint32)(a)-(opus_uint32)(b)))
/** Negate 32-bit value, ignore any overflows.
    Written as 0-x rather than -x to avoid MSVC warning C4146 (unary minus
    operator applied to unsigned type). */
#define NEG32_ovflw(a) ((opus_val32)(0-(opus_uint32)(a)))
137*a58d3d2aSXin Li 
/** 16x16 multiplication where the result fits in 16 bits.
    Both operands are cast to opus_val16; the product is not cast back. */
#define MULT16_16_16(a,b)     ((((opus_val16)(a))*((opus_val16)(b))))

/** 32x32 multiplication where the result fits in 32 bits */
#define MULT32_32_32(a,b)     ((((opus_val32)(a))*((opus_val32)(b))))

/** 16x16 multiplication where the result fits in 32 bits.
    The (opus_val32)(opus_val16) double cast gives the TI compiler a hint
    that this is a 16x16->32 multiply. */
#define MULT16_16(a,b)     (((opus_val32)(opus_val16)(a))*((opus_val32)(opus_val16)(b)))
147*a58d3d2aSXin Li 
/** 16x16 multiply-add where the result fits in 32 bits: c + a*b */
#define MAC16_16(c,a,b) (ADD32((c),MULT16_16((a),(b))))
/** 16x32 multiply, followed by a 15-bit shift right and 32-bit add.
    b is split at bit 15 (b>>15 and b&0x7fff) and both halves go through the
    signed 16x16 multiply.
    b must fit in 31 bits.
    Result fits in 32 bits. */
#define MAC16_32_Q15(c,a,b) ADD32((c),ADD32(MULT16_16((a),SHR((b),15)), SHR(MULT16_16((a),((b)&0x00007fff)),15)))

/** 16x32 multiplication, followed by a 16-bit shift right and 32-bit add.
    b is split at bit 16; the low half is multiplied as an unsigned value.
    Result fits in 32 bits */
#define MAC16_32_Q16(c,a,b) ADD32((c),ADD32(MULT16_16((a),SHR((b),16)), SHR(MULT16_16SU((a),((b)&0x0000ffff)),16)))
158*a58d3d2aSXin Li 
/** 16x16 multiplication followed by a right shift of 11, 13, 14 or 15 bits
    (the number after Q). MULT16_16_Q11_32 and MULT16_16_Q11 expand to the
    same expression. */
#define MULT16_16_Q11_32(a,b) (SHR(MULT16_16((a),(b)),11))
#define MULT16_16_Q11(a,b) (SHR(MULT16_16((a),(b)),11))
#define MULT16_16_Q13(a,b) (SHR(MULT16_16((a),(b)),13))
#define MULT16_16_Q14(a,b) (SHR(MULT16_16((a),(b)),14))
#define MULT16_16_Q15(a,b) (SHR(MULT16_16((a),(b)),15))

/** Same as the Q variants, but half of the shifted-out range (4096, 8192 or
    16384) is added to the product first, so the result is rounded to nearest. */
#define MULT16_16_P13(a,b) (SHR(ADD32(4096,MULT16_16((a),(b))),13))
#define MULT16_16_P14(a,b) (SHR(ADD32(8192,MULT16_16((a),(b))),14))
#define MULT16_16_P15(a,b) (SHR(ADD32(16384,MULT16_16((a),(b))),15))
168*a58d3d2aSXin Li 
/** Divide a 32-bit value by a 16-bit value. Result fits in 16 bits.
    The quotient is cast to opus_val16. This is plain C integer division,
    so it truncates toward zero and b must not be zero. */
#define DIV32_16(a,b) ((opus_val16)(((opus_val32)(a))/((opus_val16)(b))))

/** Divide a 32-bit value by a 32-bit value. Result fits in 32 bits.
    Plain C integer division: truncates toward zero, b must not be zero. */
#define DIV32(a,b) (((opus_val32)(a))/((opus_val32)(b)))
174*a58d3d2aSXin Li 
175*a58d3d2aSXin Li #if defined(MIPSr1_ASM)
176*a58d3d2aSXin Li #include "mips/fixed_generic_mipsr1.h"
177*a58d3d2aSXin Li #endif
178*a58d3d2aSXin Li 
SIG2WORD16_generic(celt_sig x)179*a58d3d2aSXin Li static OPUS_INLINE opus_val16 SIG2WORD16_generic(celt_sig x)
180*a58d3d2aSXin Li {
181*a58d3d2aSXin Li    x = PSHR32(x, SIG_SHIFT);
182*a58d3d2aSXin Li    x = MAX32(x, -32768);
183*a58d3d2aSXin Li    x = MIN32(x, 32767);
184*a58d3d2aSXin Li    return EXTRACT16(x);
185*a58d3d2aSXin Li }
186*a58d3d2aSXin Li #define SIG2WORD16(x) (SIG2WORD16_generic(x))
187*a58d3d2aSXin Li 
188*a58d3d2aSXin Li #endif
189