1*c0909341SAndroid Build Coastguard Worker /*
2*c0909341SAndroid Build Coastguard Worker * Copyright © 2018-2021, VideoLAN and dav1d authors
3*c0909341SAndroid Build Coastguard Worker * Copyright © 2018, Two Orioles, LLC
4*c0909341SAndroid Build Coastguard Worker * All rights reserved.
5*c0909341SAndroid Build Coastguard Worker *
6*c0909341SAndroid Build Coastguard Worker * Redistribution and use in source and binary forms, with or without
7*c0909341SAndroid Build Coastguard Worker * modification, are permitted provided that the following conditions are met:
8*c0909341SAndroid Build Coastguard Worker *
9*c0909341SAndroid Build Coastguard Worker * 1. Redistributions of source code must retain the above copyright notice, this
10*c0909341SAndroid Build Coastguard Worker * list of conditions and the following disclaimer.
11*c0909341SAndroid Build Coastguard Worker *
12*c0909341SAndroid Build Coastguard Worker * 2. Redistributions in binary form must reproduce the above copyright notice,
13*c0909341SAndroid Build Coastguard Worker * this list of conditions and the following disclaimer in the documentation
14*c0909341SAndroid Build Coastguard Worker * and/or other materials provided with the distribution.
15*c0909341SAndroid Build Coastguard Worker *
16*c0909341SAndroid Build Coastguard Worker * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17*c0909341SAndroid Build Coastguard Worker * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18*c0909341SAndroid Build Coastguard Worker * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19*c0909341SAndroid Build Coastguard Worker * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
20*c0909341SAndroid Build Coastguard Worker * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21*c0909341SAndroid Build Coastguard Worker * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22*c0909341SAndroid Build Coastguard Worker * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23*c0909341SAndroid Build Coastguard Worker * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24*c0909341SAndroid Build Coastguard Worker * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*c0909341SAndroid Build Coastguard Worker * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*c0909341SAndroid Build Coastguard Worker */
27*c0909341SAndroid Build Coastguard Worker
28*c0909341SAndroid Build Coastguard Worker #include "config.h"
29*c0909341SAndroid Build Coastguard Worker
30*c0909341SAndroid Build Coastguard Worker #include <errno.h>
31*c0909341SAndroid Build Coastguard Worker #include <limits.h>
32*c0909341SAndroid Build Coastguard Worker #include <string.h>
33*c0909341SAndroid Build Coastguard Worker #include <stdio.h>
34*c0909341SAndroid Build Coastguard Worker #include <inttypes.h>
35*c0909341SAndroid Build Coastguard Worker
36*c0909341SAndroid Build Coastguard Worker #include "dav1d/data.h"
37*c0909341SAndroid Build Coastguard Worker
38*c0909341SAndroid Build Coastguard Worker #include "common/frame.h"
39*c0909341SAndroid Build Coastguard Worker #include "common/intops.h"
40*c0909341SAndroid Build Coastguard Worker
41*c0909341SAndroid Build Coastguard Worker #include "src/ctx.h"
42*c0909341SAndroid Build Coastguard Worker #include "src/decode.h"
43*c0909341SAndroid Build Coastguard Worker #include "src/dequant_tables.h"
44*c0909341SAndroid Build Coastguard Worker #include "src/env.h"
45*c0909341SAndroid Build Coastguard Worker #include "src/filmgrain.h"
46*c0909341SAndroid Build Coastguard Worker #include "src/log.h"
47*c0909341SAndroid Build Coastguard Worker #include "src/qm.h"
48*c0909341SAndroid Build Coastguard Worker #include "src/recon.h"
49*c0909341SAndroid Build Coastguard Worker #include "src/ref.h"
50*c0909341SAndroid Build Coastguard Worker #include "src/tables.h"
51*c0909341SAndroid Build Coastguard Worker #include "src/thread_task.h"
52*c0909341SAndroid Build Coastguard Worker #include "src/warpmv.h"
53*c0909341SAndroid Build Coastguard Worker
init_quant_tables(const Dav1dSequenceHeader * const seq_hdr,const Dav1dFrameHeader * const frame_hdr,const int qidx,uint16_t (* dq)[3][2])54*c0909341SAndroid Build Coastguard Worker static void init_quant_tables(const Dav1dSequenceHeader *const seq_hdr,
55*c0909341SAndroid Build Coastguard Worker const Dav1dFrameHeader *const frame_hdr,
56*c0909341SAndroid Build Coastguard Worker const int qidx, uint16_t (*dq)[3][2])
57*c0909341SAndroid Build Coastguard Worker {
58*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < (frame_hdr->segmentation.enabled ? 8 : 1); i++) {
59*c0909341SAndroid Build Coastguard Worker const int yac = frame_hdr->segmentation.enabled ?
60*c0909341SAndroid Build Coastguard Worker iclip_u8(qidx + frame_hdr->segmentation.seg_data.d[i].delta_q) : qidx;
61*c0909341SAndroid Build Coastguard Worker const int ydc = iclip_u8(yac + frame_hdr->quant.ydc_delta);
62*c0909341SAndroid Build Coastguard Worker const int uac = iclip_u8(yac + frame_hdr->quant.uac_delta);
63*c0909341SAndroid Build Coastguard Worker const int udc = iclip_u8(yac + frame_hdr->quant.udc_delta);
64*c0909341SAndroid Build Coastguard Worker const int vac = iclip_u8(yac + frame_hdr->quant.vac_delta);
65*c0909341SAndroid Build Coastguard Worker const int vdc = iclip_u8(yac + frame_hdr->quant.vdc_delta);
66*c0909341SAndroid Build Coastguard Worker
67*c0909341SAndroid Build Coastguard Worker dq[i][0][0] = dav1d_dq_tbl[seq_hdr->hbd][ydc][0];
68*c0909341SAndroid Build Coastguard Worker dq[i][0][1] = dav1d_dq_tbl[seq_hdr->hbd][yac][1];
69*c0909341SAndroid Build Coastguard Worker dq[i][1][0] = dav1d_dq_tbl[seq_hdr->hbd][udc][0];
70*c0909341SAndroid Build Coastguard Worker dq[i][1][1] = dav1d_dq_tbl[seq_hdr->hbd][uac][1];
71*c0909341SAndroid Build Coastguard Worker dq[i][2][0] = dav1d_dq_tbl[seq_hdr->hbd][vdc][0];
72*c0909341SAndroid Build Coastguard Worker dq[i][2][1] = dav1d_dq_tbl[seq_hdr->hbd][vac][1];
73*c0909341SAndroid Build Coastguard Worker }
74*c0909341SAndroid Build Coastguard Worker }
75*c0909341SAndroid Build Coastguard Worker
read_mv_component_diff(MsacContext * const msac,CdfMvComponent * const mv_comp,const int mv_prec)76*c0909341SAndroid Build Coastguard Worker static int read_mv_component_diff(MsacContext *const msac,
77*c0909341SAndroid Build Coastguard Worker CdfMvComponent *const mv_comp,
78*c0909341SAndroid Build Coastguard Worker const int mv_prec)
79*c0909341SAndroid Build Coastguard Worker {
80*c0909341SAndroid Build Coastguard Worker const int sign = dav1d_msac_decode_bool_adapt(msac, mv_comp->sign);
81*c0909341SAndroid Build Coastguard Worker const int cl = dav1d_msac_decode_symbol_adapt16(msac, mv_comp->classes, 10);
82*c0909341SAndroid Build Coastguard Worker int up, fp = 3, hp = 1;
83*c0909341SAndroid Build Coastguard Worker
84*c0909341SAndroid Build Coastguard Worker if (!cl) {
85*c0909341SAndroid Build Coastguard Worker up = dav1d_msac_decode_bool_adapt(msac, mv_comp->class0);
86*c0909341SAndroid Build Coastguard Worker if (mv_prec >= 0) { // !force_integer_mv
87*c0909341SAndroid Build Coastguard Worker fp = dav1d_msac_decode_symbol_adapt4(msac, mv_comp->class0_fp[up], 3);
88*c0909341SAndroid Build Coastguard Worker if (mv_prec > 0) // allow_high_precision_mv
89*c0909341SAndroid Build Coastguard Worker hp = dav1d_msac_decode_bool_adapt(msac, mv_comp->class0_hp);
90*c0909341SAndroid Build Coastguard Worker }
91*c0909341SAndroid Build Coastguard Worker } else {
92*c0909341SAndroid Build Coastguard Worker up = 1 << cl;
93*c0909341SAndroid Build Coastguard Worker for (int n = 0; n < cl; n++)
94*c0909341SAndroid Build Coastguard Worker up |= dav1d_msac_decode_bool_adapt(msac, mv_comp->classN[n]) << n;
95*c0909341SAndroid Build Coastguard Worker if (mv_prec >= 0) { // !force_integer_mv
96*c0909341SAndroid Build Coastguard Worker fp = dav1d_msac_decode_symbol_adapt4(msac, mv_comp->classN_fp, 3);
97*c0909341SAndroid Build Coastguard Worker if (mv_prec > 0) // allow_high_precision_mv
98*c0909341SAndroid Build Coastguard Worker hp = dav1d_msac_decode_bool_adapt(msac, mv_comp->classN_hp);
99*c0909341SAndroid Build Coastguard Worker }
100*c0909341SAndroid Build Coastguard Worker }
101*c0909341SAndroid Build Coastguard Worker
102*c0909341SAndroid Build Coastguard Worker const int diff = ((up << 3) | (fp << 1) | hp) + 1;
103*c0909341SAndroid Build Coastguard Worker
104*c0909341SAndroid Build Coastguard Worker return sign ? -diff : diff;
105*c0909341SAndroid Build Coastguard Worker }
106*c0909341SAndroid Build Coastguard Worker
read_mv_residual(Dav1dTileState * const ts,mv * const ref_mv,const int mv_prec)107*c0909341SAndroid Build Coastguard Worker static void read_mv_residual(Dav1dTileState *const ts, mv *const ref_mv,
108*c0909341SAndroid Build Coastguard Worker const int mv_prec)
109*c0909341SAndroid Build Coastguard Worker {
110*c0909341SAndroid Build Coastguard Worker MsacContext *const msac = &ts->msac;
111*c0909341SAndroid Build Coastguard Worker const enum MVJoint mv_joint =
112*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_symbol_adapt4(msac, ts->cdf.mv.joint, N_MV_JOINTS - 1);
113*c0909341SAndroid Build Coastguard Worker if (mv_joint & MV_JOINT_V)
114*c0909341SAndroid Build Coastguard Worker ref_mv->y += read_mv_component_diff(msac, &ts->cdf.mv.comp[0], mv_prec);
115*c0909341SAndroid Build Coastguard Worker if (mv_joint & MV_JOINT_H)
116*c0909341SAndroid Build Coastguard Worker ref_mv->x += read_mv_component_diff(msac, &ts->cdf.mv.comp[1], mv_prec);
117*c0909341SAndroid Build Coastguard Worker }
118*c0909341SAndroid Build Coastguard Worker
read_tx_tree(Dav1dTaskContext * const t,const enum RectTxfmSize from,const int depth,uint16_t * const masks,const int x_off,const int y_off)119*c0909341SAndroid Build Coastguard Worker static void read_tx_tree(Dav1dTaskContext *const t,
120*c0909341SAndroid Build Coastguard Worker const enum RectTxfmSize from,
121*c0909341SAndroid Build Coastguard Worker const int depth, uint16_t *const masks,
122*c0909341SAndroid Build Coastguard Worker const int x_off, const int y_off)
123*c0909341SAndroid Build Coastguard Worker {
124*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
125*c0909341SAndroid Build Coastguard Worker const int bx4 = t->bx & 31, by4 = t->by & 31;
126*c0909341SAndroid Build Coastguard Worker const TxfmInfo *const t_dim = &dav1d_txfm_dimensions[from];
127*c0909341SAndroid Build Coastguard Worker const int txw = t_dim->lw, txh = t_dim->lh;
128*c0909341SAndroid Build Coastguard Worker int is_split;
129*c0909341SAndroid Build Coastguard Worker
130*c0909341SAndroid Build Coastguard Worker if (depth < 2 && from > (int) TX_4X4) {
131*c0909341SAndroid Build Coastguard Worker const int cat = 2 * (TX_64X64 - t_dim->max) - depth;
132*c0909341SAndroid Build Coastguard Worker const int a = t->a->tx[bx4] < txw;
133*c0909341SAndroid Build Coastguard Worker const int l = t->l.tx[by4] < txh;
134*c0909341SAndroid Build Coastguard Worker
135*c0909341SAndroid Build Coastguard Worker is_split = dav1d_msac_decode_bool_adapt(&t->ts->msac,
136*c0909341SAndroid Build Coastguard Worker t->ts->cdf.m.txpart[cat][a + l]);
137*c0909341SAndroid Build Coastguard Worker if (is_split)
138*c0909341SAndroid Build Coastguard Worker masks[depth] |= 1 << (y_off * 4 + x_off);
139*c0909341SAndroid Build Coastguard Worker } else {
140*c0909341SAndroid Build Coastguard Worker is_split = 0;
141*c0909341SAndroid Build Coastguard Worker }
142*c0909341SAndroid Build Coastguard Worker
143*c0909341SAndroid Build Coastguard Worker if (is_split && t_dim->max > TX_8X8) {
144*c0909341SAndroid Build Coastguard Worker const enum RectTxfmSize sub = t_dim->sub;
145*c0909341SAndroid Build Coastguard Worker const TxfmInfo *const sub_t_dim = &dav1d_txfm_dimensions[sub];
146*c0909341SAndroid Build Coastguard Worker const int txsw = sub_t_dim->w, txsh = sub_t_dim->h;
147*c0909341SAndroid Build Coastguard Worker
148*c0909341SAndroid Build Coastguard Worker read_tx_tree(t, sub, depth + 1, masks, x_off * 2 + 0, y_off * 2 + 0);
149*c0909341SAndroid Build Coastguard Worker t->bx += txsw;
150*c0909341SAndroid Build Coastguard Worker if (txw >= txh && t->bx < f->bw)
151*c0909341SAndroid Build Coastguard Worker read_tx_tree(t, sub, depth + 1, masks, x_off * 2 + 1, y_off * 2 + 0);
152*c0909341SAndroid Build Coastguard Worker t->bx -= txsw;
153*c0909341SAndroid Build Coastguard Worker t->by += txsh;
154*c0909341SAndroid Build Coastguard Worker if (txh >= txw && t->by < f->bh) {
155*c0909341SAndroid Build Coastguard Worker read_tx_tree(t, sub, depth + 1, masks, x_off * 2 + 0, y_off * 2 + 1);
156*c0909341SAndroid Build Coastguard Worker t->bx += txsw;
157*c0909341SAndroid Build Coastguard Worker if (txw >= txh && t->bx < f->bw)
158*c0909341SAndroid Build Coastguard Worker read_tx_tree(t, sub, depth + 1, masks,
159*c0909341SAndroid Build Coastguard Worker x_off * 2 + 1, y_off * 2 + 1);
160*c0909341SAndroid Build Coastguard Worker t->bx -= txsw;
161*c0909341SAndroid Build Coastguard Worker }
162*c0909341SAndroid Build Coastguard Worker t->by -= txsh;
163*c0909341SAndroid Build Coastguard Worker } else {
164*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[t_dim->lw](&t->a->tx[bx4], is_split ? TX_4X4 : txw);
165*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[t_dim->lh](&t->l.tx[by4], is_split ? TX_4X4 : txh);
166*c0909341SAndroid Build Coastguard Worker }
167*c0909341SAndroid Build Coastguard Worker }
168*c0909341SAndroid Build Coastguard Worker
neg_deinterleave(int diff,int ref,int max)169*c0909341SAndroid Build Coastguard Worker static int neg_deinterleave(int diff, int ref, int max) {
170*c0909341SAndroid Build Coastguard Worker if (!ref) return diff;
171*c0909341SAndroid Build Coastguard Worker if (ref >= (max - 1)) return max - diff - 1;
172*c0909341SAndroid Build Coastguard Worker if (2 * ref < max) {
173*c0909341SAndroid Build Coastguard Worker if (diff <= 2 * ref) {
174*c0909341SAndroid Build Coastguard Worker if (diff & 1)
175*c0909341SAndroid Build Coastguard Worker return ref + ((diff + 1) >> 1);
176*c0909341SAndroid Build Coastguard Worker else
177*c0909341SAndroid Build Coastguard Worker return ref - (diff >> 1);
178*c0909341SAndroid Build Coastguard Worker }
179*c0909341SAndroid Build Coastguard Worker return diff;
180*c0909341SAndroid Build Coastguard Worker } else {
181*c0909341SAndroid Build Coastguard Worker if (diff <= 2 * (max - ref - 1)) {
182*c0909341SAndroid Build Coastguard Worker if (diff & 1)
183*c0909341SAndroid Build Coastguard Worker return ref + ((diff + 1) >> 1);
184*c0909341SAndroid Build Coastguard Worker else
185*c0909341SAndroid Build Coastguard Worker return ref - (diff >> 1);
186*c0909341SAndroid Build Coastguard Worker }
187*c0909341SAndroid Build Coastguard Worker return max - (diff + 1);
188*c0909341SAndroid Build Coastguard Worker }
189*c0909341SAndroid Build Coastguard Worker }
190*c0909341SAndroid Build Coastguard Worker
find_matching_ref(const Dav1dTaskContext * const t,const enum EdgeFlags intra_edge_flags,const int bw4,const int bh4,const int w4,const int h4,const int have_left,const int have_top,const int ref,uint64_t masks[2])191*c0909341SAndroid Build Coastguard Worker static void find_matching_ref(const Dav1dTaskContext *const t,
192*c0909341SAndroid Build Coastguard Worker const enum EdgeFlags intra_edge_flags,
193*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4,
194*c0909341SAndroid Build Coastguard Worker const int w4, const int h4,
195*c0909341SAndroid Build Coastguard Worker const int have_left, const int have_top,
196*c0909341SAndroid Build Coastguard Worker const int ref, uint64_t masks[2])
197*c0909341SAndroid Build Coastguard Worker {
198*c0909341SAndroid Build Coastguard Worker /*const*/ refmvs_block *const *r = &t->rt.r[(t->by & 31) + 5];
199*c0909341SAndroid Build Coastguard Worker int count = 0;
200*c0909341SAndroid Build Coastguard Worker int have_topleft = have_top && have_left;
201*c0909341SAndroid Build Coastguard Worker int have_topright = imax(bw4, bh4) < 32 &&
202*c0909341SAndroid Build Coastguard Worker have_top && t->bx + bw4 < t->ts->tiling.col_end &&
203*c0909341SAndroid Build Coastguard Worker (intra_edge_flags & EDGE_I444_TOP_HAS_RIGHT);
204*c0909341SAndroid Build Coastguard Worker
205*c0909341SAndroid Build Coastguard Worker #define bs(rp) dav1d_block_dimensions[(rp)->bs]
206*c0909341SAndroid Build Coastguard Worker #define matches(rp) ((rp)->ref.ref[0] == ref + 1 && (rp)->ref.ref[1] == -1)
207*c0909341SAndroid Build Coastguard Worker
208*c0909341SAndroid Build Coastguard Worker if (have_top) {
209*c0909341SAndroid Build Coastguard Worker const refmvs_block *r2 = &r[-1][t->bx];
210*c0909341SAndroid Build Coastguard Worker if (matches(r2)) {
211*c0909341SAndroid Build Coastguard Worker masks[0] |= 1;
212*c0909341SAndroid Build Coastguard Worker count = 1;
213*c0909341SAndroid Build Coastguard Worker }
214*c0909341SAndroid Build Coastguard Worker int aw4 = bs(r2)[0];
215*c0909341SAndroid Build Coastguard Worker if (aw4 >= bw4) {
216*c0909341SAndroid Build Coastguard Worker const int off = t->bx & (aw4 - 1);
217*c0909341SAndroid Build Coastguard Worker if (off) have_topleft = 0;
218*c0909341SAndroid Build Coastguard Worker if (aw4 - off > bw4) have_topright = 0;
219*c0909341SAndroid Build Coastguard Worker } else {
220*c0909341SAndroid Build Coastguard Worker unsigned mask = 1 << aw4;
221*c0909341SAndroid Build Coastguard Worker for (int x = aw4; x < w4; x += aw4) {
222*c0909341SAndroid Build Coastguard Worker r2 += aw4;
223*c0909341SAndroid Build Coastguard Worker if (matches(r2)) {
224*c0909341SAndroid Build Coastguard Worker masks[0] |= mask;
225*c0909341SAndroid Build Coastguard Worker if (++count >= 8) return;
226*c0909341SAndroid Build Coastguard Worker }
227*c0909341SAndroid Build Coastguard Worker aw4 = bs(r2)[0];
228*c0909341SAndroid Build Coastguard Worker mask <<= aw4;
229*c0909341SAndroid Build Coastguard Worker }
230*c0909341SAndroid Build Coastguard Worker }
231*c0909341SAndroid Build Coastguard Worker }
232*c0909341SAndroid Build Coastguard Worker if (have_left) {
233*c0909341SAndroid Build Coastguard Worker /*const*/ refmvs_block *const *r2 = r;
234*c0909341SAndroid Build Coastguard Worker if (matches(&r2[0][t->bx - 1])) {
235*c0909341SAndroid Build Coastguard Worker masks[1] |= 1;
236*c0909341SAndroid Build Coastguard Worker if (++count >= 8) return;
237*c0909341SAndroid Build Coastguard Worker }
238*c0909341SAndroid Build Coastguard Worker int lh4 = bs(&r2[0][t->bx - 1])[1];
239*c0909341SAndroid Build Coastguard Worker if (lh4 >= bh4) {
240*c0909341SAndroid Build Coastguard Worker if (t->by & (lh4 - 1)) have_topleft = 0;
241*c0909341SAndroid Build Coastguard Worker } else {
242*c0909341SAndroid Build Coastguard Worker unsigned mask = 1 << lh4;
243*c0909341SAndroid Build Coastguard Worker for (int y = lh4; y < h4; y += lh4) {
244*c0909341SAndroid Build Coastguard Worker r2 += lh4;
245*c0909341SAndroid Build Coastguard Worker if (matches(&r2[0][t->bx - 1])) {
246*c0909341SAndroid Build Coastguard Worker masks[1] |= mask;
247*c0909341SAndroid Build Coastguard Worker if (++count >= 8) return;
248*c0909341SAndroid Build Coastguard Worker }
249*c0909341SAndroid Build Coastguard Worker lh4 = bs(&r2[0][t->bx - 1])[1];
250*c0909341SAndroid Build Coastguard Worker mask <<= lh4;
251*c0909341SAndroid Build Coastguard Worker }
252*c0909341SAndroid Build Coastguard Worker }
253*c0909341SAndroid Build Coastguard Worker }
254*c0909341SAndroid Build Coastguard Worker if (have_topleft && matches(&r[-1][t->bx - 1])) {
255*c0909341SAndroid Build Coastguard Worker masks[1] |= 1ULL << 32;
256*c0909341SAndroid Build Coastguard Worker if (++count >= 8) return;
257*c0909341SAndroid Build Coastguard Worker }
258*c0909341SAndroid Build Coastguard Worker if (have_topright && matches(&r[-1][t->bx + bw4])) {
259*c0909341SAndroid Build Coastguard Worker masks[0] |= 1ULL << 32;
260*c0909341SAndroid Build Coastguard Worker }
261*c0909341SAndroid Build Coastguard Worker #undef matches
262*c0909341SAndroid Build Coastguard Worker }
263*c0909341SAndroid Build Coastguard Worker
derive_warpmv(const Dav1dTaskContext * const t,const int bw4,const int bh4,const uint64_t masks[2],const union mv mv,Dav1dWarpedMotionParams * const wmp)264*c0909341SAndroid Build Coastguard Worker static void derive_warpmv(const Dav1dTaskContext *const t,
265*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4,
266*c0909341SAndroid Build Coastguard Worker const uint64_t masks[2], const union mv mv,
267*c0909341SAndroid Build Coastguard Worker Dav1dWarpedMotionParams *const wmp)
268*c0909341SAndroid Build Coastguard Worker {
269*c0909341SAndroid Build Coastguard Worker int pts[8][2 /* in, out */][2 /* x, y */], np = 0;
270*c0909341SAndroid Build Coastguard Worker /*const*/ refmvs_block *const *r = &t->rt.r[(t->by & 31) + 5];
271*c0909341SAndroid Build Coastguard Worker
272*c0909341SAndroid Build Coastguard Worker #define add_sample(dx, dy, sx, sy, rp) do { \
273*c0909341SAndroid Build Coastguard Worker pts[np][0][0] = 16 * (2 * dx + sx * bs(rp)[0]) - 8; \
274*c0909341SAndroid Build Coastguard Worker pts[np][0][1] = 16 * (2 * dy + sy * bs(rp)[1]) - 8; \
275*c0909341SAndroid Build Coastguard Worker pts[np][1][0] = pts[np][0][0] + (rp)->mv.mv[0].x; \
276*c0909341SAndroid Build Coastguard Worker pts[np][1][1] = pts[np][0][1] + (rp)->mv.mv[0].y; \
277*c0909341SAndroid Build Coastguard Worker np++; \
278*c0909341SAndroid Build Coastguard Worker } while (0)
279*c0909341SAndroid Build Coastguard Worker
280*c0909341SAndroid Build Coastguard Worker // use masks[] to find the projectable motion vectors in the edges
281*c0909341SAndroid Build Coastguard Worker if ((unsigned) masks[0] == 1 && !(masks[1] >> 32)) {
282*c0909341SAndroid Build Coastguard Worker const int off = t->bx & (bs(&r[-1][t->bx])[0] - 1);
283*c0909341SAndroid Build Coastguard Worker add_sample(-off, 0, 1, -1, &r[-1][t->bx]);
284*c0909341SAndroid Build Coastguard Worker } else for (unsigned off = 0, xmask = (uint32_t) masks[0]; np < 8 && xmask;) { // top
285*c0909341SAndroid Build Coastguard Worker const int tz = ctz(xmask);
286*c0909341SAndroid Build Coastguard Worker off += tz;
287*c0909341SAndroid Build Coastguard Worker xmask >>= tz;
288*c0909341SAndroid Build Coastguard Worker add_sample(off, 0, 1, -1, &r[-1][t->bx + off]);
289*c0909341SAndroid Build Coastguard Worker xmask &= ~1;
290*c0909341SAndroid Build Coastguard Worker }
291*c0909341SAndroid Build Coastguard Worker if (np < 8 && masks[1] == 1) {
292*c0909341SAndroid Build Coastguard Worker const int off = t->by & (bs(&r[0][t->bx - 1])[1] - 1);
293*c0909341SAndroid Build Coastguard Worker add_sample(0, -off, -1, 1, &r[-off][t->bx - 1]);
294*c0909341SAndroid Build Coastguard Worker } else for (unsigned off = 0, ymask = (uint32_t) masks[1]; np < 8 && ymask;) { // left
295*c0909341SAndroid Build Coastguard Worker const int tz = ctz(ymask);
296*c0909341SAndroid Build Coastguard Worker off += tz;
297*c0909341SAndroid Build Coastguard Worker ymask >>= tz;
298*c0909341SAndroid Build Coastguard Worker add_sample(0, off, -1, 1, &r[off][t->bx - 1]);
299*c0909341SAndroid Build Coastguard Worker ymask &= ~1;
300*c0909341SAndroid Build Coastguard Worker }
301*c0909341SAndroid Build Coastguard Worker if (np < 8 && masks[1] >> 32) // top/left
302*c0909341SAndroid Build Coastguard Worker add_sample(0, 0, -1, -1, &r[-1][t->bx - 1]);
303*c0909341SAndroid Build Coastguard Worker if (np < 8 && masks[0] >> 32) // top/right
304*c0909341SAndroid Build Coastguard Worker add_sample(bw4, 0, 1, -1, &r[-1][t->bx + bw4]);
305*c0909341SAndroid Build Coastguard Worker assert(np > 0 && np <= 8);
306*c0909341SAndroid Build Coastguard Worker #undef bs
307*c0909341SAndroid Build Coastguard Worker
308*c0909341SAndroid Build Coastguard Worker // select according to motion vector difference against a threshold
309*c0909341SAndroid Build Coastguard Worker int mvd[8], ret = 0;
310*c0909341SAndroid Build Coastguard Worker const int thresh = 4 * iclip(imax(bw4, bh4), 4, 28);
311*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < np; i++) {
312*c0909341SAndroid Build Coastguard Worker mvd[i] = abs(pts[i][1][0] - pts[i][0][0] - mv.x) +
313*c0909341SAndroid Build Coastguard Worker abs(pts[i][1][1] - pts[i][0][1] - mv.y);
314*c0909341SAndroid Build Coastguard Worker if (mvd[i] > thresh)
315*c0909341SAndroid Build Coastguard Worker mvd[i] = -1;
316*c0909341SAndroid Build Coastguard Worker else
317*c0909341SAndroid Build Coastguard Worker ret++;
318*c0909341SAndroid Build Coastguard Worker }
319*c0909341SAndroid Build Coastguard Worker if (!ret) {
320*c0909341SAndroid Build Coastguard Worker ret = 1;
321*c0909341SAndroid Build Coastguard Worker } else for (int i = 0, j = np - 1, k = 0; k < np - ret; k++, i++, j--) {
322*c0909341SAndroid Build Coastguard Worker while (mvd[i] != -1) i++;
323*c0909341SAndroid Build Coastguard Worker while (mvd[j] == -1) j--;
324*c0909341SAndroid Build Coastguard Worker assert(i != j);
325*c0909341SAndroid Build Coastguard Worker if (i > j) break;
326*c0909341SAndroid Build Coastguard Worker // replace the discarded samples;
327*c0909341SAndroid Build Coastguard Worker mvd[i] = mvd[j];
328*c0909341SAndroid Build Coastguard Worker memcpy(pts[i], pts[j], sizeof(*pts));
329*c0909341SAndroid Build Coastguard Worker }
330*c0909341SAndroid Build Coastguard Worker
331*c0909341SAndroid Build Coastguard Worker if (!dav1d_find_affine_int(pts, ret, bw4, bh4, mv, wmp, t->bx, t->by) &&
332*c0909341SAndroid Build Coastguard Worker !dav1d_get_shear_params(wmp))
333*c0909341SAndroid Build Coastguard Worker {
334*c0909341SAndroid Build Coastguard Worker wmp->type = DAV1D_WM_TYPE_AFFINE;
335*c0909341SAndroid Build Coastguard Worker } else
336*c0909341SAndroid Build Coastguard Worker wmp->type = DAV1D_WM_TYPE_IDENTITY;
337*c0909341SAndroid Build Coastguard Worker }
338*c0909341SAndroid Build Coastguard Worker
findoddzero(const uint8_t * buf,int len)339*c0909341SAndroid Build Coastguard Worker static inline int findoddzero(const uint8_t *buf, int len) {
340*c0909341SAndroid Build Coastguard Worker for (int n = 0; n < len; n++)
341*c0909341SAndroid Build Coastguard Worker if (!buf[n * 2]) return 1;
342*c0909341SAndroid Build Coastguard Worker return 0;
343*c0909341SAndroid Build Coastguard Worker }
344*c0909341SAndroid Build Coastguard Worker
345*c0909341SAndroid Build Coastguard Worker // meant to be SIMD'able, so that theoretical complexity of this function
346*c0909341SAndroid Build Coastguard Worker // times block size goes from w4*h4 to w4+h4-1
347*c0909341SAndroid Build Coastguard Worker // a and b are previous two lines containing (a) top/left entries or (b)
348*c0909341SAndroid Build Coastguard Worker // top/left entries, with a[0] being either the first top or first left entry,
349*c0909341SAndroid Build Coastguard Worker // depending on top_offset being 1 or 0, and b being the first top/left entry
350*c0909341SAndroid Build Coastguard Worker // for whichever has one. left_offset indicates whether the (len-1)th entry
351*c0909341SAndroid Build Coastguard Worker // has a left neighbour.
352*c0909341SAndroid Build Coastguard Worker // output is order[] and ctx for each member of this diagonal.
order_palette(const uint8_t * pal_idx,const ptrdiff_t stride,const int i,const int first,const int last,uint8_t (* const order)[8],uint8_t * const ctx)353*c0909341SAndroid Build Coastguard Worker static void order_palette(const uint8_t *pal_idx, const ptrdiff_t stride,
354*c0909341SAndroid Build Coastguard Worker const int i, const int first, const int last,
355*c0909341SAndroid Build Coastguard Worker uint8_t (*const order)[8], uint8_t *const ctx)
356*c0909341SAndroid Build Coastguard Worker {
357*c0909341SAndroid Build Coastguard Worker int have_top = i > first;
358*c0909341SAndroid Build Coastguard Worker
359*c0909341SAndroid Build Coastguard Worker assert(pal_idx);
360*c0909341SAndroid Build Coastguard Worker pal_idx += first + (i - first) * stride;
361*c0909341SAndroid Build Coastguard Worker for (int j = first, n = 0; j >= last; have_top = 1, j--, n++, pal_idx += stride - 1) {
362*c0909341SAndroid Build Coastguard Worker const int have_left = j > 0;
363*c0909341SAndroid Build Coastguard Worker
364*c0909341SAndroid Build Coastguard Worker assert(have_left || have_top);
365*c0909341SAndroid Build Coastguard Worker
366*c0909341SAndroid Build Coastguard Worker #define add(v_in) do { \
367*c0909341SAndroid Build Coastguard Worker const int v = v_in; \
368*c0909341SAndroid Build Coastguard Worker assert((unsigned)v < 8U); \
369*c0909341SAndroid Build Coastguard Worker order[n][o_idx++] = v; \
370*c0909341SAndroid Build Coastguard Worker mask |= 1 << v; \
371*c0909341SAndroid Build Coastguard Worker } while (0)
372*c0909341SAndroid Build Coastguard Worker
373*c0909341SAndroid Build Coastguard Worker unsigned mask = 0;
374*c0909341SAndroid Build Coastguard Worker int o_idx = 0;
375*c0909341SAndroid Build Coastguard Worker if (!have_left) {
376*c0909341SAndroid Build Coastguard Worker ctx[n] = 0;
377*c0909341SAndroid Build Coastguard Worker add(pal_idx[-stride]);
378*c0909341SAndroid Build Coastguard Worker } else if (!have_top) {
379*c0909341SAndroid Build Coastguard Worker ctx[n] = 0;
380*c0909341SAndroid Build Coastguard Worker add(pal_idx[-1]);
381*c0909341SAndroid Build Coastguard Worker } else {
382*c0909341SAndroid Build Coastguard Worker const int l = pal_idx[-1], t = pal_idx[-stride], tl = pal_idx[-(stride + 1)];
383*c0909341SAndroid Build Coastguard Worker const int same_t_l = t == l;
384*c0909341SAndroid Build Coastguard Worker const int same_t_tl = t == tl;
385*c0909341SAndroid Build Coastguard Worker const int same_l_tl = l == tl;
386*c0909341SAndroid Build Coastguard Worker const int same_all = same_t_l & same_t_tl & same_l_tl;
387*c0909341SAndroid Build Coastguard Worker
388*c0909341SAndroid Build Coastguard Worker if (same_all) {
389*c0909341SAndroid Build Coastguard Worker ctx[n] = 4;
390*c0909341SAndroid Build Coastguard Worker add(t);
391*c0909341SAndroid Build Coastguard Worker } else if (same_t_l) {
392*c0909341SAndroid Build Coastguard Worker ctx[n] = 3;
393*c0909341SAndroid Build Coastguard Worker add(t);
394*c0909341SAndroid Build Coastguard Worker add(tl);
395*c0909341SAndroid Build Coastguard Worker } else if (same_t_tl | same_l_tl) {
396*c0909341SAndroid Build Coastguard Worker ctx[n] = 2;
397*c0909341SAndroid Build Coastguard Worker add(tl);
398*c0909341SAndroid Build Coastguard Worker add(same_t_tl ? l : t);
399*c0909341SAndroid Build Coastguard Worker } else {
400*c0909341SAndroid Build Coastguard Worker ctx[n] = 1;
401*c0909341SAndroid Build Coastguard Worker add(imin(t, l));
402*c0909341SAndroid Build Coastguard Worker add(imax(t, l));
403*c0909341SAndroid Build Coastguard Worker add(tl);
404*c0909341SAndroid Build Coastguard Worker }
405*c0909341SAndroid Build Coastguard Worker }
406*c0909341SAndroid Build Coastguard Worker for (unsigned m = 1, bit = 0; m < 0x100; m <<= 1, bit++)
407*c0909341SAndroid Build Coastguard Worker if (!(mask & m))
408*c0909341SAndroid Build Coastguard Worker order[n][o_idx++] = bit;
409*c0909341SAndroid Build Coastguard Worker assert(o_idx == 8);
410*c0909341SAndroid Build Coastguard Worker #undef add
411*c0909341SAndroid Build Coastguard Worker }
412*c0909341SAndroid Build Coastguard Worker }
413*c0909341SAndroid Build Coastguard Worker
read_pal_indices(Dav1dTaskContext * const t,uint8_t * const pal_idx,const Av1Block * const b,const int pl,const int w4,const int h4,const int bw4,const int bh4)414*c0909341SAndroid Build Coastguard Worker static void read_pal_indices(Dav1dTaskContext *const t,
415*c0909341SAndroid Build Coastguard Worker uint8_t *const pal_idx,
416*c0909341SAndroid Build Coastguard Worker const Av1Block *const b, const int pl,
417*c0909341SAndroid Build Coastguard Worker const int w4, const int h4,
418*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4)
419*c0909341SAndroid Build Coastguard Worker {
420*c0909341SAndroid Build Coastguard Worker Dav1dTileState *const ts = t->ts;
421*c0909341SAndroid Build Coastguard Worker const ptrdiff_t stride = bw4 * 4;
422*c0909341SAndroid Build Coastguard Worker assert(pal_idx);
423*c0909341SAndroid Build Coastguard Worker pixel *const pal_tmp = t->scratch.pal_idx_uv;
424*c0909341SAndroid Build Coastguard Worker pal_tmp[0] = dav1d_msac_decode_uniform(&ts->msac, b->pal_sz[pl]);
425*c0909341SAndroid Build Coastguard Worker uint16_t (*const color_map_cdf)[8] =
426*c0909341SAndroid Build Coastguard Worker ts->cdf.m.color_map[pl][b->pal_sz[pl] - 2];
427*c0909341SAndroid Build Coastguard Worker uint8_t (*const order)[8] = t->scratch.pal_order;
428*c0909341SAndroid Build Coastguard Worker uint8_t *const ctx = t->scratch.pal_ctx;
429*c0909341SAndroid Build Coastguard Worker for (int i = 1; i < 4 * (w4 + h4) - 1; i++) {
430*c0909341SAndroid Build Coastguard Worker // top/left-to-bottom/right diagonals ("wave-front")
431*c0909341SAndroid Build Coastguard Worker const int first = imin(i, w4 * 4 - 1);
432*c0909341SAndroid Build Coastguard Worker const int last = imax(0, i - h4 * 4 + 1);
433*c0909341SAndroid Build Coastguard Worker order_palette(pal_tmp, stride, i, first, last, order, ctx);
434*c0909341SAndroid Build Coastguard Worker for (int j = first, m = 0; j >= last; j--, m++) {
435*c0909341SAndroid Build Coastguard Worker const int color_idx = dav1d_msac_decode_symbol_adapt8(&ts->msac,
436*c0909341SAndroid Build Coastguard Worker color_map_cdf[ctx[m]], b->pal_sz[pl] - 1);
437*c0909341SAndroid Build Coastguard Worker pal_tmp[(i - j) * stride + j] = order[m][color_idx];
438*c0909341SAndroid Build Coastguard Worker }
439*c0909341SAndroid Build Coastguard Worker }
440*c0909341SAndroid Build Coastguard Worker
441*c0909341SAndroid Build Coastguard Worker t->c->pal_dsp.pal_idx_finish(pal_idx, pal_tmp, bw4 * 4, bh4 * 4,
442*c0909341SAndroid Build Coastguard Worker w4 * 4, h4 * 4);
443*c0909341SAndroid Build Coastguard Worker }
444*c0909341SAndroid Build Coastguard Worker
read_vartx_tree(Dav1dTaskContext * const t,Av1Block * const b,const enum BlockSize bs,const int bx4,const int by4)445*c0909341SAndroid Build Coastguard Worker static void read_vartx_tree(Dav1dTaskContext *const t,
446*c0909341SAndroid Build Coastguard Worker Av1Block *const b, const enum BlockSize bs,
447*c0909341SAndroid Build Coastguard Worker const int bx4, const int by4)
448*c0909341SAndroid Build Coastguard Worker {
449*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
450*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim = dav1d_block_dimensions[bs];
451*c0909341SAndroid Build Coastguard Worker const int bw4 = b_dim[0], bh4 = b_dim[1];
452*c0909341SAndroid Build Coastguard Worker
453*c0909341SAndroid Build Coastguard Worker // var-tx tree coding
454*c0909341SAndroid Build Coastguard Worker uint16_t tx_split[2] = { 0 };
455*c0909341SAndroid Build Coastguard Worker b->max_ytx = dav1d_max_txfm_size_for_bs[bs][0];
456*c0909341SAndroid Build Coastguard Worker if (!b->skip && (f->frame_hdr->segmentation.lossless[b->seg_id] ||
457*c0909341SAndroid Build Coastguard Worker b->max_ytx == TX_4X4))
458*c0909341SAndroid Build Coastguard Worker {
459*c0909341SAndroid Build Coastguard Worker b->max_ytx = b->uvtx = TX_4X4;
460*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->txfm_mode == DAV1D_TX_SWITCHABLE) {
461*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[b_dim[2]](&t->a->tx[bx4], TX_4X4);
462*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[b_dim[3]](&t->l.tx[by4], TX_4X4);
463*c0909341SAndroid Build Coastguard Worker }
464*c0909341SAndroid Build Coastguard Worker } else if (f->frame_hdr->txfm_mode != DAV1D_TX_SWITCHABLE || b->skip) {
465*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->txfm_mode == DAV1D_TX_SWITCHABLE) {
466*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[b_dim[2]](&t->a->tx[bx4], b_dim[2 + 0]);
467*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[b_dim[3]](&t->l.tx[by4], b_dim[2 + 1]);
468*c0909341SAndroid Build Coastguard Worker }
469*c0909341SAndroid Build Coastguard Worker b->uvtx = dav1d_max_txfm_size_for_bs[bs][f->cur.p.layout];
470*c0909341SAndroid Build Coastguard Worker } else {
471*c0909341SAndroid Build Coastguard Worker assert(bw4 <= 16 || bh4 <= 16 || b->max_ytx == TX_64X64);
472*c0909341SAndroid Build Coastguard Worker int y, x, y_off, x_off;
473*c0909341SAndroid Build Coastguard Worker const TxfmInfo *const ytx = &dav1d_txfm_dimensions[b->max_ytx];
474*c0909341SAndroid Build Coastguard Worker for (y = 0, y_off = 0; y < bh4; y += ytx->h, y_off++) {
475*c0909341SAndroid Build Coastguard Worker for (x = 0, x_off = 0; x < bw4; x += ytx->w, x_off++) {
476*c0909341SAndroid Build Coastguard Worker read_tx_tree(t, b->max_ytx, 0, tx_split, x_off, y_off);
477*c0909341SAndroid Build Coastguard Worker // contexts are updated inside read_tx_tree()
478*c0909341SAndroid Build Coastguard Worker t->bx += ytx->w;
479*c0909341SAndroid Build Coastguard Worker }
480*c0909341SAndroid Build Coastguard Worker t->bx -= x;
481*c0909341SAndroid Build Coastguard Worker t->by += ytx->h;
482*c0909341SAndroid Build Coastguard Worker }
483*c0909341SAndroid Build Coastguard Worker t->by -= y;
484*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
485*c0909341SAndroid Build Coastguard Worker printf("Post-vartxtree[%x/%x]: r=%d\n",
486*c0909341SAndroid Build Coastguard Worker tx_split[0], tx_split[1], t->ts->msac.rng);
487*c0909341SAndroid Build Coastguard Worker b->uvtx = dav1d_max_txfm_size_for_bs[bs][f->cur.p.layout];
488*c0909341SAndroid Build Coastguard Worker }
489*c0909341SAndroid Build Coastguard Worker assert(!(tx_split[0] & ~0x33));
490*c0909341SAndroid Build Coastguard Worker b->tx_split0 = (uint8_t)tx_split[0];
491*c0909341SAndroid Build Coastguard Worker b->tx_split1 = tx_split[1];
492*c0909341SAndroid Build Coastguard Worker }
493*c0909341SAndroid Build Coastguard Worker
get_prev_frame_segid(const Dav1dFrameContext * const f,const int by,const int bx,const int w4,int h4,const uint8_t * ref_seg_map,const ptrdiff_t stride)494*c0909341SAndroid Build Coastguard Worker static inline unsigned get_prev_frame_segid(const Dav1dFrameContext *const f,
495*c0909341SAndroid Build Coastguard Worker const int by, const int bx,
496*c0909341SAndroid Build Coastguard Worker const int w4, int h4,
497*c0909341SAndroid Build Coastguard Worker const uint8_t *ref_seg_map,
498*c0909341SAndroid Build Coastguard Worker const ptrdiff_t stride)
499*c0909341SAndroid Build Coastguard Worker {
500*c0909341SAndroid Build Coastguard Worker assert(f->frame_hdr->primary_ref_frame != DAV1D_PRIMARY_REF_NONE);
501*c0909341SAndroid Build Coastguard Worker
502*c0909341SAndroid Build Coastguard Worker unsigned seg_id = 8;
503*c0909341SAndroid Build Coastguard Worker ref_seg_map += by * stride + bx;
504*c0909341SAndroid Build Coastguard Worker do {
505*c0909341SAndroid Build Coastguard Worker for (int x = 0; x < w4; x++)
506*c0909341SAndroid Build Coastguard Worker seg_id = imin(seg_id, ref_seg_map[x]);
507*c0909341SAndroid Build Coastguard Worker ref_seg_map += stride;
508*c0909341SAndroid Build Coastguard Worker } while (--h4 > 0 && seg_id);
509*c0909341SAndroid Build Coastguard Worker assert(seg_id < 8);
510*c0909341SAndroid Build Coastguard Worker
511*c0909341SAndroid Build Coastguard Worker return seg_id;
512*c0909341SAndroid Build Coastguard Worker }
513*c0909341SAndroid Build Coastguard Worker
splat_oneref_mv(const Dav1dContext * const c,Dav1dTaskContext * const t,const enum BlockSize bs,const Av1Block * const b,const int bw4,const int bh4)514*c0909341SAndroid Build Coastguard Worker static inline void splat_oneref_mv(const Dav1dContext *const c,
515*c0909341SAndroid Build Coastguard Worker Dav1dTaskContext *const t,
516*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
517*c0909341SAndroid Build Coastguard Worker const Av1Block *const b,
518*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4)
519*c0909341SAndroid Build Coastguard Worker {
520*c0909341SAndroid Build Coastguard Worker const enum InterPredMode mode = b->inter_mode;
521*c0909341SAndroid Build Coastguard Worker const refmvs_block ALIGN(tmpl, 16) = (refmvs_block) {
522*c0909341SAndroid Build Coastguard Worker .ref.ref = { b->ref[0] + 1, b->interintra_type ? 0 : -1 },
523*c0909341SAndroid Build Coastguard Worker .mv.mv[0] = b->mv[0],
524*c0909341SAndroid Build Coastguard Worker .bs = bs,
525*c0909341SAndroid Build Coastguard Worker .mf = (mode == GLOBALMV && imin(bw4, bh4) >= 2) | ((mode == NEWMV) * 2),
526*c0909341SAndroid Build Coastguard Worker };
527*c0909341SAndroid Build Coastguard Worker c->refmvs_dsp.splat_mv(&t->rt.r[(t->by & 31) + 5], &tmpl, t->bx, bw4, bh4);
528*c0909341SAndroid Build Coastguard Worker }
529*c0909341SAndroid Build Coastguard Worker
splat_intrabc_mv(const Dav1dContext * const c,Dav1dTaskContext * const t,const enum BlockSize bs,const Av1Block * const b,const int bw4,const int bh4)530*c0909341SAndroid Build Coastguard Worker static inline void splat_intrabc_mv(const Dav1dContext *const c,
531*c0909341SAndroid Build Coastguard Worker Dav1dTaskContext *const t,
532*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
533*c0909341SAndroid Build Coastguard Worker const Av1Block *const b,
534*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4)
535*c0909341SAndroid Build Coastguard Worker {
536*c0909341SAndroid Build Coastguard Worker const refmvs_block ALIGN(tmpl, 16) = (refmvs_block) {
537*c0909341SAndroid Build Coastguard Worker .ref.ref = { 0, -1 },
538*c0909341SAndroid Build Coastguard Worker .mv.mv[0] = b->mv[0],
539*c0909341SAndroid Build Coastguard Worker .bs = bs,
540*c0909341SAndroid Build Coastguard Worker .mf = 0,
541*c0909341SAndroid Build Coastguard Worker };
542*c0909341SAndroid Build Coastguard Worker c->refmvs_dsp.splat_mv(&t->rt.r[(t->by & 31) + 5], &tmpl, t->bx, bw4, bh4);
543*c0909341SAndroid Build Coastguard Worker }
544*c0909341SAndroid Build Coastguard Worker
splat_tworef_mv(const Dav1dContext * const c,Dav1dTaskContext * const t,const enum BlockSize bs,const Av1Block * const b,const int bw4,const int bh4)545*c0909341SAndroid Build Coastguard Worker static inline void splat_tworef_mv(const Dav1dContext *const c,
546*c0909341SAndroid Build Coastguard Worker Dav1dTaskContext *const t,
547*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
548*c0909341SAndroid Build Coastguard Worker const Av1Block *const b,
549*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4)
550*c0909341SAndroid Build Coastguard Worker {
551*c0909341SAndroid Build Coastguard Worker assert(bw4 >= 2 && bh4 >= 2);
552*c0909341SAndroid Build Coastguard Worker const enum CompInterPredMode mode = b->inter_mode;
553*c0909341SAndroid Build Coastguard Worker const refmvs_block ALIGN(tmpl, 16) = (refmvs_block) {
554*c0909341SAndroid Build Coastguard Worker .ref.ref = { b->ref[0] + 1, b->ref[1] + 1 },
555*c0909341SAndroid Build Coastguard Worker .mv.mv = { b->mv[0], b->mv[1] },
556*c0909341SAndroid Build Coastguard Worker .bs = bs,
557*c0909341SAndroid Build Coastguard Worker .mf = (mode == GLOBALMV_GLOBALMV) | !!((1 << mode) & (0xbc)) * 2,
558*c0909341SAndroid Build Coastguard Worker };
559*c0909341SAndroid Build Coastguard Worker c->refmvs_dsp.splat_mv(&t->rt.r[(t->by & 31) + 5], &tmpl, t->bx, bw4, bh4);
560*c0909341SAndroid Build Coastguard Worker }
561*c0909341SAndroid Build Coastguard Worker
splat_intraref(const Dav1dContext * const c,Dav1dTaskContext * const t,const enum BlockSize bs,const int bw4,const int bh4)562*c0909341SAndroid Build Coastguard Worker static inline void splat_intraref(const Dav1dContext *const c,
563*c0909341SAndroid Build Coastguard Worker Dav1dTaskContext *const t,
564*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
565*c0909341SAndroid Build Coastguard Worker const int bw4, const int bh4)
566*c0909341SAndroid Build Coastguard Worker {
567*c0909341SAndroid Build Coastguard Worker const refmvs_block ALIGN(tmpl, 16) = (refmvs_block) {
568*c0909341SAndroid Build Coastguard Worker .ref.ref = { 0, -1 },
569*c0909341SAndroid Build Coastguard Worker .mv.mv[0].n = INVALID_MV,
570*c0909341SAndroid Build Coastguard Worker .bs = bs,
571*c0909341SAndroid Build Coastguard Worker .mf = 0,
572*c0909341SAndroid Build Coastguard Worker };
573*c0909341SAndroid Build Coastguard Worker c->refmvs_dsp.splat_mv(&t->rt.r[(t->by & 31) + 5], &tmpl, t->bx, bw4, bh4);
574*c0909341SAndroid Build Coastguard Worker }
575*c0909341SAndroid Build Coastguard Worker
mc_lowest_px(int * const dst,const int by4,const int bh4,const int mvy,const int ss_ver,const struct ScalableMotionParams * const smp)576*c0909341SAndroid Build Coastguard Worker static void mc_lowest_px(int *const dst, const int by4, const int bh4,
577*c0909341SAndroid Build Coastguard Worker const int mvy, const int ss_ver,
578*c0909341SAndroid Build Coastguard Worker const struct ScalableMotionParams *const smp)
579*c0909341SAndroid Build Coastguard Worker {
580*c0909341SAndroid Build Coastguard Worker const int v_mul = 4 >> ss_ver;
581*c0909341SAndroid Build Coastguard Worker if (!smp->scale) {
582*c0909341SAndroid Build Coastguard Worker const int my = mvy >> (3 + ss_ver), dy = mvy & (15 >> !ss_ver);
583*c0909341SAndroid Build Coastguard Worker *dst = imax(*dst, (by4 + bh4) * v_mul + my + 4 * !!dy);
584*c0909341SAndroid Build Coastguard Worker } else {
585*c0909341SAndroid Build Coastguard Worker int y = (by4 * v_mul << 4) + mvy * (1 << !ss_ver);
586*c0909341SAndroid Build Coastguard Worker const int64_t tmp = (int64_t)(y) * smp->scale + (smp->scale - 0x4000) * 8;
587*c0909341SAndroid Build Coastguard Worker y = apply_sign64((int)((llabs(tmp) + 128) >> 8), tmp) + 32;
588*c0909341SAndroid Build Coastguard Worker const int bottom = ((y + (bh4 * v_mul - 1) * smp->step) >> 10) + 1 + 4;
589*c0909341SAndroid Build Coastguard Worker *dst = imax(*dst, bottom);
590*c0909341SAndroid Build Coastguard Worker }
591*c0909341SAndroid Build Coastguard Worker }
592*c0909341SAndroid Build Coastguard Worker
affine_lowest_px(Dav1dTaskContext * const t,int * const dst,const uint8_t * const b_dim,const Dav1dWarpedMotionParams * const wmp,const int ss_ver,const int ss_hor)593*c0909341SAndroid Build Coastguard Worker static ALWAYS_INLINE void affine_lowest_px(Dav1dTaskContext *const t, int *const dst,
594*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim,
595*c0909341SAndroid Build Coastguard Worker const Dav1dWarpedMotionParams *const wmp,
596*c0909341SAndroid Build Coastguard Worker const int ss_ver, const int ss_hor)
597*c0909341SAndroid Build Coastguard Worker {
598*c0909341SAndroid Build Coastguard Worker const int h_mul = 4 >> ss_hor, v_mul = 4 >> ss_ver;
599*c0909341SAndroid Build Coastguard Worker assert(!((b_dim[0] * h_mul) & 7) && !((b_dim[1] * v_mul) & 7));
600*c0909341SAndroid Build Coastguard Worker const int32_t *const mat = wmp->matrix;
601*c0909341SAndroid Build Coastguard Worker const int y = b_dim[1] * v_mul - 8; // lowest y
602*c0909341SAndroid Build Coastguard Worker
603*c0909341SAndroid Build Coastguard Worker const int src_y = t->by * 4 + ((y + 4) << ss_ver);
604*c0909341SAndroid Build Coastguard Worker const int64_t mat5_y = (int64_t) mat[5] * src_y + mat[1];
605*c0909341SAndroid Build Coastguard Worker // check left- and right-most blocks
606*c0909341SAndroid Build Coastguard Worker for (int x = 0; x < b_dim[0] * h_mul; x += imax(8, b_dim[0] * h_mul - 8)) {
607*c0909341SAndroid Build Coastguard Worker // calculate transformation relative to center of 8x8 block in
608*c0909341SAndroid Build Coastguard Worker // luma pixel units
609*c0909341SAndroid Build Coastguard Worker const int src_x = t->bx * 4 + ((x + 4) << ss_hor);
610*c0909341SAndroid Build Coastguard Worker const int64_t mvy = ((int64_t) mat[4] * src_x + mat5_y) >> ss_ver;
611*c0909341SAndroid Build Coastguard Worker const int dy = (int) (mvy >> 16) - 4;
612*c0909341SAndroid Build Coastguard Worker *dst = imax(*dst, dy + 4 + 8);
613*c0909341SAndroid Build Coastguard Worker }
614*c0909341SAndroid Build Coastguard Worker }
615*c0909341SAndroid Build Coastguard Worker
affine_lowest_px_luma(Dav1dTaskContext * const t,int * const dst,const uint8_t * const b_dim,const Dav1dWarpedMotionParams * const wmp)616*c0909341SAndroid Build Coastguard Worker static NOINLINE void affine_lowest_px_luma(Dav1dTaskContext *const t, int *const dst,
617*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim,
618*c0909341SAndroid Build Coastguard Worker const Dav1dWarpedMotionParams *const wmp)
619*c0909341SAndroid Build Coastguard Worker {
620*c0909341SAndroid Build Coastguard Worker affine_lowest_px(t, dst, b_dim, wmp, 0, 0);
621*c0909341SAndroid Build Coastguard Worker }
622*c0909341SAndroid Build Coastguard Worker
affine_lowest_px_chroma(Dav1dTaskContext * const t,int * const dst,const uint8_t * const b_dim,const Dav1dWarpedMotionParams * const wmp)623*c0909341SAndroid Build Coastguard Worker static NOINLINE void affine_lowest_px_chroma(Dav1dTaskContext *const t, int *const dst,
624*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim,
625*c0909341SAndroid Build Coastguard Worker const Dav1dWarpedMotionParams *const wmp)
626*c0909341SAndroid Build Coastguard Worker {
627*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
628*c0909341SAndroid Build Coastguard Worker assert(f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I400);
629*c0909341SAndroid Build Coastguard Worker if (f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I444)
630*c0909341SAndroid Build Coastguard Worker affine_lowest_px_luma(t, dst, b_dim, wmp);
631*c0909341SAndroid Build Coastguard Worker else
632*c0909341SAndroid Build Coastguard Worker affine_lowest_px(t, dst, b_dim, wmp, f->cur.p.layout & DAV1D_PIXEL_LAYOUT_I420, 1);
633*c0909341SAndroid Build Coastguard Worker }
634*c0909341SAndroid Build Coastguard Worker
obmc_lowest_px(Dav1dTaskContext * const t,int (* const dst)[2],const int is_chroma,const uint8_t * const b_dim,const int bx4,const int by4,const int w4,const int h4)635*c0909341SAndroid Build Coastguard Worker static void obmc_lowest_px(Dav1dTaskContext *const t,
636*c0909341SAndroid Build Coastguard Worker int (*const dst)[2], const int is_chroma,
637*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim,
638*c0909341SAndroid Build Coastguard Worker const int bx4, const int by4, const int w4, const int h4)
639*c0909341SAndroid Build Coastguard Worker {
640*c0909341SAndroid Build Coastguard Worker assert(!(t->bx & 1) && !(t->by & 1));
641*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
642*c0909341SAndroid Build Coastguard Worker /*const*/ refmvs_block **r = &t->rt.r[(t->by & 31) + 5];
643*c0909341SAndroid Build Coastguard Worker const int ss_ver = is_chroma && f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
644*c0909341SAndroid Build Coastguard Worker const int ss_hor = is_chroma && f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
645*c0909341SAndroid Build Coastguard Worker const int h_mul = 4 >> ss_hor, v_mul = 4 >> ss_ver;
646*c0909341SAndroid Build Coastguard Worker
647*c0909341SAndroid Build Coastguard Worker if (t->by > t->ts->tiling.row_start &&
648*c0909341SAndroid Build Coastguard Worker (!is_chroma || b_dim[0] * h_mul + b_dim[1] * v_mul >= 16))
649*c0909341SAndroid Build Coastguard Worker {
650*c0909341SAndroid Build Coastguard Worker for (int i = 0, x = 0; x < w4 && i < imin(b_dim[2], 4); ) {
651*c0909341SAndroid Build Coastguard Worker // only odd blocks are considered for overlap handling, hence +1
652*c0909341SAndroid Build Coastguard Worker const refmvs_block *const a_r = &r[-1][t->bx + x + 1];
653*c0909341SAndroid Build Coastguard Worker const uint8_t *const a_b_dim = dav1d_block_dimensions[a_r->bs];
654*c0909341SAndroid Build Coastguard Worker
655*c0909341SAndroid Build Coastguard Worker if (a_r->ref.ref[0] > 0) {
656*c0909341SAndroid Build Coastguard Worker const int oh4 = imin(b_dim[1], 16) >> 1;
657*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&dst[a_r->ref.ref[0] - 1][is_chroma], t->by,
658*c0909341SAndroid Build Coastguard Worker (oh4 * 3 + 3) >> 2, a_r->mv.mv[0].y, ss_ver,
659*c0909341SAndroid Build Coastguard Worker &f->svc[a_r->ref.ref[0] - 1][1]);
660*c0909341SAndroid Build Coastguard Worker i++;
661*c0909341SAndroid Build Coastguard Worker }
662*c0909341SAndroid Build Coastguard Worker x += imax(a_b_dim[0], 2);
663*c0909341SAndroid Build Coastguard Worker }
664*c0909341SAndroid Build Coastguard Worker }
665*c0909341SAndroid Build Coastguard Worker
666*c0909341SAndroid Build Coastguard Worker if (t->bx > t->ts->tiling.col_start)
667*c0909341SAndroid Build Coastguard Worker for (int i = 0, y = 0; y < h4 && i < imin(b_dim[3], 4); ) {
668*c0909341SAndroid Build Coastguard Worker // only odd blocks are considered for overlap handling, hence +1
669*c0909341SAndroid Build Coastguard Worker const refmvs_block *const l_r = &r[y + 1][t->bx - 1];
670*c0909341SAndroid Build Coastguard Worker const uint8_t *const l_b_dim = dav1d_block_dimensions[l_r->bs];
671*c0909341SAndroid Build Coastguard Worker
672*c0909341SAndroid Build Coastguard Worker if (l_r->ref.ref[0] > 0) {
673*c0909341SAndroid Build Coastguard Worker const int oh4 = iclip(l_b_dim[1], 2, b_dim[1]);
674*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&dst[l_r->ref.ref[0] - 1][is_chroma],
675*c0909341SAndroid Build Coastguard Worker t->by + y, oh4, l_r->mv.mv[0].y, ss_ver,
676*c0909341SAndroid Build Coastguard Worker &f->svc[l_r->ref.ref[0] - 1][1]);
677*c0909341SAndroid Build Coastguard Worker i++;
678*c0909341SAndroid Build Coastguard Worker }
679*c0909341SAndroid Build Coastguard Worker y += imax(l_b_dim[1], 2);
680*c0909341SAndroid Build Coastguard Worker }
681*c0909341SAndroid Build Coastguard Worker }
682*c0909341SAndroid Build Coastguard Worker
decode_b(Dav1dTaskContext * const t,const enum BlockLevel bl,const enum BlockSize bs,const enum BlockPartition bp,const enum EdgeFlags intra_edge_flags)683*c0909341SAndroid Build Coastguard Worker static int decode_b(Dav1dTaskContext *const t,
684*c0909341SAndroid Build Coastguard Worker const enum BlockLevel bl,
685*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
686*c0909341SAndroid Build Coastguard Worker const enum BlockPartition bp,
687*c0909341SAndroid Build Coastguard Worker const enum EdgeFlags intra_edge_flags) {
688*c0909341SAndroid Build Coastguard Worker Dav1dTileState *const ts = t->ts;
689*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
690*c0909341SAndroid Build Coastguard Worker Av1Block b_mem, *const b = t->frame_thread.pass ?
691*c0909341SAndroid Build Coastguard Worker &f->frame_thread.b[t->by * f->b4_stride + t->bx] : &b_mem;
692*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim = dav1d_block_dimensions[bs];
693*c0909341SAndroid Build Coastguard Worker const int bx4 = t->bx & 31, by4 = t->by & 31;
694*c0909341SAndroid Build Coastguard Worker const int ss_ver = f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
695*c0909341SAndroid Build Coastguard Worker const int ss_hor = f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
696*c0909341SAndroid Build Coastguard Worker const int cbx4 = bx4 >> ss_hor, cby4 = by4 >> ss_ver;
697*c0909341SAndroid Build Coastguard Worker const int bw4 = b_dim[0], bh4 = b_dim[1];
698*c0909341SAndroid Build Coastguard Worker const int w4 = imin(bw4, f->bw - t->bx), h4 = imin(bh4, f->bh - t->by);
699*c0909341SAndroid Build Coastguard Worker const int cbw4 = (bw4 + ss_hor) >> ss_hor, cbh4 = (bh4 + ss_ver) >> ss_ver;
700*c0909341SAndroid Build Coastguard Worker const int have_left = t->bx > ts->tiling.col_start;
701*c0909341SAndroid Build Coastguard Worker const int have_top = t->by > ts->tiling.row_start;
702*c0909341SAndroid Build Coastguard Worker const int has_chroma = f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I400 &&
703*c0909341SAndroid Build Coastguard Worker (bw4 > ss_hor || t->bx & 1) &&
704*c0909341SAndroid Build Coastguard Worker (bh4 > ss_ver || t->by & 1);
705*c0909341SAndroid Build Coastguard Worker
706*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 2) {
707*c0909341SAndroid Build Coastguard Worker if (b->intra) {
708*c0909341SAndroid Build Coastguard Worker f->bd_fn.recon_b_intra(t, bs, intra_edge_flags, b);
709*c0909341SAndroid Build Coastguard Worker
710*c0909341SAndroid Build Coastguard Worker const enum IntraPredMode y_mode_nofilt =
711*c0909341SAndroid Build Coastguard Worker b->y_mode == FILTER_PRED ? DC_PRED : b->y_mode;
712*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
713*c0909341SAndroid Build Coastguard Worker rep_macro(edge->mode, off, y_mode_nofilt); \
714*c0909341SAndroid Build Coastguard Worker rep_macro(edge->intra, off, 1)
715*c0909341SAndroid Build Coastguard Worker BlockContext *edge = t->a;
716*c0909341SAndroid Build Coastguard Worker for (int i = 0, off = bx4; i < 2; i++, off = by4, edge = &t->l) {
717*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2 + i]);
718*c0909341SAndroid Build Coastguard Worker }
719*c0909341SAndroid Build Coastguard Worker #undef set_ctx
720*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr)) {
721*c0909341SAndroid Build Coastguard Worker refmvs_block *const r = &t->rt.r[(t->by & 31) + 5 + bh4 - 1][t->bx];
722*c0909341SAndroid Build Coastguard Worker for (int x = 0; x < bw4; x++) {
723*c0909341SAndroid Build Coastguard Worker r[x].ref.ref[0] = 0;
724*c0909341SAndroid Build Coastguard Worker r[x].bs = bs;
725*c0909341SAndroid Build Coastguard Worker }
726*c0909341SAndroid Build Coastguard Worker refmvs_block *const *rr = &t->rt.r[(t->by & 31) + 5];
727*c0909341SAndroid Build Coastguard Worker for (int y = 0; y < bh4 - 1; y++) {
728*c0909341SAndroid Build Coastguard Worker rr[y][t->bx + bw4 - 1].ref.ref[0] = 0;
729*c0909341SAndroid Build Coastguard Worker rr[y][t->bx + bw4 - 1].bs = bs;
730*c0909341SAndroid Build Coastguard Worker }
731*c0909341SAndroid Build Coastguard Worker }
732*c0909341SAndroid Build Coastguard Worker
733*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
734*c0909341SAndroid Build Coastguard Worker uint8_t uv_mode = b->uv_mode;
735*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbw4)](&t->a->uvmode[cbx4], uv_mode);
736*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbh4)](&t->l.uvmode[cby4], uv_mode);
737*c0909341SAndroid Build Coastguard Worker }
738*c0909341SAndroid Build Coastguard Worker } else {
739*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) /* not intrabc */ &&
740*c0909341SAndroid Build Coastguard Worker b->comp_type == COMP_INTER_NONE && b->motion_mode == MM_WARP)
741*c0909341SAndroid Build Coastguard Worker {
742*c0909341SAndroid Build Coastguard Worker if (b->matrix[0] == SHRT_MIN) {
743*c0909341SAndroid Build Coastguard Worker t->warpmv.type = DAV1D_WM_TYPE_IDENTITY;
744*c0909341SAndroid Build Coastguard Worker } else {
745*c0909341SAndroid Build Coastguard Worker t->warpmv.type = DAV1D_WM_TYPE_AFFINE;
746*c0909341SAndroid Build Coastguard Worker t->warpmv.matrix[2] = b->matrix[0] + 0x10000;
747*c0909341SAndroid Build Coastguard Worker t->warpmv.matrix[3] = b->matrix[1];
748*c0909341SAndroid Build Coastguard Worker t->warpmv.matrix[4] = b->matrix[2];
749*c0909341SAndroid Build Coastguard Worker t->warpmv.matrix[5] = b->matrix[3] + 0x10000;
750*c0909341SAndroid Build Coastguard Worker dav1d_set_affine_mv2d(bw4, bh4, b->mv2d, &t->warpmv,
751*c0909341SAndroid Build Coastguard Worker t->bx, t->by);
752*c0909341SAndroid Build Coastguard Worker dav1d_get_shear_params(&t->warpmv);
753*c0909341SAndroid Build Coastguard Worker #define signabs(v) v < 0 ? '-' : ' ', abs(v)
754*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
755*c0909341SAndroid Build Coastguard Worker printf("[ %c%x %c%x %c%x\n %c%x %c%x %c%x ]\n"
756*c0909341SAndroid Build Coastguard Worker "alpha=%c%x, beta=%c%x, gamma=%c%x, delta=%c%x, mv=y:%d,x:%d\n",
757*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[0]),
758*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[1]),
759*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[2]),
760*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[3]),
761*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[4]),
762*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[5]),
763*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.alpha),
764*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.beta),
765*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.gamma),
766*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.delta),
767*c0909341SAndroid Build Coastguard Worker b->mv2d.y, b->mv2d.x);
768*c0909341SAndroid Build Coastguard Worker #undef signabs
769*c0909341SAndroid Build Coastguard Worker }
770*c0909341SAndroid Build Coastguard Worker }
771*c0909341SAndroid Build Coastguard Worker if (f->bd_fn.recon_b_inter(t, bs, b)) return -1;
772*c0909341SAndroid Build Coastguard Worker
773*c0909341SAndroid Build Coastguard Worker const uint8_t *const filter = dav1d_filter_dir[b->filter2d];
774*c0909341SAndroid Build Coastguard Worker BlockContext *edge = t->a;
775*c0909341SAndroid Build Coastguard Worker for (int i = 0, off = bx4; i < 2; i++, off = by4, edge = &t->l) {
776*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
777*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[0], off, filter[0]); \
778*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[1], off, filter[1]); \
779*c0909341SAndroid Build Coastguard Worker rep_macro(edge->intra, off, 0)
780*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2 + i]);
781*c0909341SAndroid Build Coastguard Worker #undef set_ctx
782*c0909341SAndroid Build Coastguard Worker }
783*c0909341SAndroid Build Coastguard Worker
784*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr)) {
785*c0909341SAndroid Build Coastguard Worker refmvs_block *const r = &t->rt.r[(t->by & 31) + 5 + bh4 - 1][t->bx];
786*c0909341SAndroid Build Coastguard Worker for (int x = 0; x < bw4; x++) {
787*c0909341SAndroid Build Coastguard Worker r[x].ref.ref[0] = b->ref[0] + 1;
788*c0909341SAndroid Build Coastguard Worker r[x].mv.mv[0] = b->mv[0];
789*c0909341SAndroid Build Coastguard Worker r[x].bs = bs;
790*c0909341SAndroid Build Coastguard Worker }
791*c0909341SAndroid Build Coastguard Worker refmvs_block *const *rr = &t->rt.r[(t->by & 31) + 5];
792*c0909341SAndroid Build Coastguard Worker for (int y = 0; y < bh4 - 1; y++) {
793*c0909341SAndroid Build Coastguard Worker rr[y][t->bx + bw4 - 1].ref.ref[0] = b->ref[0] + 1;
794*c0909341SAndroid Build Coastguard Worker rr[y][t->bx + bw4 - 1].mv.mv[0] = b->mv[0];
795*c0909341SAndroid Build Coastguard Worker rr[y][t->bx + bw4 - 1].bs = bs;
796*c0909341SAndroid Build Coastguard Worker }
797*c0909341SAndroid Build Coastguard Worker }
798*c0909341SAndroid Build Coastguard Worker
799*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
800*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbw4)](&t->a->uvmode[cbx4], DC_PRED);
801*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbh4)](&t->l.uvmode[cby4], DC_PRED);
802*c0909341SAndroid Build Coastguard Worker }
803*c0909341SAndroid Build Coastguard Worker }
804*c0909341SAndroid Build Coastguard Worker return 0;
805*c0909341SAndroid Build Coastguard Worker }
806*c0909341SAndroid Build Coastguard Worker
807*c0909341SAndroid Build Coastguard Worker const int cw4 = (w4 + ss_hor) >> ss_hor, ch4 = (h4 + ss_ver) >> ss_ver;
808*c0909341SAndroid Build Coastguard Worker
809*c0909341SAndroid Build Coastguard Worker b->bl = bl;
810*c0909341SAndroid Build Coastguard Worker b->bp = bp;
811*c0909341SAndroid Build Coastguard Worker b->bs = bs;
812*c0909341SAndroid Build Coastguard Worker
813*c0909341SAndroid Build Coastguard Worker const Dav1dSegmentationData *seg = NULL;
814*c0909341SAndroid Build Coastguard Worker
815*c0909341SAndroid Build Coastguard Worker // segment_id (if seg_feature for skip/ref/gmv is enabled)
816*c0909341SAndroid Build Coastguard Worker int seg_pred = 0;
817*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.enabled) {
818*c0909341SAndroid Build Coastguard Worker if (!f->frame_hdr->segmentation.update_map) {
819*c0909341SAndroid Build Coastguard Worker if (f->prev_segmap) {
820*c0909341SAndroid Build Coastguard Worker unsigned seg_id = get_prev_frame_segid(f, t->by, t->bx, w4, h4,
821*c0909341SAndroid Build Coastguard Worker f->prev_segmap,
822*c0909341SAndroid Build Coastguard Worker f->b4_stride);
823*c0909341SAndroid Build Coastguard Worker if (seg_id >= 8) return -1;
824*c0909341SAndroid Build Coastguard Worker b->seg_id = seg_id;
825*c0909341SAndroid Build Coastguard Worker } else {
826*c0909341SAndroid Build Coastguard Worker b->seg_id = 0;
827*c0909341SAndroid Build Coastguard Worker }
828*c0909341SAndroid Build Coastguard Worker seg = &f->frame_hdr->segmentation.seg_data.d[b->seg_id];
829*c0909341SAndroid Build Coastguard Worker } else if (f->frame_hdr->segmentation.seg_data.preskip) {
830*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.temporal &&
831*c0909341SAndroid Build Coastguard Worker (seg_pred = dav1d_msac_decode_bool_adapt(&ts->msac,
832*c0909341SAndroid Build Coastguard Worker ts->cdf.m.seg_pred[t->a->seg_pred[bx4] +
833*c0909341SAndroid Build Coastguard Worker t->l.seg_pred[by4]])))
834*c0909341SAndroid Build Coastguard Worker {
835*c0909341SAndroid Build Coastguard Worker // temporal predicted seg_id
836*c0909341SAndroid Build Coastguard Worker if (f->prev_segmap) {
837*c0909341SAndroid Build Coastguard Worker unsigned seg_id = get_prev_frame_segid(f, t->by, t->bx,
838*c0909341SAndroid Build Coastguard Worker w4, h4,
839*c0909341SAndroid Build Coastguard Worker f->prev_segmap,
840*c0909341SAndroid Build Coastguard Worker f->b4_stride);
841*c0909341SAndroid Build Coastguard Worker if (seg_id >= 8) return -1;
842*c0909341SAndroid Build Coastguard Worker b->seg_id = seg_id;
843*c0909341SAndroid Build Coastguard Worker } else {
844*c0909341SAndroid Build Coastguard Worker b->seg_id = 0;
845*c0909341SAndroid Build Coastguard Worker }
846*c0909341SAndroid Build Coastguard Worker } else {
847*c0909341SAndroid Build Coastguard Worker int seg_ctx;
848*c0909341SAndroid Build Coastguard Worker const unsigned pred_seg_id =
849*c0909341SAndroid Build Coastguard Worker get_cur_frame_segid(t->by, t->bx, have_top, have_left,
850*c0909341SAndroid Build Coastguard Worker &seg_ctx, f->cur_segmap, f->b4_stride);
851*c0909341SAndroid Build Coastguard Worker const unsigned diff = dav1d_msac_decode_symbol_adapt8(&ts->msac,
852*c0909341SAndroid Build Coastguard Worker ts->cdf.m.seg_id[seg_ctx],
853*c0909341SAndroid Build Coastguard Worker DAV1D_MAX_SEGMENTS - 1);
854*c0909341SAndroid Build Coastguard Worker const unsigned last_active_seg_id =
855*c0909341SAndroid Build Coastguard Worker f->frame_hdr->segmentation.seg_data.last_active_segid;
856*c0909341SAndroid Build Coastguard Worker b->seg_id = neg_deinterleave(diff, pred_seg_id,
857*c0909341SAndroid Build Coastguard Worker last_active_seg_id + 1);
858*c0909341SAndroid Build Coastguard Worker if (b->seg_id > last_active_seg_id) b->seg_id = 0; // error?
859*c0909341SAndroid Build Coastguard Worker if (b->seg_id >= DAV1D_MAX_SEGMENTS) b->seg_id = 0; // error?
860*c0909341SAndroid Build Coastguard Worker }
861*c0909341SAndroid Build Coastguard Worker
862*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
863*c0909341SAndroid Build Coastguard Worker printf("Post-segid[preskip;%d]: r=%d\n",
864*c0909341SAndroid Build Coastguard Worker b->seg_id, ts->msac.rng);
865*c0909341SAndroid Build Coastguard Worker
866*c0909341SAndroid Build Coastguard Worker seg = &f->frame_hdr->segmentation.seg_data.d[b->seg_id];
867*c0909341SAndroid Build Coastguard Worker }
868*c0909341SAndroid Build Coastguard Worker } else {
869*c0909341SAndroid Build Coastguard Worker b->seg_id = 0;
870*c0909341SAndroid Build Coastguard Worker }
871*c0909341SAndroid Build Coastguard Worker
872*c0909341SAndroid Build Coastguard Worker // skip_mode
873*c0909341SAndroid Build Coastguard Worker if ((!seg || (!seg->globalmv && seg->ref == -1 && !seg->skip)) &&
874*c0909341SAndroid Build Coastguard Worker f->frame_hdr->skip_mode_enabled && imin(bw4, bh4) > 1)
875*c0909341SAndroid Build Coastguard Worker {
876*c0909341SAndroid Build Coastguard Worker const int smctx = t->a->skip_mode[bx4] + t->l.skip_mode[by4];
877*c0909341SAndroid Build Coastguard Worker b->skip_mode = dav1d_msac_decode_bool_adapt(&ts->msac,
878*c0909341SAndroid Build Coastguard Worker ts->cdf.m.skip_mode[smctx]);
879*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
880*c0909341SAndroid Build Coastguard Worker printf("Post-skipmode[%d]: r=%d\n", b->skip_mode, ts->msac.rng);
881*c0909341SAndroid Build Coastguard Worker } else {
882*c0909341SAndroid Build Coastguard Worker b->skip_mode = 0;
883*c0909341SAndroid Build Coastguard Worker }
884*c0909341SAndroid Build Coastguard Worker
885*c0909341SAndroid Build Coastguard Worker // skip
886*c0909341SAndroid Build Coastguard Worker if (b->skip_mode || (seg && seg->skip)) {
887*c0909341SAndroid Build Coastguard Worker b->skip = 1;
888*c0909341SAndroid Build Coastguard Worker } else {
889*c0909341SAndroid Build Coastguard Worker const int sctx = t->a->skip[bx4] + t->l.skip[by4];
890*c0909341SAndroid Build Coastguard Worker b->skip = dav1d_msac_decode_bool_adapt(&ts->msac, ts->cdf.m.skip[sctx]);
891*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
892*c0909341SAndroid Build Coastguard Worker printf("Post-skip[%d]: r=%d\n", b->skip, ts->msac.rng);
893*c0909341SAndroid Build Coastguard Worker }
894*c0909341SAndroid Build Coastguard Worker
895*c0909341SAndroid Build Coastguard Worker // segment_id
896*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.enabled &&
897*c0909341SAndroid Build Coastguard Worker f->frame_hdr->segmentation.update_map &&
898*c0909341SAndroid Build Coastguard Worker !f->frame_hdr->segmentation.seg_data.preskip)
899*c0909341SAndroid Build Coastguard Worker {
900*c0909341SAndroid Build Coastguard Worker if (!b->skip && f->frame_hdr->segmentation.temporal &&
901*c0909341SAndroid Build Coastguard Worker (seg_pred = dav1d_msac_decode_bool_adapt(&ts->msac,
902*c0909341SAndroid Build Coastguard Worker ts->cdf.m.seg_pred[t->a->seg_pred[bx4] +
903*c0909341SAndroid Build Coastguard Worker t->l.seg_pred[by4]])))
904*c0909341SAndroid Build Coastguard Worker {
905*c0909341SAndroid Build Coastguard Worker // temporal predicted seg_id
906*c0909341SAndroid Build Coastguard Worker if (f->prev_segmap) {
907*c0909341SAndroid Build Coastguard Worker unsigned seg_id = get_prev_frame_segid(f, t->by, t->bx, w4, h4,
908*c0909341SAndroid Build Coastguard Worker f->prev_segmap,
909*c0909341SAndroid Build Coastguard Worker f->b4_stride);
910*c0909341SAndroid Build Coastguard Worker if (seg_id >= 8) return -1;
911*c0909341SAndroid Build Coastguard Worker b->seg_id = seg_id;
912*c0909341SAndroid Build Coastguard Worker } else {
913*c0909341SAndroid Build Coastguard Worker b->seg_id = 0;
914*c0909341SAndroid Build Coastguard Worker }
915*c0909341SAndroid Build Coastguard Worker } else {
916*c0909341SAndroid Build Coastguard Worker int seg_ctx;
917*c0909341SAndroid Build Coastguard Worker const unsigned pred_seg_id =
918*c0909341SAndroid Build Coastguard Worker get_cur_frame_segid(t->by, t->bx, have_top, have_left,
919*c0909341SAndroid Build Coastguard Worker &seg_ctx, f->cur_segmap, f->b4_stride);
920*c0909341SAndroid Build Coastguard Worker if (b->skip) {
921*c0909341SAndroid Build Coastguard Worker b->seg_id = pred_seg_id;
922*c0909341SAndroid Build Coastguard Worker } else {
923*c0909341SAndroid Build Coastguard Worker const unsigned diff = dav1d_msac_decode_symbol_adapt8(&ts->msac,
924*c0909341SAndroid Build Coastguard Worker ts->cdf.m.seg_id[seg_ctx],
925*c0909341SAndroid Build Coastguard Worker DAV1D_MAX_SEGMENTS - 1);
926*c0909341SAndroid Build Coastguard Worker const unsigned last_active_seg_id =
927*c0909341SAndroid Build Coastguard Worker f->frame_hdr->segmentation.seg_data.last_active_segid;
928*c0909341SAndroid Build Coastguard Worker b->seg_id = neg_deinterleave(diff, pred_seg_id,
929*c0909341SAndroid Build Coastguard Worker last_active_seg_id + 1);
930*c0909341SAndroid Build Coastguard Worker if (b->seg_id > last_active_seg_id) b->seg_id = 0; // error?
931*c0909341SAndroid Build Coastguard Worker }
932*c0909341SAndroid Build Coastguard Worker if (b->seg_id >= DAV1D_MAX_SEGMENTS) b->seg_id = 0; // error?
933*c0909341SAndroid Build Coastguard Worker }
934*c0909341SAndroid Build Coastguard Worker
935*c0909341SAndroid Build Coastguard Worker seg = &f->frame_hdr->segmentation.seg_data.d[b->seg_id];
936*c0909341SAndroid Build Coastguard Worker
937*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
938*c0909341SAndroid Build Coastguard Worker printf("Post-segid[postskip;%d]: r=%d\n",
939*c0909341SAndroid Build Coastguard Worker b->seg_id, ts->msac.rng);
940*c0909341SAndroid Build Coastguard Worker }
941*c0909341SAndroid Build Coastguard Worker
942*c0909341SAndroid Build Coastguard Worker // cdef index
943*c0909341SAndroid Build Coastguard Worker if (!b->skip) {
944*c0909341SAndroid Build Coastguard Worker const int idx = f->seq_hdr->sb128 ? ((t->bx & 16) >> 4) +
945*c0909341SAndroid Build Coastguard Worker ((t->by & 16) >> 3) : 0;
946*c0909341SAndroid Build Coastguard Worker if (t->cur_sb_cdef_idx_ptr[idx] == -1) {
947*c0909341SAndroid Build Coastguard Worker const int v = dav1d_msac_decode_bools(&ts->msac,
948*c0909341SAndroid Build Coastguard Worker f->frame_hdr->cdef.n_bits);
949*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[idx] = v;
950*c0909341SAndroid Build Coastguard Worker if (bw4 > 16) t->cur_sb_cdef_idx_ptr[idx + 1] = v;
951*c0909341SAndroid Build Coastguard Worker if (bh4 > 16) t->cur_sb_cdef_idx_ptr[idx + 2] = v;
952*c0909341SAndroid Build Coastguard Worker if (bw4 == 32 && bh4 == 32) t->cur_sb_cdef_idx_ptr[idx + 3] = v;
953*c0909341SAndroid Build Coastguard Worker
954*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
955*c0909341SAndroid Build Coastguard Worker printf("Post-cdef_idx[%d]: r=%d\n",
956*c0909341SAndroid Build Coastguard Worker *t->cur_sb_cdef_idx_ptr, ts->msac.rng);
957*c0909341SAndroid Build Coastguard Worker }
958*c0909341SAndroid Build Coastguard Worker }
959*c0909341SAndroid Build Coastguard Worker
960*c0909341SAndroid Build Coastguard Worker // delta-q/lf
961*c0909341SAndroid Build Coastguard Worker if (!(t->bx & (31 >> !f->seq_hdr->sb128)) &&
962*c0909341SAndroid Build Coastguard Worker !(t->by & (31 >> !f->seq_hdr->sb128)))
963*c0909341SAndroid Build Coastguard Worker {
964*c0909341SAndroid Build Coastguard Worker const int prev_qidx = ts->last_qidx;
965*c0909341SAndroid Build Coastguard Worker const int have_delta_q = f->frame_hdr->delta.q.present &&
966*c0909341SAndroid Build Coastguard Worker (bs != (f->seq_hdr->sb128 ? BS_128x128 : BS_64x64) || !b->skip);
967*c0909341SAndroid Build Coastguard Worker
968*c0909341SAndroid Build Coastguard Worker uint32_t prev_delta_lf = ts->last_delta_lf.u32;
969*c0909341SAndroid Build Coastguard Worker
970*c0909341SAndroid Build Coastguard Worker if (have_delta_q) {
971*c0909341SAndroid Build Coastguard Worker int delta_q = dav1d_msac_decode_symbol_adapt4(&ts->msac,
972*c0909341SAndroid Build Coastguard Worker ts->cdf.m.delta_q, 3);
973*c0909341SAndroid Build Coastguard Worker if (delta_q == 3) {
974*c0909341SAndroid Build Coastguard Worker const int n_bits = 1 + dav1d_msac_decode_bools(&ts->msac, 3);
975*c0909341SAndroid Build Coastguard Worker delta_q = dav1d_msac_decode_bools(&ts->msac, n_bits) +
976*c0909341SAndroid Build Coastguard Worker 1 + (1 << n_bits);
977*c0909341SAndroid Build Coastguard Worker }
978*c0909341SAndroid Build Coastguard Worker if (delta_q) {
979*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_equi(&ts->msac)) delta_q = -delta_q;
980*c0909341SAndroid Build Coastguard Worker delta_q *= 1 << f->frame_hdr->delta.q.res_log2;
981*c0909341SAndroid Build Coastguard Worker }
982*c0909341SAndroid Build Coastguard Worker ts->last_qidx = iclip(ts->last_qidx + delta_q, 1, 255);
983*c0909341SAndroid Build Coastguard Worker if (have_delta_q && DEBUG_BLOCK_INFO)
984*c0909341SAndroid Build Coastguard Worker printf("Post-delta_q[%d->%d]: r=%d\n",
985*c0909341SAndroid Build Coastguard Worker delta_q, ts->last_qidx, ts->msac.rng);
986*c0909341SAndroid Build Coastguard Worker
987*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->delta.lf.present) {
988*c0909341SAndroid Build Coastguard Worker const int n_lfs = f->frame_hdr->delta.lf.multi ?
989*c0909341SAndroid Build Coastguard Worker f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I400 ? 4 : 2 : 1;
990*c0909341SAndroid Build Coastguard Worker
991*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < n_lfs; i++) {
992*c0909341SAndroid Build Coastguard Worker int delta_lf = dav1d_msac_decode_symbol_adapt4(&ts->msac,
993*c0909341SAndroid Build Coastguard Worker ts->cdf.m.delta_lf[i + f->frame_hdr->delta.lf.multi], 3);
994*c0909341SAndroid Build Coastguard Worker if (delta_lf == 3) {
995*c0909341SAndroid Build Coastguard Worker const int n_bits = 1 + dav1d_msac_decode_bools(&ts->msac, 3);
996*c0909341SAndroid Build Coastguard Worker delta_lf = dav1d_msac_decode_bools(&ts->msac, n_bits) +
997*c0909341SAndroid Build Coastguard Worker 1 + (1 << n_bits);
998*c0909341SAndroid Build Coastguard Worker }
999*c0909341SAndroid Build Coastguard Worker if (delta_lf) {
1000*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_equi(&ts->msac))
1001*c0909341SAndroid Build Coastguard Worker delta_lf = -delta_lf;
1002*c0909341SAndroid Build Coastguard Worker delta_lf *= 1 << f->frame_hdr->delta.lf.res_log2;
1003*c0909341SAndroid Build Coastguard Worker }
1004*c0909341SAndroid Build Coastguard Worker ts->last_delta_lf.i8[i] =
1005*c0909341SAndroid Build Coastguard Worker iclip(ts->last_delta_lf.i8[i] + delta_lf, -63, 63);
1006*c0909341SAndroid Build Coastguard Worker if (have_delta_q && DEBUG_BLOCK_INFO)
1007*c0909341SAndroid Build Coastguard Worker printf("Post-delta_lf[%d:%d]: r=%d\n", i, delta_lf,
1008*c0909341SAndroid Build Coastguard Worker ts->msac.rng);
1009*c0909341SAndroid Build Coastguard Worker }
1010*c0909341SAndroid Build Coastguard Worker }
1011*c0909341SAndroid Build Coastguard Worker }
1012*c0909341SAndroid Build Coastguard Worker if (ts->last_qidx == f->frame_hdr->quant.yac) {
1013*c0909341SAndroid Build Coastguard Worker // assign frame-wide q values to this sb
1014*c0909341SAndroid Build Coastguard Worker ts->dq = f->dq;
1015*c0909341SAndroid Build Coastguard Worker } else if (ts->last_qidx != prev_qidx) {
1016*c0909341SAndroid Build Coastguard Worker // find sb-specific quant parameters
1017*c0909341SAndroid Build Coastguard Worker init_quant_tables(f->seq_hdr, f->frame_hdr, ts->last_qidx, ts->dqmem);
1018*c0909341SAndroid Build Coastguard Worker ts->dq = ts->dqmem;
1019*c0909341SAndroid Build Coastguard Worker }
1020*c0909341SAndroid Build Coastguard Worker if (!ts->last_delta_lf.u32) {
1021*c0909341SAndroid Build Coastguard Worker // assign frame-wide lf values to this sb
1022*c0909341SAndroid Build Coastguard Worker ts->lflvl = f->lf.lvl;
1023*c0909341SAndroid Build Coastguard Worker } else if (ts->last_delta_lf.u32 != prev_delta_lf) {
1024*c0909341SAndroid Build Coastguard Worker // find sb-specific lf lvl parameters
1025*c0909341SAndroid Build Coastguard Worker ts->lflvl = ts->lflvlmem;
1026*c0909341SAndroid Build Coastguard Worker dav1d_calc_lf_values(ts->lflvlmem, f->frame_hdr, ts->last_delta_lf.i8);
1027*c0909341SAndroid Build Coastguard Worker }
1028*c0909341SAndroid Build Coastguard Worker }
1029*c0909341SAndroid Build Coastguard Worker
1030*c0909341SAndroid Build Coastguard Worker if (b->skip_mode) {
1031*c0909341SAndroid Build Coastguard Worker b->intra = 0;
1032*c0909341SAndroid Build Coastguard Worker } else if (IS_INTER_OR_SWITCH(f->frame_hdr)) {
1033*c0909341SAndroid Build Coastguard Worker if (seg && (seg->ref >= 0 || seg->globalmv)) {
1034*c0909341SAndroid Build Coastguard Worker b->intra = !seg->ref;
1035*c0909341SAndroid Build Coastguard Worker } else {
1036*c0909341SAndroid Build Coastguard Worker const int ictx = get_intra_ctx(t->a, &t->l, by4, bx4,
1037*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1038*c0909341SAndroid Build Coastguard Worker b->intra = !dav1d_msac_decode_bool_adapt(&ts->msac,
1039*c0909341SAndroid Build Coastguard Worker ts->cdf.m.intra[ictx]);
1040*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1041*c0909341SAndroid Build Coastguard Worker printf("Post-intra[%d]: r=%d\n", b->intra, ts->msac.rng);
1042*c0909341SAndroid Build Coastguard Worker }
1043*c0909341SAndroid Build Coastguard Worker } else if (f->frame_hdr->allow_intrabc) {
1044*c0909341SAndroid Build Coastguard Worker b->intra = !dav1d_msac_decode_bool_adapt(&ts->msac, ts->cdf.m.intrabc);
1045*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1046*c0909341SAndroid Build Coastguard Worker printf("Post-intrabcflag[%d]: r=%d\n", b->intra, ts->msac.rng);
1047*c0909341SAndroid Build Coastguard Worker } else {
1048*c0909341SAndroid Build Coastguard Worker b->intra = 1;
1049*c0909341SAndroid Build Coastguard Worker }
1050*c0909341SAndroid Build Coastguard Worker
1051*c0909341SAndroid Build Coastguard Worker // intra/inter-specific stuff
1052*c0909341SAndroid Build Coastguard Worker if (b->intra) {
1053*c0909341SAndroid Build Coastguard Worker uint16_t *const ymode_cdf = IS_INTER_OR_SWITCH(f->frame_hdr) ?
1054*c0909341SAndroid Build Coastguard Worker ts->cdf.m.y_mode[dav1d_ymode_size_context[bs]] :
1055*c0909341SAndroid Build Coastguard Worker ts->cdf.kfym[dav1d_intra_mode_context[t->a->mode[bx4]]]
1056*c0909341SAndroid Build Coastguard Worker [dav1d_intra_mode_context[t->l.mode[by4]]];
1057*c0909341SAndroid Build Coastguard Worker b->y_mode = dav1d_msac_decode_symbol_adapt16(&ts->msac, ymode_cdf,
1058*c0909341SAndroid Build Coastguard Worker N_INTRA_PRED_MODES - 1);
1059*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1060*c0909341SAndroid Build Coastguard Worker printf("Post-ymode[%d]: r=%d\n", b->y_mode, ts->msac.rng);
1061*c0909341SAndroid Build Coastguard Worker
1062*c0909341SAndroid Build Coastguard Worker // angle delta
1063*c0909341SAndroid Build Coastguard Worker if (b_dim[2] + b_dim[3] >= 2 && b->y_mode >= VERT_PRED &&
1064*c0909341SAndroid Build Coastguard Worker b->y_mode <= VERT_LEFT_PRED)
1065*c0909341SAndroid Build Coastguard Worker {
1066*c0909341SAndroid Build Coastguard Worker uint16_t *const acdf = ts->cdf.m.angle_delta[b->y_mode - VERT_PRED];
1067*c0909341SAndroid Build Coastguard Worker const int angle = dav1d_msac_decode_symbol_adapt8(&ts->msac, acdf, 6);
1068*c0909341SAndroid Build Coastguard Worker b->y_angle = angle - 3;
1069*c0909341SAndroid Build Coastguard Worker } else {
1070*c0909341SAndroid Build Coastguard Worker b->y_angle = 0;
1071*c0909341SAndroid Build Coastguard Worker }
1072*c0909341SAndroid Build Coastguard Worker
1073*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1074*c0909341SAndroid Build Coastguard Worker const int cfl_allowed = f->frame_hdr->segmentation.lossless[b->seg_id] ?
1075*c0909341SAndroid Build Coastguard Worker cbw4 == 1 && cbh4 == 1 : !!(cfl_allowed_mask & (1 << bs));
1076*c0909341SAndroid Build Coastguard Worker uint16_t *const uvmode_cdf = ts->cdf.m.uv_mode[cfl_allowed][b->y_mode];
1077*c0909341SAndroid Build Coastguard Worker b->uv_mode = dav1d_msac_decode_symbol_adapt16(&ts->msac, uvmode_cdf,
1078*c0909341SAndroid Build Coastguard Worker N_UV_INTRA_PRED_MODES - 1 - !cfl_allowed);
1079*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1080*c0909341SAndroid Build Coastguard Worker printf("Post-uvmode[%d]: r=%d\n", b->uv_mode, ts->msac.rng);
1081*c0909341SAndroid Build Coastguard Worker
1082*c0909341SAndroid Build Coastguard Worker b->uv_angle = 0;
1083*c0909341SAndroid Build Coastguard Worker if (b->uv_mode == CFL_PRED) {
1084*c0909341SAndroid Build Coastguard Worker #define SIGN(a) (!!(a) + ((a) > 0))
1085*c0909341SAndroid Build Coastguard Worker const int sign = dav1d_msac_decode_symbol_adapt8(&ts->msac,
1086*c0909341SAndroid Build Coastguard Worker ts->cdf.m.cfl_sign, 7) + 1;
1087*c0909341SAndroid Build Coastguard Worker const int sign_u = sign * 0x56 >> 8, sign_v = sign - sign_u * 3;
1088*c0909341SAndroid Build Coastguard Worker assert(sign_u == sign / 3);
1089*c0909341SAndroid Build Coastguard Worker if (sign_u) {
1090*c0909341SAndroid Build Coastguard Worker const int ctx = (sign_u == 2) * 3 + sign_v;
1091*c0909341SAndroid Build Coastguard Worker b->cfl_alpha[0] = dav1d_msac_decode_symbol_adapt16(&ts->msac,
1092*c0909341SAndroid Build Coastguard Worker ts->cdf.m.cfl_alpha[ctx], 15) + 1;
1093*c0909341SAndroid Build Coastguard Worker if (sign_u == 1) b->cfl_alpha[0] = -b->cfl_alpha[0];
1094*c0909341SAndroid Build Coastguard Worker } else {
1095*c0909341SAndroid Build Coastguard Worker b->cfl_alpha[0] = 0;
1096*c0909341SAndroid Build Coastguard Worker }
1097*c0909341SAndroid Build Coastguard Worker if (sign_v) {
1098*c0909341SAndroid Build Coastguard Worker const int ctx = (sign_v == 2) * 3 + sign_u;
1099*c0909341SAndroid Build Coastguard Worker b->cfl_alpha[1] = dav1d_msac_decode_symbol_adapt16(&ts->msac,
1100*c0909341SAndroid Build Coastguard Worker ts->cdf.m.cfl_alpha[ctx], 15) + 1;
1101*c0909341SAndroid Build Coastguard Worker if (sign_v == 1) b->cfl_alpha[1] = -b->cfl_alpha[1];
1102*c0909341SAndroid Build Coastguard Worker } else {
1103*c0909341SAndroid Build Coastguard Worker b->cfl_alpha[1] = 0;
1104*c0909341SAndroid Build Coastguard Worker }
1105*c0909341SAndroid Build Coastguard Worker #undef SIGN
1106*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1107*c0909341SAndroid Build Coastguard Worker printf("Post-uvalphas[%d/%d]: r=%d\n",
1108*c0909341SAndroid Build Coastguard Worker b->cfl_alpha[0], b->cfl_alpha[1], ts->msac.rng);
1109*c0909341SAndroid Build Coastguard Worker } else if (b_dim[2] + b_dim[3] >= 2 && b->uv_mode >= VERT_PRED &&
1110*c0909341SAndroid Build Coastguard Worker b->uv_mode <= VERT_LEFT_PRED)
1111*c0909341SAndroid Build Coastguard Worker {
1112*c0909341SAndroid Build Coastguard Worker uint16_t *const acdf = ts->cdf.m.angle_delta[b->uv_mode - VERT_PRED];
1113*c0909341SAndroid Build Coastguard Worker const int angle = dav1d_msac_decode_symbol_adapt8(&ts->msac, acdf, 6);
1114*c0909341SAndroid Build Coastguard Worker b->uv_angle = angle - 3;
1115*c0909341SAndroid Build Coastguard Worker }
1116*c0909341SAndroid Build Coastguard Worker }
1117*c0909341SAndroid Build Coastguard Worker
1118*c0909341SAndroid Build Coastguard Worker b->pal_sz[0] = b->pal_sz[1] = 0;
1119*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->allow_screen_content_tools &&
1120*c0909341SAndroid Build Coastguard Worker imax(bw4, bh4) <= 16 && bw4 + bh4 >= 4)
1121*c0909341SAndroid Build Coastguard Worker {
1122*c0909341SAndroid Build Coastguard Worker const int sz_ctx = b_dim[2] + b_dim[3] - 2;
1123*c0909341SAndroid Build Coastguard Worker if (b->y_mode == DC_PRED) {
1124*c0909341SAndroid Build Coastguard Worker const int pal_ctx = (t->a->pal_sz[bx4] > 0) + (t->l.pal_sz[by4] > 0);
1125*c0909341SAndroid Build Coastguard Worker const int use_y_pal = dav1d_msac_decode_bool_adapt(&ts->msac,
1126*c0909341SAndroid Build Coastguard Worker ts->cdf.m.pal_y[sz_ctx][pal_ctx]);
1127*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1128*c0909341SAndroid Build Coastguard Worker printf("Post-y_pal[%d]: r=%d\n", use_y_pal, ts->msac.rng);
1129*c0909341SAndroid Build Coastguard Worker if (use_y_pal)
1130*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_pal_plane(t, b, 0, sz_ctx, bx4, by4);
1131*c0909341SAndroid Build Coastguard Worker }
1132*c0909341SAndroid Build Coastguard Worker
1133*c0909341SAndroid Build Coastguard Worker if (has_chroma && b->uv_mode == DC_PRED) {
1134*c0909341SAndroid Build Coastguard Worker const int pal_ctx = b->pal_sz[0] > 0;
1135*c0909341SAndroid Build Coastguard Worker const int use_uv_pal = dav1d_msac_decode_bool_adapt(&ts->msac,
1136*c0909341SAndroid Build Coastguard Worker ts->cdf.m.pal_uv[pal_ctx]);
1137*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1138*c0909341SAndroid Build Coastguard Worker printf("Post-uv_pal[%d]: r=%d\n", use_uv_pal, ts->msac.rng);
1139*c0909341SAndroid Build Coastguard Worker if (use_uv_pal) // see aomedia bug 2183 for why we use luma coordinates
1140*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_pal_uv(t, b, sz_ctx, bx4, by4);
1141*c0909341SAndroid Build Coastguard Worker }
1142*c0909341SAndroid Build Coastguard Worker }
1143*c0909341SAndroid Build Coastguard Worker
1144*c0909341SAndroid Build Coastguard Worker if (b->y_mode == DC_PRED && !b->pal_sz[0] &&
1145*c0909341SAndroid Build Coastguard Worker imax(b_dim[2], b_dim[3]) <= 3 && f->seq_hdr->filter_intra)
1146*c0909341SAndroid Build Coastguard Worker {
1147*c0909341SAndroid Build Coastguard Worker const int is_filter = dav1d_msac_decode_bool_adapt(&ts->msac,
1148*c0909341SAndroid Build Coastguard Worker ts->cdf.m.use_filter_intra[bs]);
1149*c0909341SAndroid Build Coastguard Worker if (is_filter) {
1150*c0909341SAndroid Build Coastguard Worker b->y_mode = FILTER_PRED;
1151*c0909341SAndroid Build Coastguard Worker b->y_angle = dav1d_msac_decode_symbol_adapt8(&ts->msac,
1152*c0909341SAndroid Build Coastguard Worker ts->cdf.m.filter_intra, 4);
1153*c0909341SAndroid Build Coastguard Worker }
1154*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1155*c0909341SAndroid Build Coastguard Worker printf("Post-filterintramode[%d/%d]: r=%d\n",
1156*c0909341SAndroid Build Coastguard Worker b->y_mode, b->y_angle, ts->msac.rng);
1157*c0909341SAndroid Build Coastguard Worker }
1158*c0909341SAndroid Build Coastguard Worker
1159*c0909341SAndroid Build Coastguard Worker if (b->pal_sz[0]) {
1160*c0909341SAndroid Build Coastguard Worker uint8_t *pal_idx;
1161*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass) {
1162*c0909341SAndroid Build Coastguard Worker const int p = t->frame_thread.pass & 1;
1163*c0909341SAndroid Build Coastguard Worker assert(ts->frame_thread[p].pal_idx);
1164*c0909341SAndroid Build Coastguard Worker pal_idx = ts->frame_thread[p].pal_idx;
1165*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].pal_idx += bw4 * bh4 * 8;
1166*c0909341SAndroid Build Coastguard Worker } else
1167*c0909341SAndroid Build Coastguard Worker pal_idx = t->scratch.pal_idx_y;
1168*c0909341SAndroid Build Coastguard Worker read_pal_indices(t, pal_idx, b, 0, w4, h4, bw4, bh4);
1169*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1170*c0909341SAndroid Build Coastguard Worker printf("Post-y-pal-indices: r=%d\n", ts->msac.rng);
1171*c0909341SAndroid Build Coastguard Worker }
1172*c0909341SAndroid Build Coastguard Worker
1173*c0909341SAndroid Build Coastguard Worker if (has_chroma && b->pal_sz[1]) {
1174*c0909341SAndroid Build Coastguard Worker uint8_t *pal_idx;
1175*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass) {
1176*c0909341SAndroid Build Coastguard Worker const int p = t->frame_thread.pass & 1;
1177*c0909341SAndroid Build Coastguard Worker assert(ts->frame_thread[p].pal_idx);
1178*c0909341SAndroid Build Coastguard Worker pal_idx = ts->frame_thread[p].pal_idx;
1179*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].pal_idx += cbw4 * cbh4 * 8;
1180*c0909341SAndroid Build Coastguard Worker } else
1181*c0909341SAndroid Build Coastguard Worker pal_idx = t->scratch.pal_idx_uv;
1182*c0909341SAndroid Build Coastguard Worker read_pal_indices(t, pal_idx, b, 1, cw4, ch4, cbw4, cbh4);
1183*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1184*c0909341SAndroid Build Coastguard Worker printf("Post-uv-pal-indices: r=%d\n", ts->msac.rng);
1185*c0909341SAndroid Build Coastguard Worker }
1186*c0909341SAndroid Build Coastguard Worker
1187*c0909341SAndroid Build Coastguard Worker const TxfmInfo *t_dim;
1188*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.lossless[b->seg_id]) {
1189*c0909341SAndroid Build Coastguard Worker b->tx = b->uvtx = (int) TX_4X4;
1190*c0909341SAndroid Build Coastguard Worker t_dim = &dav1d_txfm_dimensions[TX_4X4];
1191*c0909341SAndroid Build Coastguard Worker } else {
1192*c0909341SAndroid Build Coastguard Worker b->tx = dav1d_max_txfm_size_for_bs[bs][0];
1193*c0909341SAndroid Build Coastguard Worker b->uvtx = dav1d_max_txfm_size_for_bs[bs][f->cur.p.layout];
1194*c0909341SAndroid Build Coastguard Worker t_dim = &dav1d_txfm_dimensions[b->tx];
1195*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->txfm_mode == DAV1D_TX_SWITCHABLE && t_dim->max > TX_4X4) {
1196*c0909341SAndroid Build Coastguard Worker const int tctx = get_tx_ctx(t->a, &t->l, t_dim, by4, bx4);
1197*c0909341SAndroid Build Coastguard Worker uint16_t *const tx_cdf = ts->cdf.m.txsz[t_dim->max - 1][tctx];
1198*c0909341SAndroid Build Coastguard Worker int depth = dav1d_msac_decode_symbol_adapt4(&ts->msac, tx_cdf,
1199*c0909341SAndroid Build Coastguard Worker imin(t_dim->max, 2));
1200*c0909341SAndroid Build Coastguard Worker
1201*c0909341SAndroid Build Coastguard Worker while (depth--) {
1202*c0909341SAndroid Build Coastguard Worker b->tx = t_dim->sub;
1203*c0909341SAndroid Build Coastguard Worker t_dim = &dav1d_txfm_dimensions[b->tx];
1204*c0909341SAndroid Build Coastguard Worker }
1205*c0909341SAndroid Build Coastguard Worker }
1206*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1207*c0909341SAndroid Build Coastguard Worker printf("Post-tx[%d]: r=%d\n", b->tx, ts->msac.rng);
1208*c0909341SAndroid Build Coastguard Worker }
1209*c0909341SAndroid Build Coastguard Worker
1210*c0909341SAndroid Build Coastguard Worker // reconstruction
1211*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 1) {
1212*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_coef_blocks(t, bs, b);
1213*c0909341SAndroid Build Coastguard Worker } else {
1214*c0909341SAndroid Build Coastguard Worker f->bd_fn.recon_b_intra(t, bs, intra_edge_flags, b);
1215*c0909341SAndroid Build Coastguard Worker }
1216*c0909341SAndroid Build Coastguard Worker
1217*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->loopfilter.level_y[0] ||
1218*c0909341SAndroid Build Coastguard Worker f->frame_hdr->loopfilter.level_y[1])
1219*c0909341SAndroid Build Coastguard Worker {
1220*c0909341SAndroid Build Coastguard Worker dav1d_create_lf_mask_intra(t->lf_mask, f->lf.level, f->b4_stride,
1221*c0909341SAndroid Build Coastguard Worker (const uint8_t (*)[8][2])
1222*c0909341SAndroid Build Coastguard Worker &ts->lflvl[b->seg_id][0][0][0],
1223*c0909341SAndroid Build Coastguard Worker t->bx, t->by, f->w4, f->h4, bs,
1224*c0909341SAndroid Build Coastguard Worker b->tx, b->uvtx, f->cur.p.layout,
1225*c0909341SAndroid Build Coastguard Worker &t->a->tx_lpf_y[bx4], &t->l.tx_lpf_y[by4],
1226*c0909341SAndroid Build Coastguard Worker has_chroma ? &t->a->tx_lpf_uv[cbx4] : NULL,
1227*c0909341SAndroid Build Coastguard Worker has_chroma ? &t->l.tx_lpf_uv[cby4] : NULL);
1228*c0909341SAndroid Build Coastguard Worker }
1229*c0909341SAndroid Build Coastguard Worker // update contexts
1230*c0909341SAndroid Build Coastguard Worker const enum IntraPredMode y_mode_nofilt =
1231*c0909341SAndroid Build Coastguard Worker b->y_mode == FILTER_PRED ? DC_PRED : b->y_mode;
1232*c0909341SAndroid Build Coastguard Worker BlockContext *edge = t->a;
1233*c0909341SAndroid Build Coastguard Worker for (int i = 0, off = bx4; i < 2; i++, off = by4, edge = &t->l) {
1234*c0909341SAndroid Build Coastguard Worker int t_lsz = ((uint8_t *) &t_dim->lw)[i]; // lw then lh
1235*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
1236*c0909341SAndroid Build Coastguard Worker rep_macro(edge->tx_intra, off, t_lsz); \
1237*c0909341SAndroid Build Coastguard Worker rep_macro(edge->tx, off, t_lsz); \
1238*c0909341SAndroid Build Coastguard Worker rep_macro(edge->mode, off, y_mode_nofilt); \
1239*c0909341SAndroid Build Coastguard Worker rep_macro(edge->pal_sz, off, b->pal_sz[0]); \
1240*c0909341SAndroid Build Coastguard Worker rep_macro(edge->seg_pred, off, seg_pred); \
1241*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip_mode, off, 0); \
1242*c0909341SAndroid Build Coastguard Worker rep_macro(edge->intra, off, 1); \
1243*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip, off, b->skip); \
1244*c0909341SAndroid Build Coastguard Worker /* see aomedia bug 2183 for why we use luma coordinates here */ \
1245*c0909341SAndroid Build Coastguard Worker rep_macro(t->pal_sz_uv[i], off, (has_chroma ? b->pal_sz[1] : 0)); \
1246*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr)) { \
1247*c0909341SAndroid Build Coastguard Worker rep_macro(edge->comp_type, off, COMP_INTER_NONE); \
1248*c0909341SAndroid Build Coastguard Worker rep_macro(edge->ref[0], off, ((uint8_t) -1)); \
1249*c0909341SAndroid Build Coastguard Worker rep_macro(edge->ref[1], off, ((uint8_t) -1)); \
1250*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[0], off, DAV1D_N_SWITCHABLE_FILTERS); \
1251*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[1], off, DAV1D_N_SWITCHABLE_FILTERS); \
1252*c0909341SAndroid Build Coastguard Worker }
1253*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2 + i]);
1254*c0909341SAndroid Build Coastguard Worker #undef set_ctx
1255*c0909341SAndroid Build Coastguard Worker }
1256*c0909341SAndroid Build Coastguard Worker if (b->pal_sz[0])
1257*c0909341SAndroid Build Coastguard Worker f->bd_fn.copy_pal_block_y(t, bx4, by4, bw4, bh4);
1258*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1259*c0909341SAndroid Build Coastguard Worker uint8_t uv_mode = b->uv_mode;
1260*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbw4)](&t->a->uvmode[cbx4], uv_mode);
1261*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbh4)](&t->l.uvmode[cby4], uv_mode);
1262*c0909341SAndroid Build Coastguard Worker if (b->pal_sz[1])
1263*c0909341SAndroid Build Coastguard Worker f->bd_fn.copy_pal_block_uv(t, bx4, by4, bw4, bh4);
1264*c0909341SAndroid Build Coastguard Worker }
1265*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) || f->frame_hdr->allow_intrabc)
1266*c0909341SAndroid Build Coastguard Worker splat_intraref(f->c, t, bs, bw4, bh4);
1267*c0909341SAndroid Build Coastguard Worker } else if (IS_KEY_OR_INTRA(f->frame_hdr)) {
1268*c0909341SAndroid Build Coastguard Worker // intra block copy
1269*c0909341SAndroid Build Coastguard Worker refmvs_candidate mvstack[8];
1270*c0909341SAndroid Build Coastguard Worker int n_mvs, ctx;
1271*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_find(&t->rt, mvstack, &n_mvs, &ctx,
1272*c0909341SAndroid Build Coastguard Worker (union refmvs_refpair) { .ref = { 0, -1 }},
1273*c0909341SAndroid Build Coastguard Worker bs, intra_edge_flags, t->by, t->bx);
1274*c0909341SAndroid Build Coastguard Worker
1275*c0909341SAndroid Build Coastguard Worker if (mvstack[0].mv.mv[0].n)
1276*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[0].mv.mv[0];
1277*c0909341SAndroid Build Coastguard Worker else if (mvstack[1].mv.mv[0].n)
1278*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[1].mv.mv[0];
1279*c0909341SAndroid Build Coastguard Worker else {
1280*c0909341SAndroid Build Coastguard Worker if (t->by - (16 << f->seq_hdr->sb128) < ts->tiling.row_start) {
1281*c0909341SAndroid Build Coastguard Worker b->mv[0].y = 0;
1282*c0909341SAndroid Build Coastguard Worker b->mv[0].x = -(512 << f->seq_hdr->sb128) - 2048;
1283*c0909341SAndroid Build Coastguard Worker } else {
1284*c0909341SAndroid Build Coastguard Worker b->mv[0].y = -(512 << f->seq_hdr->sb128);
1285*c0909341SAndroid Build Coastguard Worker b->mv[0].x = 0;
1286*c0909341SAndroid Build Coastguard Worker }
1287*c0909341SAndroid Build Coastguard Worker }
1288*c0909341SAndroid Build Coastguard Worker
1289*c0909341SAndroid Build Coastguard Worker const union mv ref = b->mv[0];
1290*c0909341SAndroid Build Coastguard Worker read_mv_residual(ts, &b->mv[0], -1);
1291*c0909341SAndroid Build Coastguard Worker
1292*c0909341SAndroid Build Coastguard Worker // clip intrabc motion vector to decoded parts of current tile
1293*c0909341SAndroid Build Coastguard Worker int border_left = ts->tiling.col_start * 4;
1294*c0909341SAndroid Build Coastguard Worker int border_top = ts->tiling.row_start * 4;
1295*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1296*c0909341SAndroid Build Coastguard Worker if (bw4 < 2 && ss_hor)
1297*c0909341SAndroid Build Coastguard Worker border_left += 4;
1298*c0909341SAndroid Build Coastguard Worker if (bh4 < 2 && ss_ver)
1299*c0909341SAndroid Build Coastguard Worker border_top += 4;
1300*c0909341SAndroid Build Coastguard Worker }
1301*c0909341SAndroid Build Coastguard Worker int src_left = t->bx * 4 + (b->mv[0].x >> 3);
1302*c0909341SAndroid Build Coastguard Worker int src_top = t->by * 4 + (b->mv[0].y >> 3);
1303*c0909341SAndroid Build Coastguard Worker int src_right = src_left + bw4 * 4;
1304*c0909341SAndroid Build Coastguard Worker int src_bottom = src_top + bh4 * 4;
1305*c0909341SAndroid Build Coastguard Worker const int border_right = ((ts->tiling.col_end + (bw4 - 1)) & ~(bw4 - 1)) * 4;
1306*c0909341SAndroid Build Coastguard Worker
1307*c0909341SAndroid Build Coastguard Worker // check against left or right tile boundary and adjust if necessary
1308*c0909341SAndroid Build Coastguard Worker if (src_left < border_left) {
1309*c0909341SAndroid Build Coastguard Worker src_right += border_left - src_left;
1310*c0909341SAndroid Build Coastguard Worker src_left += border_left - src_left;
1311*c0909341SAndroid Build Coastguard Worker } else if (src_right > border_right) {
1312*c0909341SAndroid Build Coastguard Worker src_left -= src_right - border_right;
1313*c0909341SAndroid Build Coastguard Worker src_right -= src_right - border_right;
1314*c0909341SAndroid Build Coastguard Worker }
1315*c0909341SAndroid Build Coastguard Worker // check against top tile boundary and adjust if necessary
1316*c0909341SAndroid Build Coastguard Worker if (src_top < border_top) {
1317*c0909341SAndroid Build Coastguard Worker src_bottom += border_top - src_top;
1318*c0909341SAndroid Build Coastguard Worker src_top += border_top - src_top;
1319*c0909341SAndroid Build Coastguard Worker }
1320*c0909341SAndroid Build Coastguard Worker
1321*c0909341SAndroid Build Coastguard Worker const int sbx = (t->bx >> (4 + f->seq_hdr->sb128)) << (6 + f->seq_hdr->sb128);
1322*c0909341SAndroid Build Coastguard Worker const int sby = (t->by >> (4 + f->seq_hdr->sb128)) << (6 + f->seq_hdr->sb128);
1323*c0909341SAndroid Build Coastguard Worker const int sb_size = 1 << (6 + f->seq_hdr->sb128);
1324*c0909341SAndroid Build Coastguard Worker // check for overlap with current superblock
1325*c0909341SAndroid Build Coastguard Worker if (src_bottom > sby && src_right > sbx) {
1326*c0909341SAndroid Build Coastguard Worker if (src_top - border_top >= src_bottom - sby) {
1327*c0909341SAndroid Build Coastguard Worker // if possible move src up into the previous suberblock row
1328*c0909341SAndroid Build Coastguard Worker src_top -= src_bottom - sby;
1329*c0909341SAndroid Build Coastguard Worker src_bottom -= src_bottom - sby;
1330*c0909341SAndroid Build Coastguard Worker } else if (src_left - border_left >= src_right - sbx) {
1331*c0909341SAndroid Build Coastguard Worker // if possible move src left into the previous suberblock
1332*c0909341SAndroid Build Coastguard Worker src_left -= src_right - sbx;
1333*c0909341SAndroid Build Coastguard Worker src_right -= src_right - sbx;
1334*c0909341SAndroid Build Coastguard Worker }
1335*c0909341SAndroid Build Coastguard Worker }
1336*c0909341SAndroid Build Coastguard Worker // move src up if it is below current superblock row
1337*c0909341SAndroid Build Coastguard Worker if (src_bottom > sby + sb_size) {
1338*c0909341SAndroid Build Coastguard Worker src_top -= src_bottom - (sby + sb_size);
1339*c0909341SAndroid Build Coastguard Worker src_bottom -= src_bottom - (sby + sb_size);
1340*c0909341SAndroid Build Coastguard Worker }
1341*c0909341SAndroid Build Coastguard Worker // error out if mv still overlaps with the current superblock
1342*c0909341SAndroid Build Coastguard Worker if (src_bottom > sby && src_right > sbx)
1343*c0909341SAndroid Build Coastguard Worker return -1;
1344*c0909341SAndroid Build Coastguard Worker
1345*c0909341SAndroid Build Coastguard Worker b->mv[0].x = (src_left - t->bx * 4) * 8;
1346*c0909341SAndroid Build Coastguard Worker b->mv[0].y = (src_top - t->by * 4) * 8;
1347*c0909341SAndroid Build Coastguard Worker
1348*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1349*c0909341SAndroid Build Coastguard Worker printf("Post-dmv[%d/%d,ref=%d/%d|%d/%d]: r=%d\n",
1350*c0909341SAndroid Build Coastguard Worker b->mv[0].y, b->mv[0].x, ref.y, ref.x,
1351*c0909341SAndroid Build Coastguard Worker mvstack[0].mv.mv[0].y, mvstack[0].mv.mv[0].x, ts->msac.rng);
1352*c0909341SAndroid Build Coastguard Worker read_vartx_tree(t, b, bs, bx4, by4);
1353*c0909341SAndroid Build Coastguard Worker
1354*c0909341SAndroid Build Coastguard Worker // reconstruction
1355*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 1) {
1356*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_coef_blocks(t, bs, b);
1357*c0909341SAndroid Build Coastguard Worker b->filter2d = FILTER_2D_BILINEAR;
1358*c0909341SAndroid Build Coastguard Worker } else {
1359*c0909341SAndroid Build Coastguard Worker if (f->bd_fn.recon_b_inter(t, bs, b)) return -1;
1360*c0909341SAndroid Build Coastguard Worker }
1361*c0909341SAndroid Build Coastguard Worker
1362*c0909341SAndroid Build Coastguard Worker splat_intrabc_mv(f->c, t, bs, b, bw4, bh4);
1363*c0909341SAndroid Build Coastguard Worker BlockContext *edge = t->a;
1364*c0909341SAndroid Build Coastguard Worker for (int i = 0, off = bx4; i < 2; i++, off = by4, edge = &t->l) {
1365*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
1366*c0909341SAndroid Build Coastguard Worker rep_macro(edge->tx_intra, off, b_dim[2 + i]); \
1367*c0909341SAndroid Build Coastguard Worker rep_macro(edge->mode, off, DC_PRED); \
1368*c0909341SAndroid Build Coastguard Worker rep_macro(edge->pal_sz, off, 0); \
1369*c0909341SAndroid Build Coastguard Worker /* see aomedia bug 2183 for why this is outside if (has_chroma) */ \
1370*c0909341SAndroid Build Coastguard Worker rep_macro(t->pal_sz_uv[i], off, 0); \
1371*c0909341SAndroid Build Coastguard Worker rep_macro(edge->seg_pred, off, seg_pred); \
1372*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip_mode, off, 0); \
1373*c0909341SAndroid Build Coastguard Worker rep_macro(edge->intra, off, 0); \
1374*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip, off, b->skip)
1375*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2 + i]);
1376*c0909341SAndroid Build Coastguard Worker #undef set_ctx
1377*c0909341SAndroid Build Coastguard Worker }
1378*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1379*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbw4)](&t->a->uvmode[cbx4], DC_PRED);
1380*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbh4)](&t->l.uvmode[cby4], DC_PRED);
1381*c0909341SAndroid Build Coastguard Worker }
1382*c0909341SAndroid Build Coastguard Worker } else {
1383*c0909341SAndroid Build Coastguard Worker // inter-specific mode/mv coding
1384*c0909341SAndroid Build Coastguard Worker int is_comp, has_subpel_filter;
1385*c0909341SAndroid Build Coastguard Worker
1386*c0909341SAndroid Build Coastguard Worker if (b->skip_mode) {
1387*c0909341SAndroid Build Coastguard Worker is_comp = 1;
1388*c0909341SAndroid Build Coastguard Worker } else if ((!seg || (seg->ref == -1 && !seg->globalmv && !seg->skip)) &&
1389*c0909341SAndroid Build Coastguard Worker f->frame_hdr->switchable_comp_refs && imin(bw4, bh4) > 1)
1390*c0909341SAndroid Build Coastguard Worker {
1391*c0909341SAndroid Build Coastguard Worker const int ctx = get_comp_ctx(t->a, &t->l, by4, bx4,
1392*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1393*c0909341SAndroid Build Coastguard Worker is_comp = dav1d_msac_decode_bool_adapt(&ts->msac,
1394*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp[ctx]);
1395*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1396*c0909341SAndroid Build Coastguard Worker printf("Post-compflag[%d]: r=%d\n", is_comp, ts->msac.rng);
1397*c0909341SAndroid Build Coastguard Worker } else {
1398*c0909341SAndroid Build Coastguard Worker is_comp = 0;
1399*c0909341SAndroid Build Coastguard Worker }
1400*c0909341SAndroid Build Coastguard Worker
1401*c0909341SAndroid Build Coastguard Worker if (b->skip_mode) {
1402*c0909341SAndroid Build Coastguard Worker b->ref[0] = f->frame_hdr->skip_mode_refs[0];
1403*c0909341SAndroid Build Coastguard Worker b->ref[1] = f->frame_hdr->skip_mode_refs[1];
1404*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_AVG;
1405*c0909341SAndroid Build Coastguard Worker b->inter_mode = NEARESTMV_NEARESTMV;
1406*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEAREST_DRL;
1407*c0909341SAndroid Build Coastguard Worker has_subpel_filter = 0;
1408*c0909341SAndroid Build Coastguard Worker
1409*c0909341SAndroid Build Coastguard Worker refmvs_candidate mvstack[8];
1410*c0909341SAndroid Build Coastguard Worker int n_mvs, ctx;
1411*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_find(&t->rt, mvstack, &n_mvs, &ctx,
1412*c0909341SAndroid Build Coastguard Worker (union refmvs_refpair) { .ref = {
1413*c0909341SAndroid Build Coastguard Worker b->ref[0] + 1, b->ref[1] + 1 }},
1414*c0909341SAndroid Build Coastguard Worker bs, intra_edge_flags, t->by, t->bx);
1415*c0909341SAndroid Build Coastguard Worker
1416*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[0].mv.mv[0];
1417*c0909341SAndroid Build Coastguard Worker b->mv[1] = mvstack[0].mv.mv[1];
1418*c0909341SAndroid Build Coastguard Worker fix_mv_precision(f->frame_hdr, &b->mv[0]);
1419*c0909341SAndroid Build Coastguard Worker fix_mv_precision(f->frame_hdr, &b->mv[1]);
1420*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1421*c0909341SAndroid Build Coastguard Worker printf("Post-skipmodeblock[mv=1:y=%d,x=%d,2:y=%d,x=%d,refs=%d+%d\n",
1422*c0909341SAndroid Build Coastguard Worker b->mv[0].y, b->mv[0].x, b->mv[1].y, b->mv[1].x,
1423*c0909341SAndroid Build Coastguard Worker b->ref[0], b->ref[1]);
1424*c0909341SAndroid Build Coastguard Worker } else if (is_comp) {
1425*c0909341SAndroid Build Coastguard Worker const int dir_ctx = get_comp_dir_ctx(t->a, &t->l, by4, bx4,
1426*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1427*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1428*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_dir[dir_ctx]))
1429*c0909341SAndroid Build Coastguard Worker {
1430*c0909341SAndroid Build Coastguard Worker // bidir - first reference (fw)
1431*c0909341SAndroid Build Coastguard Worker const int ctx1 = av1_get_fwd_ref_ctx(t->a, &t->l, by4, bx4,
1432*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1433*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1434*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_fwd_ref[0][ctx1]))
1435*c0909341SAndroid Build Coastguard Worker {
1436*c0909341SAndroid Build Coastguard Worker const int ctx2 = av1_get_fwd_ref_2_ctx(t->a, &t->l, by4, bx4,
1437*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1438*c0909341SAndroid Build Coastguard Worker b->ref[0] = 2 + dav1d_msac_decode_bool_adapt(&ts->msac,
1439*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_fwd_ref[2][ctx2]);
1440*c0909341SAndroid Build Coastguard Worker } else {
1441*c0909341SAndroid Build Coastguard Worker const int ctx2 = av1_get_fwd_ref_1_ctx(t->a, &t->l, by4, bx4,
1442*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1443*c0909341SAndroid Build Coastguard Worker b->ref[0] = dav1d_msac_decode_bool_adapt(&ts->msac,
1444*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_fwd_ref[1][ctx2]);
1445*c0909341SAndroid Build Coastguard Worker }
1446*c0909341SAndroid Build Coastguard Worker
1447*c0909341SAndroid Build Coastguard Worker // second reference (bw)
1448*c0909341SAndroid Build Coastguard Worker const int ctx3 = av1_get_bwd_ref_ctx(t->a, &t->l, by4, bx4,
1449*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1450*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1451*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_bwd_ref[0][ctx3]))
1452*c0909341SAndroid Build Coastguard Worker {
1453*c0909341SAndroid Build Coastguard Worker b->ref[1] = 6;
1454*c0909341SAndroid Build Coastguard Worker } else {
1455*c0909341SAndroid Build Coastguard Worker const int ctx4 = av1_get_bwd_ref_1_ctx(t->a, &t->l, by4, bx4,
1456*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1457*c0909341SAndroid Build Coastguard Worker b->ref[1] = 4 + dav1d_msac_decode_bool_adapt(&ts->msac,
1458*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_bwd_ref[1][ctx4]);
1459*c0909341SAndroid Build Coastguard Worker }
1460*c0909341SAndroid Build Coastguard Worker } else {
1461*c0909341SAndroid Build Coastguard Worker // unidir
1462*c0909341SAndroid Build Coastguard Worker const int uctx_p = av1_get_uni_p_ctx(t->a, &t->l, by4, bx4,
1463*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1464*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1465*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_uni_ref[0][uctx_p]))
1466*c0909341SAndroid Build Coastguard Worker {
1467*c0909341SAndroid Build Coastguard Worker b->ref[0] = 4;
1468*c0909341SAndroid Build Coastguard Worker b->ref[1] = 6;
1469*c0909341SAndroid Build Coastguard Worker } else {
1470*c0909341SAndroid Build Coastguard Worker const int uctx_p1 = av1_get_uni_p1_ctx(t->a, &t->l, by4, bx4,
1471*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1472*c0909341SAndroid Build Coastguard Worker b->ref[0] = 0;
1473*c0909341SAndroid Build Coastguard Worker b->ref[1] = 1 + dav1d_msac_decode_bool_adapt(&ts->msac,
1474*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_uni_ref[1][uctx_p1]);
1475*c0909341SAndroid Build Coastguard Worker if (b->ref[1] == 2) {
1476*c0909341SAndroid Build Coastguard Worker const int uctx_p2 = av1_get_uni_p2_ctx(t->a, &t->l, by4, bx4,
1477*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1478*c0909341SAndroid Build Coastguard Worker b->ref[1] += dav1d_msac_decode_bool_adapt(&ts->msac,
1479*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_uni_ref[2][uctx_p2]);
1480*c0909341SAndroid Build Coastguard Worker }
1481*c0909341SAndroid Build Coastguard Worker }
1482*c0909341SAndroid Build Coastguard Worker }
1483*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1484*c0909341SAndroid Build Coastguard Worker printf("Post-refs[%d/%d]: r=%d\n",
1485*c0909341SAndroid Build Coastguard Worker b->ref[0], b->ref[1], ts->msac.rng);
1486*c0909341SAndroid Build Coastguard Worker
1487*c0909341SAndroid Build Coastguard Worker refmvs_candidate mvstack[8];
1488*c0909341SAndroid Build Coastguard Worker int n_mvs, ctx;
1489*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_find(&t->rt, mvstack, &n_mvs, &ctx,
1490*c0909341SAndroid Build Coastguard Worker (union refmvs_refpair) { .ref = {
1491*c0909341SAndroid Build Coastguard Worker b->ref[0] + 1, b->ref[1] + 1 }},
1492*c0909341SAndroid Build Coastguard Worker bs, intra_edge_flags, t->by, t->bx);
1493*c0909341SAndroid Build Coastguard Worker
1494*c0909341SAndroid Build Coastguard Worker b->inter_mode = dav1d_msac_decode_symbol_adapt8(&ts->msac,
1495*c0909341SAndroid Build Coastguard Worker ts->cdf.m.comp_inter_mode[ctx],
1496*c0909341SAndroid Build Coastguard Worker N_COMP_INTER_PRED_MODES - 1);
1497*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1498*c0909341SAndroid Build Coastguard Worker printf("Post-compintermode[%d,ctx=%d,n_mvs=%d]: r=%d\n",
1499*c0909341SAndroid Build Coastguard Worker b->inter_mode, ctx, n_mvs, ts->msac.rng);
1500*c0909341SAndroid Build Coastguard Worker
1501*c0909341SAndroid Build Coastguard Worker const uint8_t *const im = dav1d_comp_inter_pred_modes[b->inter_mode];
1502*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEAREST_DRL;
1503*c0909341SAndroid Build Coastguard Worker if (b->inter_mode == NEWMV_NEWMV) {
1504*c0909341SAndroid Build Coastguard Worker if (n_mvs > 1) { // NEARER, NEAR or NEARISH
1505*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v1 = get_drl_context(mvstack, 0);
1506*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1507*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v1]);
1508*c0909341SAndroid Build Coastguard Worker if (b->drl_idx == NEARER_DRL && n_mvs > 2) {
1509*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v2 = get_drl_context(mvstack, 1);
1510*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1511*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v2]);
1512*c0909341SAndroid Build Coastguard Worker }
1513*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1514*c0909341SAndroid Build Coastguard Worker printf("Post-drlidx[%d,n_mvs=%d]: r=%d\n",
1515*c0909341SAndroid Build Coastguard Worker b->drl_idx, n_mvs, ts->msac.rng);
1516*c0909341SAndroid Build Coastguard Worker }
1517*c0909341SAndroid Build Coastguard Worker } else if (im[0] == NEARMV || im[1] == NEARMV) {
1518*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEARER_DRL;
1519*c0909341SAndroid Build Coastguard Worker if (n_mvs > 2) { // NEAR or NEARISH
1520*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v2 = get_drl_context(mvstack, 1);
1521*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1522*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v2]);
1523*c0909341SAndroid Build Coastguard Worker if (b->drl_idx == NEAR_DRL && n_mvs > 3) {
1524*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v3 = get_drl_context(mvstack, 2);
1525*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1526*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v3]);
1527*c0909341SAndroid Build Coastguard Worker }
1528*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1529*c0909341SAndroid Build Coastguard Worker printf("Post-drlidx[%d,n_mvs=%d]: r=%d\n",
1530*c0909341SAndroid Build Coastguard Worker b->drl_idx, n_mvs, ts->msac.rng);
1531*c0909341SAndroid Build Coastguard Worker }
1532*c0909341SAndroid Build Coastguard Worker }
1533*c0909341SAndroid Build Coastguard Worker assert(b->drl_idx >= NEAREST_DRL && b->drl_idx <= NEARISH_DRL);
1534*c0909341SAndroid Build Coastguard Worker
1535*c0909341SAndroid Build Coastguard Worker #define assign_comp_mv(idx) \
1536*c0909341SAndroid Build Coastguard Worker switch (im[idx]) { \
1537*c0909341SAndroid Build Coastguard Worker case NEARMV: \
1538*c0909341SAndroid Build Coastguard Worker case NEARESTMV: \
1539*c0909341SAndroid Build Coastguard Worker b->mv[idx] = mvstack[b->drl_idx].mv.mv[idx]; \
1540*c0909341SAndroid Build Coastguard Worker fix_mv_precision(f->frame_hdr, &b->mv[idx]); \
1541*c0909341SAndroid Build Coastguard Worker break; \
1542*c0909341SAndroid Build Coastguard Worker case GLOBALMV: \
1543*c0909341SAndroid Build Coastguard Worker has_subpel_filter |= \
1544*c0909341SAndroid Build Coastguard Worker f->frame_hdr->gmv[b->ref[idx]].type == DAV1D_WM_TYPE_TRANSLATION; \
1545*c0909341SAndroid Build Coastguard Worker b->mv[idx] = get_gmv_2d(&f->frame_hdr->gmv[b->ref[idx]], \
1546*c0909341SAndroid Build Coastguard Worker t->bx, t->by, bw4, bh4, f->frame_hdr); \
1547*c0909341SAndroid Build Coastguard Worker break; \
1548*c0909341SAndroid Build Coastguard Worker case NEWMV: \
1549*c0909341SAndroid Build Coastguard Worker b->mv[idx] = mvstack[b->drl_idx].mv.mv[idx]; \
1550*c0909341SAndroid Build Coastguard Worker const int mv_prec = f->frame_hdr->hp - f->frame_hdr->force_integer_mv; \
1551*c0909341SAndroid Build Coastguard Worker read_mv_residual(ts, &b->mv[idx], mv_prec); \
1552*c0909341SAndroid Build Coastguard Worker break; \
1553*c0909341SAndroid Build Coastguard Worker }
1554*c0909341SAndroid Build Coastguard Worker has_subpel_filter = imin(bw4, bh4) == 1 ||
1555*c0909341SAndroid Build Coastguard Worker b->inter_mode != GLOBALMV_GLOBALMV;
1556*c0909341SAndroid Build Coastguard Worker assign_comp_mv(0);
1557*c0909341SAndroid Build Coastguard Worker assign_comp_mv(1);
1558*c0909341SAndroid Build Coastguard Worker #undef assign_comp_mv
1559*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1560*c0909341SAndroid Build Coastguard Worker printf("Post-residual_mv[1:y=%d,x=%d,2:y=%d,x=%d]: r=%d\n",
1561*c0909341SAndroid Build Coastguard Worker b->mv[0].y, b->mv[0].x, b->mv[1].y, b->mv[1].x,
1562*c0909341SAndroid Build Coastguard Worker ts->msac.rng);
1563*c0909341SAndroid Build Coastguard Worker
1564*c0909341SAndroid Build Coastguard Worker // jnt_comp vs. seg vs. wedge
1565*c0909341SAndroid Build Coastguard Worker int is_segwedge = 0;
1566*c0909341SAndroid Build Coastguard Worker if (f->seq_hdr->masked_compound) {
1567*c0909341SAndroid Build Coastguard Worker const int mask_ctx = get_mask_comp_ctx(t->a, &t->l, by4, bx4);
1568*c0909341SAndroid Build Coastguard Worker
1569*c0909341SAndroid Build Coastguard Worker is_segwedge = dav1d_msac_decode_bool_adapt(&ts->msac,
1570*c0909341SAndroid Build Coastguard Worker ts->cdf.m.mask_comp[mask_ctx]);
1571*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1572*c0909341SAndroid Build Coastguard Worker printf("Post-segwedge_vs_jntavg[%d,ctx=%d]: r=%d\n",
1573*c0909341SAndroid Build Coastguard Worker is_segwedge, mask_ctx, ts->msac.rng);
1574*c0909341SAndroid Build Coastguard Worker }
1575*c0909341SAndroid Build Coastguard Worker
1576*c0909341SAndroid Build Coastguard Worker if (!is_segwedge) {
1577*c0909341SAndroid Build Coastguard Worker if (f->seq_hdr->jnt_comp) {
1578*c0909341SAndroid Build Coastguard Worker const int jnt_ctx =
1579*c0909341SAndroid Build Coastguard Worker get_jnt_comp_ctx(f->seq_hdr->order_hint_n_bits,
1580*c0909341SAndroid Build Coastguard Worker f->cur.frame_hdr->frame_offset,
1581*c0909341SAndroid Build Coastguard Worker f->refp[b->ref[0]].p.frame_hdr->frame_offset,
1582*c0909341SAndroid Build Coastguard Worker f->refp[b->ref[1]].p.frame_hdr->frame_offset,
1583*c0909341SAndroid Build Coastguard Worker t->a, &t->l, by4, bx4);
1584*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_WEIGHTED_AVG +
1585*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
1586*c0909341SAndroid Build Coastguard Worker ts->cdf.m.jnt_comp[jnt_ctx]);
1587*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1588*c0909341SAndroid Build Coastguard Worker printf("Post-jnt_comp[%d,ctx=%d[ac:%d,ar:%d,lc:%d,lr:%d]]: r=%d\n",
1589*c0909341SAndroid Build Coastguard Worker b->comp_type == COMP_INTER_AVG,
1590*c0909341SAndroid Build Coastguard Worker jnt_ctx, t->a->comp_type[bx4], t->a->ref[0][bx4],
1591*c0909341SAndroid Build Coastguard Worker t->l.comp_type[by4], t->l.ref[0][by4],
1592*c0909341SAndroid Build Coastguard Worker ts->msac.rng);
1593*c0909341SAndroid Build Coastguard Worker } else {
1594*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_AVG;
1595*c0909341SAndroid Build Coastguard Worker }
1596*c0909341SAndroid Build Coastguard Worker } else {
1597*c0909341SAndroid Build Coastguard Worker if (wedge_allowed_mask & (1 << bs)) {
1598*c0909341SAndroid Build Coastguard Worker const int ctx = dav1d_wedge_ctx_lut[bs];
1599*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_WEDGE -
1600*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
1601*c0909341SAndroid Build Coastguard Worker ts->cdf.m.wedge_comp[ctx]);
1602*c0909341SAndroid Build Coastguard Worker if (b->comp_type == COMP_INTER_WEDGE)
1603*c0909341SAndroid Build Coastguard Worker b->wedge_idx = dav1d_msac_decode_symbol_adapt16(&ts->msac,
1604*c0909341SAndroid Build Coastguard Worker ts->cdf.m.wedge_idx[ctx], 15);
1605*c0909341SAndroid Build Coastguard Worker } else {
1606*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_SEG;
1607*c0909341SAndroid Build Coastguard Worker }
1608*c0909341SAndroid Build Coastguard Worker b->mask_sign = dav1d_msac_decode_bool_equi(&ts->msac);
1609*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1610*c0909341SAndroid Build Coastguard Worker printf("Post-seg/wedge[%d,wedge_idx=%d,sign=%d]: r=%d\n",
1611*c0909341SAndroid Build Coastguard Worker b->comp_type == COMP_INTER_WEDGE,
1612*c0909341SAndroid Build Coastguard Worker b->wedge_idx, b->mask_sign, ts->msac.rng);
1613*c0909341SAndroid Build Coastguard Worker }
1614*c0909341SAndroid Build Coastguard Worker } else {
1615*c0909341SAndroid Build Coastguard Worker b->comp_type = COMP_INTER_NONE;
1616*c0909341SAndroid Build Coastguard Worker
1617*c0909341SAndroid Build Coastguard Worker // ref
1618*c0909341SAndroid Build Coastguard Worker if (seg && seg->ref > 0) {
1619*c0909341SAndroid Build Coastguard Worker b->ref[0] = seg->ref - 1;
1620*c0909341SAndroid Build Coastguard Worker } else if (seg && (seg->globalmv || seg->skip)) {
1621*c0909341SAndroid Build Coastguard Worker b->ref[0] = 0;
1622*c0909341SAndroid Build Coastguard Worker } else {
1623*c0909341SAndroid Build Coastguard Worker const int ctx1 = av1_get_ref_ctx(t->a, &t->l, by4, bx4,
1624*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1625*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1626*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[0][ctx1]))
1627*c0909341SAndroid Build Coastguard Worker {
1628*c0909341SAndroid Build Coastguard Worker const int ctx2 = av1_get_ref_2_ctx(t->a, &t->l, by4, bx4,
1629*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1630*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1631*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[1][ctx2]))
1632*c0909341SAndroid Build Coastguard Worker {
1633*c0909341SAndroid Build Coastguard Worker b->ref[0] = 6;
1634*c0909341SAndroid Build Coastguard Worker } else {
1635*c0909341SAndroid Build Coastguard Worker const int ctx3 = av1_get_ref_6_ctx(t->a, &t->l, by4, bx4,
1636*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1637*c0909341SAndroid Build Coastguard Worker b->ref[0] = 4 + dav1d_msac_decode_bool_adapt(&ts->msac,
1638*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[5][ctx3]);
1639*c0909341SAndroid Build Coastguard Worker }
1640*c0909341SAndroid Build Coastguard Worker } else {
1641*c0909341SAndroid Build Coastguard Worker const int ctx2 = av1_get_ref_3_ctx(t->a, &t->l, by4, bx4,
1642*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1643*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1644*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[2][ctx2]))
1645*c0909341SAndroid Build Coastguard Worker {
1646*c0909341SAndroid Build Coastguard Worker const int ctx3 = av1_get_ref_5_ctx(t->a, &t->l, by4, bx4,
1647*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1648*c0909341SAndroid Build Coastguard Worker b->ref[0] = 2 + dav1d_msac_decode_bool_adapt(&ts->msac,
1649*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[4][ctx3]);
1650*c0909341SAndroid Build Coastguard Worker } else {
1651*c0909341SAndroid Build Coastguard Worker const int ctx3 = av1_get_ref_4_ctx(t->a, &t->l, by4, bx4,
1652*c0909341SAndroid Build Coastguard Worker have_top, have_left);
1653*c0909341SAndroid Build Coastguard Worker b->ref[0] = dav1d_msac_decode_bool_adapt(&ts->msac,
1654*c0909341SAndroid Build Coastguard Worker ts->cdf.m.ref[3][ctx3]);
1655*c0909341SAndroid Build Coastguard Worker }
1656*c0909341SAndroid Build Coastguard Worker }
1657*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1658*c0909341SAndroid Build Coastguard Worker printf("Post-ref[%d]: r=%d\n", b->ref[0], ts->msac.rng);
1659*c0909341SAndroid Build Coastguard Worker }
1660*c0909341SAndroid Build Coastguard Worker b->ref[1] = -1;
1661*c0909341SAndroid Build Coastguard Worker
1662*c0909341SAndroid Build Coastguard Worker refmvs_candidate mvstack[8];
1663*c0909341SAndroid Build Coastguard Worker int n_mvs, ctx;
1664*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_find(&t->rt, mvstack, &n_mvs, &ctx,
1665*c0909341SAndroid Build Coastguard Worker (union refmvs_refpair) { .ref = { b->ref[0] + 1, -1 }},
1666*c0909341SAndroid Build Coastguard Worker bs, intra_edge_flags, t->by, t->bx);
1667*c0909341SAndroid Build Coastguard Worker
1668*c0909341SAndroid Build Coastguard Worker // mode parsing and mv derivation from ref_mvs
1669*c0909341SAndroid Build Coastguard Worker if ((seg && (seg->skip || seg->globalmv)) ||
1670*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
1671*c0909341SAndroid Build Coastguard Worker ts->cdf.m.newmv_mode[ctx & 7]))
1672*c0909341SAndroid Build Coastguard Worker {
1673*c0909341SAndroid Build Coastguard Worker if ((seg && (seg->skip || seg->globalmv)) ||
1674*c0909341SAndroid Build Coastguard Worker !dav1d_msac_decode_bool_adapt(&ts->msac,
1675*c0909341SAndroid Build Coastguard Worker ts->cdf.m.globalmv_mode[(ctx >> 3) & 1]))
1676*c0909341SAndroid Build Coastguard Worker {
1677*c0909341SAndroid Build Coastguard Worker b->inter_mode = GLOBALMV;
1678*c0909341SAndroid Build Coastguard Worker b->mv[0] = get_gmv_2d(&f->frame_hdr->gmv[b->ref[0]],
1679*c0909341SAndroid Build Coastguard Worker t->bx, t->by, bw4, bh4, f->frame_hdr);
1680*c0909341SAndroid Build Coastguard Worker has_subpel_filter = imin(bw4, bh4) == 1 ||
1681*c0909341SAndroid Build Coastguard Worker f->frame_hdr->gmv[b->ref[0]].type == DAV1D_WM_TYPE_TRANSLATION;
1682*c0909341SAndroid Build Coastguard Worker } else {
1683*c0909341SAndroid Build Coastguard Worker has_subpel_filter = 1;
1684*c0909341SAndroid Build Coastguard Worker if (dav1d_msac_decode_bool_adapt(&ts->msac,
1685*c0909341SAndroid Build Coastguard Worker ts->cdf.m.refmv_mode[(ctx >> 4) & 15]))
1686*c0909341SAndroid Build Coastguard Worker { // NEAREST, NEARER, NEAR or NEARISH
1687*c0909341SAndroid Build Coastguard Worker b->inter_mode = NEARMV;
1688*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEARER_DRL;
1689*c0909341SAndroid Build Coastguard Worker if (n_mvs > 2) { // NEARER, NEAR or NEARISH
1690*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v2 = get_drl_context(mvstack, 1);
1691*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1692*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v2]);
1693*c0909341SAndroid Build Coastguard Worker if (b->drl_idx == NEAR_DRL && n_mvs > 3) { // NEAR or NEARISH
1694*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v3 =
1695*c0909341SAndroid Build Coastguard Worker get_drl_context(mvstack, 2);
1696*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1697*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v3]);
1698*c0909341SAndroid Build Coastguard Worker }
1699*c0909341SAndroid Build Coastguard Worker }
1700*c0909341SAndroid Build Coastguard Worker } else {
1701*c0909341SAndroid Build Coastguard Worker b->inter_mode = NEARESTMV;
1702*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEAREST_DRL;
1703*c0909341SAndroid Build Coastguard Worker }
1704*c0909341SAndroid Build Coastguard Worker assert(b->drl_idx >= NEAREST_DRL && b->drl_idx <= NEARISH_DRL);
1705*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[b->drl_idx].mv.mv[0];
1706*c0909341SAndroid Build Coastguard Worker if (b->drl_idx < NEAR_DRL)
1707*c0909341SAndroid Build Coastguard Worker fix_mv_precision(f->frame_hdr, &b->mv[0]);
1708*c0909341SAndroid Build Coastguard Worker }
1709*c0909341SAndroid Build Coastguard Worker
1710*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1711*c0909341SAndroid Build Coastguard Worker printf("Post-intermode[%d,drl=%d,mv=y:%d,x:%d,n_mvs=%d]: r=%d\n",
1712*c0909341SAndroid Build Coastguard Worker b->inter_mode, b->drl_idx, b->mv[0].y, b->mv[0].x, n_mvs,
1713*c0909341SAndroid Build Coastguard Worker ts->msac.rng);
1714*c0909341SAndroid Build Coastguard Worker } else {
1715*c0909341SAndroid Build Coastguard Worker has_subpel_filter = 1;
1716*c0909341SAndroid Build Coastguard Worker b->inter_mode = NEWMV;
1717*c0909341SAndroid Build Coastguard Worker b->drl_idx = NEAREST_DRL;
1718*c0909341SAndroid Build Coastguard Worker if (n_mvs > 1) { // NEARER, NEAR or NEARISH
1719*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v1 = get_drl_context(mvstack, 0);
1720*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1721*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v1]);
1722*c0909341SAndroid Build Coastguard Worker if (b->drl_idx == NEARER_DRL && n_mvs > 2) { // NEAR or NEARISH
1723*c0909341SAndroid Build Coastguard Worker const int drl_ctx_v2 = get_drl_context(mvstack, 1);
1724*c0909341SAndroid Build Coastguard Worker b->drl_idx += dav1d_msac_decode_bool_adapt(&ts->msac,
1725*c0909341SAndroid Build Coastguard Worker ts->cdf.m.drl_bit[drl_ctx_v2]);
1726*c0909341SAndroid Build Coastguard Worker }
1727*c0909341SAndroid Build Coastguard Worker }
1728*c0909341SAndroid Build Coastguard Worker assert(b->drl_idx >= NEAREST_DRL && b->drl_idx <= NEARISH_DRL);
1729*c0909341SAndroid Build Coastguard Worker if (n_mvs > 1) {
1730*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[b->drl_idx].mv.mv[0];
1731*c0909341SAndroid Build Coastguard Worker } else {
1732*c0909341SAndroid Build Coastguard Worker assert(!b->drl_idx);
1733*c0909341SAndroid Build Coastguard Worker b->mv[0] = mvstack[0].mv.mv[0];
1734*c0909341SAndroid Build Coastguard Worker fix_mv_precision(f->frame_hdr, &b->mv[0]);
1735*c0909341SAndroid Build Coastguard Worker }
1736*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1737*c0909341SAndroid Build Coastguard Worker printf("Post-intermode[%d,drl=%d]: r=%d\n",
1738*c0909341SAndroid Build Coastguard Worker b->inter_mode, b->drl_idx, ts->msac.rng);
1739*c0909341SAndroid Build Coastguard Worker const int mv_prec = f->frame_hdr->hp - f->frame_hdr->force_integer_mv;
1740*c0909341SAndroid Build Coastguard Worker read_mv_residual(ts, &b->mv[0], mv_prec);
1741*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1742*c0909341SAndroid Build Coastguard Worker printf("Post-residualmv[mv=y:%d,x:%d]: r=%d\n",
1743*c0909341SAndroid Build Coastguard Worker b->mv[0].y, b->mv[0].x, ts->msac.rng);
1744*c0909341SAndroid Build Coastguard Worker }
1745*c0909341SAndroid Build Coastguard Worker
1746*c0909341SAndroid Build Coastguard Worker // interintra flags
1747*c0909341SAndroid Build Coastguard Worker const int ii_sz_grp = dav1d_ymode_size_context[bs];
1748*c0909341SAndroid Build Coastguard Worker if (f->seq_hdr->inter_intra &&
1749*c0909341SAndroid Build Coastguard Worker interintra_allowed_mask & (1 << bs) &&
1750*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
1751*c0909341SAndroid Build Coastguard Worker ts->cdf.m.interintra[ii_sz_grp]))
1752*c0909341SAndroid Build Coastguard Worker {
1753*c0909341SAndroid Build Coastguard Worker b->interintra_mode = dav1d_msac_decode_symbol_adapt4(&ts->msac,
1754*c0909341SAndroid Build Coastguard Worker ts->cdf.m.interintra_mode[ii_sz_grp],
1755*c0909341SAndroid Build Coastguard Worker N_INTER_INTRA_PRED_MODES - 1);
1756*c0909341SAndroid Build Coastguard Worker const int wedge_ctx = dav1d_wedge_ctx_lut[bs];
1757*c0909341SAndroid Build Coastguard Worker b->interintra_type = INTER_INTRA_BLEND +
1758*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
1759*c0909341SAndroid Build Coastguard Worker ts->cdf.m.interintra_wedge[wedge_ctx]);
1760*c0909341SAndroid Build Coastguard Worker if (b->interintra_type == INTER_INTRA_WEDGE)
1761*c0909341SAndroid Build Coastguard Worker b->wedge_idx = dav1d_msac_decode_symbol_adapt16(&ts->msac,
1762*c0909341SAndroid Build Coastguard Worker ts->cdf.m.wedge_idx[wedge_ctx], 15);
1763*c0909341SAndroid Build Coastguard Worker } else {
1764*c0909341SAndroid Build Coastguard Worker b->interintra_type = INTER_INTRA_NONE;
1765*c0909341SAndroid Build Coastguard Worker }
1766*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO && f->seq_hdr->inter_intra &&
1767*c0909341SAndroid Build Coastguard Worker interintra_allowed_mask & (1 << bs))
1768*c0909341SAndroid Build Coastguard Worker {
1769*c0909341SAndroid Build Coastguard Worker printf("Post-interintra[t=%d,m=%d,w=%d]: r=%d\n",
1770*c0909341SAndroid Build Coastguard Worker b->interintra_type, b->interintra_mode,
1771*c0909341SAndroid Build Coastguard Worker b->wedge_idx, ts->msac.rng);
1772*c0909341SAndroid Build Coastguard Worker }
1773*c0909341SAndroid Build Coastguard Worker
1774*c0909341SAndroid Build Coastguard Worker // motion variation
1775*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->switchable_motion_mode &&
1776*c0909341SAndroid Build Coastguard Worker b->interintra_type == INTER_INTRA_NONE && imin(bw4, bh4) >= 2 &&
1777*c0909341SAndroid Build Coastguard Worker // is not warped global motion
1778*c0909341SAndroid Build Coastguard Worker !(!f->frame_hdr->force_integer_mv && b->inter_mode == GLOBALMV &&
1779*c0909341SAndroid Build Coastguard Worker f->frame_hdr->gmv[b->ref[0]].type > DAV1D_WM_TYPE_TRANSLATION) &&
1780*c0909341SAndroid Build Coastguard Worker // has overlappable neighbours
1781*c0909341SAndroid Build Coastguard Worker ((have_left && findoddzero(&t->l.intra[by4 + 1], h4 >> 1)) ||
1782*c0909341SAndroid Build Coastguard Worker (have_top && findoddzero(&t->a->intra[bx4 + 1], w4 >> 1))))
1783*c0909341SAndroid Build Coastguard Worker {
1784*c0909341SAndroid Build Coastguard Worker // reaching here means the block allows obmc - check warp by
1785*c0909341SAndroid Build Coastguard Worker // finding matching-ref blocks in top/left edges
1786*c0909341SAndroid Build Coastguard Worker uint64_t mask[2] = { 0, 0 };
1787*c0909341SAndroid Build Coastguard Worker find_matching_ref(t, intra_edge_flags, bw4, bh4, w4, h4,
1788*c0909341SAndroid Build Coastguard Worker have_left, have_top, b->ref[0], mask);
1789*c0909341SAndroid Build Coastguard Worker const int allow_warp = !f->svc[b->ref[0]][0].scale &&
1790*c0909341SAndroid Build Coastguard Worker !f->frame_hdr->force_integer_mv &&
1791*c0909341SAndroid Build Coastguard Worker f->frame_hdr->warp_motion && (mask[0] | mask[1]);
1792*c0909341SAndroid Build Coastguard Worker
1793*c0909341SAndroid Build Coastguard Worker b->motion_mode = allow_warp ?
1794*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_symbol_adapt4(&ts->msac,
1795*c0909341SAndroid Build Coastguard Worker ts->cdf.m.motion_mode[bs], 2) :
1796*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac, ts->cdf.m.obmc[bs]);
1797*c0909341SAndroid Build Coastguard Worker if (b->motion_mode == MM_WARP) {
1798*c0909341SAndroid Build Coastguard Worker has_subpel_filter = 0;
1799*c0909341SAndroid Build Coastguard Worker derive_warpmv(t, bw4, bh4, mask, b->mv[0], &t->warpmv);
1800*c0909341SAndroid Build Coastguard Worker #define signabs(v) v < 0 ? '-' : ' ', abs(v)
1801*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1802*c0909341SAndroid Build Coastguard Worker printf("[ %c%x %c%x %c%x\n %c%x %c%x %c%x ]\n"
1803*c0909341SAndroid Build Coastguard Worker "alpha=%c%x, beta=%c%x, gamma=%c%x, delta=%c%x, "
1804*c0909341SAndroid Build Coastguard Worker "mv=y:%d,x:%d\n",
1805*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[0]),
1806*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[1]),
1807*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[2]),
1808*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[3]),
1809*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[4]),
1810*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.matrix[5]),
1811*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.alpha),
1812*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.beta),
1813*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.gamma),
1814*c0909341SAndroid Build Coastguard Worker signabs(t->warpmv.u.p.delta),
1815*c0909341SAndroid Build Coastguard Worker b->mv[0].y, b->mv[0].x);
1816*c0909341SAndroid Build Coastguard Worker #undef signabs
1817*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass) {
1818*c0909341SAndroid Build Coastguard Worker if (t->warpmv.type == DAV1D_WM_TYPE_AFFINE) {
1819*c0909341SAndroid Build Coastguard Worker b->matrix[0] = t->warpmv.matrix[2] - 0x10000;
1820*c0909341SAndroid Build Coastguard Worker b->matrix[1] = t->warpmv.matrix[3];
1821*c0909341SAndroid Build Coastguard Worker b->matrix[2] = t->warpmv.matrix[4];
1822*c0909341SAndroid Build Coastguard Worker b->matrix[3] = t->warpmv.matrix[5] - 0x10000;
1823*c0909341SAndroid Build Coastguard Worker } else {
1824*c0909341SAndroid Build Coastguard Worker b->matrix[0] = SHRT_MIN;
1825*c0909341SAndroid Build Coastguard Worker }
1826*c0909341SAndroid Build Coastguard Worker }
1827*c0909341SAndroid Build Coastguard Worker }
1828*c0909341SAndroid Build Coastguard Worker
1829*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1830*c0909341SAndroid Build Coastguard Worker printf("Post-motionmode[%d]: r=%d [mask: 0x%" PRIx64 "/0x%"
1831*c0909341SAndroid Build Coastguard Worker PRIx64 "]\n", b->motion_mode, ts->msac.rng, mask[0],
1832*c0909341SAndroid Build Coastguard Worker mask[1]);
1833*c0909341SAndroid Build Coastguard Worker } else {
1834*c0909341SAndroid Build Coastguard Worker b->motion_mode = MM_TRANSLATION;
1835*c0909341SAndroid Build Coastguard Worker }
1836*c0909341SAndroid Build Coastguard Worker }
1837*c0909341SAndroid Build Coastguard Worker
1838*c0909341SAndroid Build Coastguard Worker // subpel filter
1839*c0909341SAndroid Build Coastguard Worker enum Dav1dFilterMode filter[2];
1840*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->subpel_filter_mode == DAV1D_FILTER_SWITCHABLE) {
1841*c0909341SAndroid Build Coastguard Worker if (has_subpel_filter) {
1842*c0909341SAndroid Build Coastguard Worker const int comp = b->comp_type != COMP_INTER_NONE;
1843*c0909341SAndroid Build Coastguard Worker const int ctx1 = get_filter_ctx(t->a, &t->l, comp, 0, b->ref[0],
1844*c0909341SAndroid Build Coastguard Worker by4, bx4);
1845*c0909341SAndroid Build Coastguard Worker filter[0] = dav1d_msac_decode_symbol_adapt4(&ts->msac,
1846*c0909341SAndroid Build Coastguard Worker ts->cdf.m.filter[0][ctx1],
1847*c0909341SAndroid Build Coastguard Worker DAV1D_N_SWITCHABLE_FILTERS - 1);
1848*c0909341SAndroid Build Coastguard Worker if (f->seq_hdr->dual_filter) {
1849*c0909341SAndroid Build Coastguard Worker const int ctx2 = get_filter_ctx(t->a, &t->l, comp, 1,
1850*c0909341SAndroid Build Coastguard Worker b->ref[0], by4, bx4);
1851*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1852*c0909341SAndroid Build Coastguard Worker printf("Post-subpel_filter1[%d,ctx=%d]: r=%d\n",
1853*c0909341SAndroid Build Coastguard Worker filter[0], ctx1, ts->msac.rng);
1854*c0909341SAndroid Build Coastguard Worker filter[1] = dav1d_msac_decode_symbol_adapt4(&ts->msac,
1855*c0909341SAndroid Build Coastguard Worker ts->cdf.m.filter[1][ctx2],
1856*c0909341SAndroid Build Coastguard Worker DAV1D_N_SWITCHABLE_FILTERS - 1);
1857*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1858*c0909341SAndroid Build Coastguard Worker printf("Post-subpel_filter2[%d,ctx=%d]: r=%d\n",
1859*c0909341SAndroid Build Coastguard Worker filter[1], ctx2, ts->msac.rng);
1860*c0909341SAndroid Build Coastguard Worker } else {
1861*c0909341SAndroid Build Coastguard Worker filter[1] = filter[0];
1862*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
1863*c0909341SAndroid Build Coastguard Worker printf("Post-subpel_filter[%d,ctx=%d]: r=%d\n",
1864*c0909341SAndroid Build Coastguard Worker filter[0], ctx1, ts->msac.rng);
1865*c0909341SAndroid Build Coastguard Worker }
1866*c0909341SAndroid Build Coastguard Worker } else {
1867*c0909341SAndroid Build Coastguard Worker filter[0] = filter[1] = DAV1D_FILTER_8TAP_REGULAR;
1868*c0909341SAndroid Build Coastguard Worker }
1869*c0909341SAndroid Build Coastguard Worker } else {
1870*c0909341SAndroid Build Coastguard Worker filter[0] = filter[1] = f->frame_hdr->subpel_filter_mode;
1871*c0909341SAndroid Build Coastguard Worker }
1872*c0909341SAndroid Build Coastguard Worker b->filter2d = dav1d_filter_2d[filter[1]][filter[0]];
1873*c0909341SAndroid Build Coastguard Worker
1874*c0909341SAndroid Build Coastguard Worker read_vartx_tree(t, b, bs, bx4, by4);
1875*c0909341SAndroid Build Coastguard Worker
1876*c0909341SAndroid Build Coastguard Worker // reconstruction
1877*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 1) {
1878*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_coef_blocks(t, bs, b);
1879*c0909341SAndroid Build Coastguard Worker } else {
1880*c0909341SAndroid Build Coastguard Worker if (f->bd_fn.recon_b_inter(t, bs, b)) return -1;
1881*c0909341SAndroid Build Coastguard Worker }
1882*c0909341SAndroid Build Coastguard Worker
1883*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->loopfilter.level_y[0] ||
1884*c0909341SAndroid Build Coastguard Worker f->frame_hdr->loopfilter.level_y[1])
1885*c0909341SAndroid Build Coastguard Worker {
1886*c0909341SAndroid Build Coastguard Worker const int is_globalmv =
1887*c0909341SAndroid Build Coastguard Worker b->inter_mode == (is_comp ? GLOBALMV_GLOBALMV : GLOBALMV);
1888*c0909341SAndroid Build Coastguard Worker const uint8_t (*const lf_lvls)[8][2] = (const uint8_t (*)[8][2])
1889*c0909341SAndroid Build Coastguard Worker &ts->lflvl[b->seg_id][0][b->ref[0] + 1][!is_globalmv];
1890*c0909341SAndroid Build Coastguard Worker const uint16_t tx_split[2] = { b->tx_split0, b->tx_split1 };
1891*c0909341SAndroid Build Coastguard Worker enum RectTxfmSize ytx = b->max_ytx, uvtx = b->uvtx;
1892*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.lossless[b->seg_id]) {
1893*c0909341SAndroid Build Coastguard Worker ytx = (enum RectTxfmSize) TX_4X4;
1894*c0909341SAndroid Build Coastguard Worker uvtx = (enum RectTxfmSize) TX_4X4;
1895*c0909341SAndroid Build Coastguard Worker }
1896*c0909341SAndroid Build Coastguard Worker dav1d_create_lf_mask_inter(t->lf_mask, f->lf.level, f->b4_stride, lf_lvls,
1897*c0909341SAndroid Build Coastguard Worker t->bx, t->by, f->w4, f->h4, b->skip, bs,
1898*c0909341SAndroid Build Coastguard Worker ytx, tx_split, uvtx, f->cur.p.layout,
1899*c0909341SAndroid Build Coastguard Worker &t->a->tx_lpf_y[bx4], &t->l.tx_lpf_y[by4],
1900*c0909341SAndroid Build Coastguard Worker has_chroma ? &t->a->tx_lpf_uv[cbx4] : NULL,
1901*c0909341SAndroid Build Coastguard Worker has_chroma ? &t->l.tx_lpf_uv[cby4] : NULL);
1902*c0909341SAndroid Build Coastguard Worker }
1903*c0909341SAndroid Build Coastguard Worker
1904*c0909341SAndroid Build Coastguard Worker // context updates
1905*c0909341SAndroid Build Coastguard Worker if (is_comp)
1906*c0909341SAndroid Build Coastguard Worker splat_tworef_mv(f->c, t, bs, b, bw4, bh4);
1907*c0909341SAndroid Build Coastguard Worker else
1908*c0909341SAndroid Build Coastguard Worker splat_oneref_mv(f->c, t, bs, b, bw4, bh4);
1909*c0909341SAndroid Build Coastguard Worker BlockContext *edge = t->a;
1910*c0909341SAndroid Build Coastguard Worker for (int i = 0, off = bx4; i < 2; i++, off = by4, edge = &t->l) {
1911*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
1912*c0909341SAndroid Build Coastguard Worker rep_macro(edge->seg_pred, off, seg_pred); \
1913*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip_mode, off, b->skip_mode); \
1914*c0909341SAndroid Build Coastguard Worker rep_macro(edge->intra, off, 0); \
1915*c0909341SAndroid Build Coastguard Worker rep_macro(edge->skip, off, b->skip); \
1916*c0909341SAndroid Build Coastguard Worker rep_macro(edge->pal_sz, off, 0); \
1917*c0909341SAndroid Build Coastguard Worker /* see aomedia bug 2183 for why this is outside if (has_chroma) */ \
1918*c0909341SAndroid Build Coastguard Worker rep_macro(t->pal_sz_uv[i], off, 0); \
1919*c0909341SAndroid Build Coastguard Worker rep_macro(edge->tx_intra, off, b_dim[2 + i]); \
1920*c0909341SAndroid Build Coastguard Worker rep_macro(edge->comp_type, off, b->comp_type); \
1921*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[0], off, filter[0]); \
1922*c0909341SAndroid Build Coastguard Worker rep_macro(edge->filter[1], off, filter[1]); \
1923*c0909341SAndroid Build Coastguard Worker rep_macro(edge->mode, off, b->inter_mode); \
1924*c0909341SAndroid Build Coastguard Worker rep_macro(edge->ref[0], off, b->ref[0]); \
1925*c0909341SAndroid Build Coastguard Worker rep_macro(edge->ref[1], off, ((uint8_t) b->ref[1]))
1926*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2 + i]);
1927*c0909341SAndroid Build Coastguard Worker #undef set_ctx
1928*c0909341SAndroid Build Coastguard Worker }
1929*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1930*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbw4)](&t->a->uvmode[cbx4], DC_PRED);
1931*c0909341SAndroid Build Coastguard Worker dav1d_memset_pow2[ulog2(cbh4)](&t->l.uvmode[cby4], DC_PRED);
1932*c0909341SAndroid Build Coastguard Worker }
1933*c0909341SAndroid Build Coastguard Worker }
1934*c0909341SAndroid Build Coastguard Worker
1935*c0909341SAndroid Build Coastguard Worker // update contexts
1936*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.enabled &&
1937*c0909341SAndroid Build Coastguard Worker f->frame_hdr->segmentation.update_map)
1938*c0909341SAndroid Build Coastguard Worker {
1939*c0909341SAndroid Build Coastguard Worker uint8_t *seg_ptr = &f->cur_segmap[t->by * f->b4_stride + t->bx];
1940*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
1941*c0909341SAndroid Build Coastguard Worker for (int y = 0; y < bh4; y++) { \
1942*c0909341SAndroid Build Coastguard Worker rep_macro(seg_ptr, 0, b->seg_id); \
1943*c0909341SAndroid Build Coastguard Worker seg_ptr += f->b4_stride; \
1944*c0909341SAndroid Build Coastguard Worker }
1945*c0909341SAndroid Build Coastguard Worker case_set(b_dim[2]);
1946*c0909341SAndroid Build Coastguard Worker #undef set_ctx
1947*c0909341SAndroid Build Coastguard Worker }
1948*c0909341SAndroid Build Coastguard Worker if (!b->skip) {
1949*c0909341SAndroid Build Coastguard Worker uint16_t (*noskip_mask)[2] = &t->lf_mask->noskip_mask[by4 >> 1];
1950*c0909341SAndroid Build Coastguard Worker const unsigned mask = (~0U >> (32 - bw4)) << (bx4 & 15);
1951*c0909341SAndroid Build Coastguard Worker const int bx_idx = (bx4 & 16) >> 4;
1952*c0909341SAndroid Build Coastguard Worker for (int y = 0; y < bh4; y += 2, noskip_mask++) {
1953*c0909341SAndroid Build Coastguard Worker (*noskip_mask)[bx_idx] |= mask;
1954*c0909341SAndroid Build Coastguard Worker if (bw4 == 32) // this should be mask >> 16, but it's 0xffffffff anyway
1955*c0909341SAndroid Build Coastguard Worker (*noskip_mask)[1] |= mask;
1956*c0909341SAndroid Build Coastguard Worker }
1957*c0909341SAndroid Build Coastguard Worker }
1958*c0909341SAndroid Build Coastguard Worker
1959*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 1 && !b->intra && IS_INTER_OR_SWITCH(f->frame_hdr)) {
1960*c0909341SAndroid Build Coastguard Worker const int sby = (t->by - ts->tiling.row_start) >> f->sb_shift;
1961*c0909341SAndroid Build Coastguard Worker int (*const lowest_px)[2] = ts->lowest_pixel[sby];
1962*c0909341SAndroid Build Coastguard Worker
1963*c0909341SAndroid Build Coastguard Worker // keep track of motion vectors for each reference
1964*c0909341SAndroid Build Coastguard Worker if (b->comp_type == COMP_INTER_NONE) {
1965*c0909341SAndroid Build Coastguard Worker // y
1966*c0909341SAndroid Build Coastguard Worker if (imin(bw4, bh4) > 1 &&
1967*c0909341SAndroid Build Coastguard Worker ((b->inter_mode == GLOBALMV && f->gmv_warp_allowed[b->ref[0]]) ||
1968*c0909341SAndroid Build Coastguard Worker (b->motion_mode == MM_WARP && t->warpmv.type > DAV1D_WM_TYPE_TRANSLATION)))
1969*c0909341SAndroid Build Coastguard Worker {
1970*c0909341SAndroid Build Coastguard Worker affine_lowest_px_luma(t, &lowest_px[b->ref[0]][0], b_dim,
1971*c0909341SAndroid Build Coastguard Worker b->motion_mode == MM_WARP ? &t->warpmv :
1972*c0909341SAndroid Build Coastguard Worker &f->frame_hdr->gmv[b->ref[0]]);
1973*c0909341SAndroid Build Coastguard Worker } else {
1974*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[b->ref[0]][0], t->by, bh4, b->mv[0].y,
1975*c0909341SAndroid Build Coastguard Worker 0, &f->svc[b->ref[0]][1]);
1976*c0909341SAndroid Build Coastguard Worker if (b->motion_mode == MM_OBMC) {
1977*c0909341SAndroid Build Coastguard Worker obmc_lowest_px(t, lowest_px, 0, b_dim, bx4, by4, w4, h4);
1978*c0909341SAndroid Build Coastguard Worker }
1979*c0909341SAndroid Build Coastguard Worker }
1980*c0909341SAndroid Build Coastguard Worker
1981*c0909341SAndroid Build Coastguard Worker // uv
1982*c0909341SAndroid Build Coastguard Worker if (has_chroma) {
1983*c0909341SAndroid Build Coastguard Worker // sub8x8 derivation
1984*c0909341SAndroid Build Coastguard Worker int is_sub8x8 = bw4 == ss_hor || bh4 == ss_ver;
1985*c0909341SAndroid Build Coastguard Worker refmvs_block *const *r;
1986*c0909341SAndroid Build Coastguard Worker if (is_sub8x8) {
1987*c0909341SAndroid Build Coastguard Worker assert(ss_hor == 1);
1988*c0909341SAndroid Build Coastguard Worker r = &t->rt.r[(t->by & 31) + 5];
1989*c0909341SAndroid Build Coastguard Worker if (bw4 == 1) is_sub8x8 &= r[0][t->bx - 1].ref.ref[0] > 0;
1990*c0909341SAndroid Build Coastguard Worker if (bh4 == ss_ver) is_sub8x8 &= r[-1][t->bx].ref.ref[0] > 0;
1991*c0909341SAndroid Build Coastguard Worker if (bw4 == 1 && bh4 == ss_ver)
1992*c0909341SAndroid Build Coastguard Worker is_sub8x8 &= r[-1][t->bx - 1].ref.ref[0] > 0;
1993*c0909341SAndroid Build Coastguard Worker }
1994*c0909341SAndroid Build Coastguard Worker
1995*c0909341SAndroid Build Coastguard Worker // chroma prediction
1996*c0909341SAndroid Build Coastguard Worker if (is_sub8x8) {
1997*c0909341SAndroid Build Coastguard Worker assert(ss_hor == 1);
1998*c0909341SAndroid Build Coastguard Worker if (bw4 == 1 && bh4 == ss_ver) {
1999*c0909341SAndroid Build Coastguard Worker const refmvs_block *const rr = &r[-1][t->bx - 1];
2000*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[rr->ref.ref[0] - 1][1],
2001*c0909341SAndroid Build Coastguard Worker t->by - 1, bh4, rr->mv.mv[0].y, ss_ver,
2002*c0909341SAndroid Build Coastguard Worker &f->svc[rr->ref.ref[0] - 1][1]);
2003*c0909341SAndroid Build Coastguard Worker }
2004*c0909341SAndroid Build Coastguard Worker if (bw4 == 1) {
2005*c0909341SAndroid Build Coastguard Worker const refmvs_block *const rr = &r[0][t->bx - 1];
2006*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[rr->ref.ref[0] - 1][1],
2007*c0909341SAndroid Build Coastguard Worker t->by, bh4, rr->mv.mv[0].y, ss_ver,
2008*c0909341SAndroid Build Coastguard Worker &f->svc[rr->ref.ref[0] - 1][1]);
2009*c0909341SAndroid Build Coastguard Worker }
2010*c0909341SAndroid Build Coastguard Worker if (bh4 == ss_ver) {
2011*c0909341SAndroid Build Coastguard Worker const refmvs_block *const rr = &r[-1][t->bx];
2012*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[rr->ref.ref[0] - 1][1],
2013*c0909341SAndroid Build Coastguard Worker t->by - 1, bh4, rr->mv.mv[0].y, ss_ver,
2014*c0909341SAndroid Build Coastguard Worker &f->svc[rr->ref.ref[0] - 1][1]);
2015*c0909341SAndroid Build Coastguard Worker }
2016*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[b->ref[0]][1], t->by, bh4,
2017*c0909341SAndroid Build Coastguard Worker b->mv[0].y, ss_ver, &f->svc[b->ref[0]][1]);
2018*c0909341SAndroid Build Coastguard Worker } else {
2019*c0909341SAndroid Build Coastguard Worker if (imin(cbw4, cbh4) > 1 &&
2020*c0909341SAndroid Build Coastguard Worker ((b->inter_mode == GLOBALMV && f->gmv_warp_allowed[b->ref[0]]) ||
2021*c0909341SAndroid Build Coastguard Worker (b->motion_mode == MM_WARP && t->warpmv.type > DAV1D_WM_TYPE_TRANSLATION)))
2022*c0909341SAndroid Build Coastguard Worker {
2023*c0909341SAndroid Build Coastguard Worker affine_lowest_px_chroma(t, &lowest_px[b->ref[0]][1], b_dim,
2024*c0909341SAndroid Build Coastguard Worker b->motion_mode == MM_WARP ? &t->warpmv :
2025*c0909341SAndroid Build Coastguard Worker &f->frame_hdr->gmv[b->ref[0]]);
2026*c0909341SAndroid Build Coastguard Worker } else {
2027*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[b->ref[0]][1],
2028*c0909341SAndroid Build Coastguard Worker t->by & ~ss_ver, bh4 << (bh4 == ss_ver),
2029*c0909341SAndroid Build Coastguard Worker b->mv[0].y, ss_ver, &f->svc[b->ref[0]][1]);
2030*c0909341SAndroid Build Coastguard Worker if (b->motion_mode == MM_OBMC) {
2031*c0909341SAndroid Build Coastguard Worker obmc_lowest_px(t, lowest_px, 1, b_dim, bx4, by4, w4, h4);
2032*c0909341SAndroid Build Coastguard Worker }
2033*c0909341SAndroid Build Coastguard Worker }
2034*c0909341SAndroid Build Coastguard Worker }
2035*c0909341SAndroid Build Coastguard Worker }
2036*c0909341SAndroid Build Coastguard Worker } else {
2037*c0909341SAndroid Build Coastguard Worker // y
2038*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 2; i++) {
2039*c0909341SAndroid Build Coastguard Worker if (b->inter_mode == GLOBALMV_GLOBALMV && f->gmv_warp_allowed[b->ref[i]]) {
2040*c0909341SAndroid Build Coastguard Worker affine_lowest_px_luma(t, &lowest_px[b->ref[i]][0], b_dim,
2041*c0909341SAndroid Build Coastguard Worker &f->frame_hdr->gmv[b->ref[i]]);
2042*c0909341SAndroid Build Coastguard Worker } else {
2043*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[b->ref[i]][0], t->by, bh4,
2044*c0909341SAndroid Build Coastguard Worker b->mv[i].y, 0, &f->svc[b->ref[i]][1]);
2045*c0909341SAndroid Build Coastguard Worker }
2046*c0909341SAndroid Build Coastguard Worker }
2047*c0909341SAndroid Build Coastguard Worker
2048*c0909341SAndroid Build Coastguard Worker // uv
2049*c0909341SAndroid Build Coastguard Worker if (has_chroma) for (int i = 0; i < 2; i++) {
2050*c0909341SAndroid Build Coastguard Worker if (b->inter_mode == GLOBALMV_GLOBALMV &&
2051*c0909341SAndroid Build Coastguard Worker imin(cbw4, cbh4) > 1 && f->gmv_warp_allowed[b->ref[i]])
2052*c0909341SAndroid Build Coastguard Worker {
2053*c0909341SAndroid Build Coastguard Worker affine_lowest_px_chroma(t, &lowest_px[b->ref[i]][1], b_dim,
2054*c0909341SAndroid Build Coastguard Worker &f->frame_hdr->gmv[b->ref[i]]);
2055*c0909341SAndroid Build Coastguard Worker } else {
2056*c0909341SAndroid Build Coastguard Worker mc_lowest_px(&lowest_px[b->ref[i]][1], t->by, bh4,
2057*c0909341SAndroid Build Coastguard Worker b->mv[i].y, ss_ver, &f->svc[b->ref[i]][1]);
2058*c0909341SAndroid Build Coastguard Worker }
2059*c0909341SAndroid Build Coastguard Worker }
2060*c0909341SAndroid Build Coastguard Worker }
2061*c0909341SAndroid Build Coastguard Worker }
2062*c0909341SAndroid Build Coastguard Worker
2063*c0909341SAndroid Build Coastguard Worker return 0;
2064*c0909341SAndroid Build Coastguard Worker }
2065*c0909341SAndroid Build Coastguard Worker
2066*c0909341SAndroid Build Coastguard Worker #if __has_feature(memory_sanitizer)
2067*c0909341SAndroid Build Coastguard Worker
2068*c0909341SAndroid Build Coastguard Worker #include <sanitizer/msan_interface.h>
2069*c0909341SAndroid Build Coastguard Worker
checked_decode_b(Dav1dTaskContext * const t,const enum BlockLevel bl,const enum BlockSize bs,const enum BlockPartition bp,const enum EdgeFlags intra_edge_flags)2070*c0909341SAndroid Build Coastguard Worker static int checked_decode_b(Dav1dTaskContext *const t,
2071*c0909341SAndroid Build Coastguard Worker const enum BlockLevel bl,
2072*c0909341SAndroid Build Coastguard Worker const enum BlockSize bs,
2073*c0909341SAndroid Build Coastguard Worker const enum BlockPartition bp,
2074*c0909341SAndroid Build Coastguard Worker const enum EdgeFlags intra_edge_flags)
2075*c0909341SAndroid Build Coastguard Worker {
2076*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
2077*c0909341SAndroid Build Coastguard Worker const int err = decode_b(t, bl, bs, bp, intra_edge_flags);
2078*c0909341SAndroid Build Coastguard Worker
2079*c0909341SAndroid Build Coastguard Worker if (err == 0 && !(t->frame_thread.pass & 1)) {
2080*c0909341SAndroid Build Coastguard Worker const int ss_ver = f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
2081*c0909341SAndroid Build Coastguard Worker const int ss_hor = f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
2082*c0909341SAndroid Build Coastguard Worker const uint8_t *const b_dim = dav1d_block_dimensions[bs];
2083*c0909341SAndroid Build Coastguard Worker const int bw4 = b_dim[0], bh4 = b_dim[1];
2084*c0909341SAndroid Build Coastguard Worker const int w4 = imin(bw4, f->bw - t->bx), h4 = imin(bh4, f->bh - t->by);
2085*c0909341SAndroid Build Coastguard Worker const int has_chroma = f->seq_hdr->layout != DAV1D_PIXEL_LAYOUT_I400 &&
2086*c0909341SAndroid Build Coastguard Worker (bw4 > ss_hor || t->bx & 1) &&
2087*c0909341SAndroid Build Coastguard Worker (bh4 > ss_ver || t->by & 1);
2088*c0909341SAndroid Build Coastguard Worker
2089*c0909341SAndroid Build Coastguard Worker for (int p = 0; p < 1 + 2 * has_chroma; p++) {
2090*c0909341SAndroid Build Coastguard Worker const int ss_ver = p && f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
2091*c0909341SAndroid Build Coastguard Worker const int ss_hor = p && f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
2092*c0909341SAndroid Build Coastguard Worker const ptrdiff_t stride = f->cur.stride[!!p];
2093*c0909341SAndroid Build Coastguard Worker const int bx = t->bx & ~ss_hor;
2094*c0909341SAndroid Build Coastguard Worker const int by = t->by & ~ss_ver;
2095*c0909341SAndroid Build Coastguard Worker const int width = w4 << (2 - ss_hor + (bw4 == ss_hor));
2096*c0909341SAndroid Build Coastguard Worker const int height = h4 << (2 - ss_ver + (bh4 == ss_ver));
2097*c0909341SAndroid Build Coastguard Worker
2098*c0909341SAndroid Build Coastguard Worker const uint8_t *data = f->cur.data[p] + (by << (2 - ss_ver)) * stride +
2099*c0909341SAndroid Build Coastguard Worker (bx << (2 - ss_hor + !!f->seq_hdr->hbd));
2100*c0909341SAndroid Build Coastguard Worker
2101*c0909341SAndroid Build Coastguard Worker for (int y = 0; y < height; data += stride, y++) {
2102*c0909341SAndroid Build Coastguard Worker const size_t line_sz = width << !!f->seq_hdr->hbd;
2103*c0909341SAndroid Build Coastguard Worker if (__msan_test_shadow(data, line_sz) != -1) {
2104*c0909341SAndroid Build Coastguard Worker fprintf(stderr, "B[%d](%d, %d) w4:%d, h4:%d, row:%d\n",
2105*c0909341SAndroid Build Coastguard Worker p, bx, by, w4, h4, y);
2106*c0909341SAndroid Build Coastguard Worker __msan_check_mem_is_initialized(data, line_sz);
2107*c0909341SAndroid Build Coastguard Worker }
2108*c0909341SAndroid Build Coastguard Worker }
2109*c0909341SAndroid Build Coastguard Worker }
2110*c0909341SAndroid Build Coastguard Worker }
2111*c0909341SAndroid Build Coastguard Worker
2112*c0909341SAndroid Build Coastguard Worker return err;
2113*c0909341SAndroid Build Coastguard Worker }
2114*c0909341SAndroid Build Coastguard Worker
2115*c0909341SAndroid Build Coastguard Worker #define decode_b checked_decode_b
2116*c0909341SAndroid Build Coastguard Worker
2117*c0909341SAndroid Build Coastguard Worker #endif /* defined(__has_feature) */
2118*c0909341SAndroid Build Coastguard Worker
decode_sb(Dav1dTaskContext * const t,const enum BlockLevel bl,const EdgeNode * const node)2119*c0909341SAndroid Build Coastguard Worker static int decode_sb(Dav1dTaskContext *const t, const enum BlockLevel bl,
2120*c0909341SAndroid Build Coastguard Worker const EdgeNode *const node)
2121*c0909341SAndroid Build Coastguard Worker {
2122*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
2123*c0909341SAndroid Build Coastguard Worker Dav1dTileState *const ts = t->ts;
2124*c0909341SAndroid Build Coastguard Worker const int hsz = 16 >> bl;
2125*c0909341SAndroid Build Coastguard Worker const int have_h_split = f->bw > t->bx + hsz;
2126*c0909341SAndroid Build Coastguard Worker const int have_v_split = f->bh > t->by + hsz;
2127*c0909341SAndroid Build Coastguard Worker
2128*c0909341SAndroid Build Coastguard Worker if (!have_h_split && !have_v_split) {
2129*c0909341SAndroid Build Coastguard Worker assert(bl < BL_8X8);
2130*c0909341SAndroid Build Coastguard Worker return decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 0));
2131*c0909341SAndroid Build Coastguard Worker }
2132*c0909341SAndroid Build Coastguard Worker
2133*c0909341SAndroid Build Coastguard Worker uint16_t *pc;
2134*c0909341SAndroid Build Coastguard Worker enum BlockPartition bp;
2135*c0909341SAndroid Build Coastguard Worker int ctx, bx8, by8;
2136*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass != 2) {
2137*c0909341SAndroid Build Coastguard Worker if (0 && bl == BL_64X64)
2138*c0909341SAndroid Build Coastguard Worker printf("poc=%d,y=%d,x=%d,bl=%d,r=%d\n",
2139*c0909341SAndroid Build Coastguard Worker f->frame_hdr->frame_offset, t->by, t->bx, bl, ts->msac.rng);
2140*c0909341SAndroid Build Coastguard Worker bx8 = (t->bx & 31) >> 1;
2141*c0909341SAndroid Build Coastguard Worker by8 = (t->by & 31) >> 1;
2142*c0909341SAndroid Build Coastguard Worker ctx = get_partition_ctx(t->a, &t->l, bl, by8, bx8);
2143*c0909341SAndroid Build Coastguard Worker pc = ts->cdf.m.partition[bl][ctx];
2144*c0909341SAndroid Build Coastguard Worker }
2145*c0909341SAndroid Build Coastguard Worker
2146*c0909341SAndroid Build Coastguard Worker if (have_h_split && have_v_split) {
2147*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 2) {
2148*c0909341SAndroid Build Coastguard Worker const Av1Block *const b = &f->frame_thread.b[t->by * f->b4_stride + t->bx];
2149*c0909341SAndroid Build Coastguard Worker bp = b->bl == bl ? b->bp : PARTITION_SPLIT;
2150*c0909341SAndroid Build Coastguard Worker } else {
2151*c0909341SAndroid Build Coastguard Worker bp = dav1d_msac_decode_symbol_adapt16(&ts->msac, pc,
2152*c0909341SAndroid Build Coastguard Worker dav1d_partition_type_count[bl]);
2153*c0909341SAndroid Build Coastguard Worker if (f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I422 &&
2154*c0909341SAndroid Build Coastguard Worker (bp == PARTITION_V || bp == PARTITION_V4 ||
2155*c0909341SAndroid Build Coastguard Worker bp == PARTITION_T_LEFT_SPLIT || bp == PARTITION_T_RIGHT_SPLIT))
2156*c0909341SAndroid Build Coastguard Worker {
2157*c0909341SAndroid Build Coastguard Worker return 1;
2158*c0909341SAndroid Build Coastguard Worker }
2159*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
2160*c0909341SAndroid Build Coastguard Worker printf("poc=%d,y=%d,x=%d,bl=%d,ctx=%d,bp=%d: r=%d\n",
2161*c0909341SAndroid Build Coastguard Worker f->frame_hdr->frame_offset, t->by, t->bx, bl, ctx, bp,
2162*c0909341SAndroid Build Coastguard Worker ts->msac.rng);
2163*c0909341SAndroid Build Coastguard Worker }
2164*c0909341SAndroid Build Coastguard Worker const uint8_t *const b = dav1d_block_sizes[bl][bp];
2165*c0909341SAndroid Build Coastguard Worker
2166*c0909341SAndroid Build Coastguard Worker switch (bp) {
2167*c0909341SAndroid Build Coastguard Worker case PARTITION_NONE:
2168*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_NONE, node->o))
2169*c0909341SAndroid Build Coastguard Worker return -1;
2170*c0909341SAndroid Build Coastguard Worker break;
2171*c0909341SAndroid Build Coastguard Worker case PARTITION_H:
2172*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H, node->h[0]))
2173*c0909341SAndroid Build Coastguard Worker return -1;
2174*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2175*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H, node->h[1]))
2176*c0909341SAndroid Build Coastguard Worker return -1;
2177*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2178*c0909341SAndroid Build Coastguard Worker break;
2179*c0909341SAndroid Build Coastguard Worker case PARTITION_V:
2180*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V, node->v[0]))
2181*c0909341SAndroid Build Coastguard Worker return -1;
2182*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2183*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V, node->v[1]))
2184*c0909341SAndroid Build Coastguard Worker return -1;
2185*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2186*c0909341SAndroid Build Coastguard Worker break;
2187*c0909341SAndroid Build Coastguard Worker case PARTITION_SPLIT:
2188*c0909341SAndroid Build Coastguard Worker if (bl == BL_8X8) {
2189*c0909341SAndroid Build Coastguard Worker const EdgeTip *const tip = (const EdgeTip *) node;
2190*c0909341SAndroid Build Coastguard Worker assert(hsz == 1);
2191*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, BS_4x4, PARTITION_SPLIT, EDGE_ALL_TR_AND_BL))
2192*c0909341SAndroid Build Coastguard Worker return -1;
2193*c0909341SAndroid Build Coastguard Worker const enum Filter2d tl_filter = t->tl_4x4_filter;
2194*c0909341SAndroid Build Coastguard Worker t->bx++;
2195*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, BS_4x4, PARTITION_SPLIT, tip->split[0]))
2196*c0909341SAndroid Build Coastguard Worker return -1;
2197*c0909341SAndroid Build Coastguard Worker t->bx--;
2198*c0909341SAndroid Build Coastguard Worker t->by++;
2199*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, BS_4x4, PARTITION_SPLIT, tip->split[1]))
2200*c0909341SAndroid Build Coastguard Worker return -1;
2201*c0909341SAndroid Build Coastguard Worker t->bx++;
2202*c0909341SAndroid Build Coastguard Worker t->tl_4x4_filter = tl_filter;
2203*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, BS_4x4, PARTITION_SPLIT, tip->split[2]))
2204*c0909341SAndroid Build Coastguard Worker return -1;
2205*c0909341SAndroid Build Coastguard Worker t->bx--;
2206*c0909341SAndroid Build Coastguard Worker t->by--;
2207*c0909341SAndroid Build Coastguard Worker #if ARCH_X86_64
2208*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass) {
2209*c0909341SAndroid Build Coastguard Worker /* In 8-bit mode with 2-pass decoding the coefficient buffer
2210*c0909341SAndroid Build Coastguard Worker * can end up misaligned due to skips here. Work around
2211*c0909341SAndroid Build Coastguard Worker * the issue by explicitly realigning the buffer. */
2212*c0909341SAndroid Build Coastguard Worker const int p = t->frame_thread.pass & 1;
2213*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].cf =
2214*c0909341SAndroid Build Coastguard Worker (void*)(((uintptr_t)ts->frame_thread[p].cf + 63) & ~63);
2215*c0909341SAndroid Build Coastguard Worker }
2216*c0909341SAndroid Build Coastguard Worker #endif
2217*c0909341SAndroid Build Coastguard Worker } else {
2218*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 0)))
2219*c0909341SAndroid Build Coastguard Worker return 1;
2220*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2221*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 1)))
2222*c0909341SAndroid Build Coastguard Worker return 1;
2223*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2224*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2225*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 2)))
2226*c0909341SAndroid Build Coastguard Worker return 1;
2227*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2228*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 3)))
2229*c0909341SAndroid Build Coastguard Worker return 1;
2230*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2231*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2232*c0909341SAndroid Build Coastguard Worker }
2233*c0909341SAndroid Build Coastguard Worker break;
2234*c0909341SAndroid Build Coastguard Worker case PARTITION_T_TOP_SPLIT: {
2235*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_TOP_SPLIT, EDGE_ALL_TR_AND_BL))
2236*c0909341SAndroid Build Coastguard Worker return -1;
2237*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2238*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_TOP_SPLIT, node->v[1]))
2239*c0909341SAndroid Build Coastguard Worker return -1;
2240*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2241*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2242*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_TOP_SPLIT, node->h[1]))
2243*c0909341SAndroid Build Coastguard Worker return -1;
2244*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2245*c0909341SAndroid Build Coastguard Worker break;
2246*c0909341SAndroid Build Coastguard Worker }
2247*c0909341SAndroid Build Coastguard Worker case PARTITION_T_BOTTOM_SPLIT: {
2248*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_BOTTOM_SPLIT, node->h[0]))
2249*c0909341SAndroid Build Coastguard Worker return -1;
2250*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2251*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_BOTTOM_SPLIT, node->v[0]))
2252*c0909341SAndroid Build Coastguard Worker return -1;
2253*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2254*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_BOTTOM_SPLIT, 0))
2255*c0909341SAndroid Build Coastguard Worker return -1;
2256*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2257*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2258*c0909341SAndroid Build Coastguard Worker break;
2259*c0909341SAndroid Build Coastguard Worker }
2260*c0909341SAndroid Build Coastguard Worker case PARTITION_T_LEFT_SPLIT: {
2261*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_LEFT_SPLIT, EDGE_ALL_TR_AND_BL))
2262*c0909341SAndroid Build Coastguard Worker return -1;
2263*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2264*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_LEFT_SPLIT, node->h[1]))
2265*c0909341SAndroid Build Coastguard Worker return -1;
2266*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2267*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2268*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_LEFT_SPLIT, node->v[1]))
2269*c0909341SAndroid Build Coastguard Worker return -1;
2270*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2271*c0909341SAndroid Build Coastguard Worker break;
2272*c0909341SAndroid Build Coastguard Worker }
2273*c0909341SAndroid Build Coastguard Worker case PARTITION_T_RIGHT_SPLIT: {
2274*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_T_RIGHT_SPLIT, node->v[0]))
2275*c0909341SAndroid Build Coastguard Worker return -1;
2276*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2277*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_RIGHT_SPLIT, node->h[0]))
2278*c0909341SAndroid Build Coastguard Worker return -1;
2279*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2280*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[1], PARTITION_T_RIGHT_SPLIT, 0))
2281*c0909341SAndroid Build Coastguard Worker return -1;
2282*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2283*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2284*c0909341SAndroid Build Coastguard Worker break;
2285*c0909341SAndroid Build Coastguard Worker }
2286*c0909341SAndroid Build Coastguard Worker case PARTITION_H4: {
2287*c0909341SAndroid Build Coastguard Worker const EdgeBranch *const branch = (const EdgeBranch *) node;
2288*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H4, node->h[0]))
2289*c0909341SAndroid Build Coastguard Worker return -1;
2290*c0909341SAndroid Build Coastguard Worker t->by += hsz >> 1;
2291*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H4, branch->h4))
2292*c0909341SAndroid Build Coastguard Worker return -1;
2293*c0909341SAndroid Build Coastguard Worker t->by += hsz >> 1;
2294*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H4, EDGE_ALL_LEFT_HAS_BOTTOM))
2295*c0909341SAndroid Build Coastguard Worker return -1;
2296*c0909341SAndroid Build Coastguard Worker t->by += hsz >> 1;
2297*c0909341SAndroid Build Coastguard Worker if (t->by < f->bh)
2298*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_H4, node->h[1]))
2299*c0909341SAndroid Build Coastguard Worker return -1;
2300*c0909341SAndroid Build Coastguard Worker t->by -= hsz * 3 >> 1;
2301*c0909341SAndroid Build Coastguard Worker break;
2302*c0909341SAndroid Build Coastguard Worker }
2303*c0909341SAndroid Build Coastguard Worker case PARTITION_V4: {
2304*c0909341SAndroid Build Coastguard Worker const EdgeBranch *const branch = (const EdgeBranch *) node;
2305*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V4, node->v[0]))
2306*c0909341SAndroid Build Coastguard Worker return -1;
2307*c0909341SAndroid Build Coastguard Worker t->bx += hsz >> 1;
2308*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V4, branch->v4))
2309*c0909341SAndroid Build Coastguard Worker return -1;
2310*c0909341SAndroid Build Coastguard Worker t->bx += hsz >> 1;
2311*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V4, EDGE_ALL_TOP_HAS_RIGHT))
2312*c0909341SAndroid Build Coastguard Worker return -1;
2313*c0909341SAndroid Build Coastguard Worker t->bx += hsz >> 1;
2314*c0909341SAndroid Build Coastguard Worker if (t->bx < f->bw)
2315*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, b[0], PARTITION_V4, node->v[1]))
2316*c0909341SAndroid Build Coastguard Worker return -1;
2317*c0909341SAndroid Build Coastguard Worker t->bx -= hsz * 3 >> 1;
2318*c0909341SAndroid Build Coastguard Worker break;
2319*c0909341SAndroid Build Coastguard Worker }
2320*c0909341SAndroid Build Coastguard Worker default: assert(0);
2321*c0909341SAndroid Build Coastguard Worker }
2322*c0909341SAndroid Build Coastguard Worker } else if (have_h_split) {
2323*c0909341SAndroid Build Coastguard Worker unsigned is_split;
2324*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 2) {
2325*c0909341SAndroid Build Coastguard Worker const Av1Block *const b = &f->frame_thread.b[t->by * f->b4_stride + t->bx];
2326*c0909341SAndroid Build Coastguard Worker is_split = b->bl != bl;
2327*c0909341SAndroid Build Coastguard Worker } else {
2328*c0909341SAndroid Build Coastguard Worker is_split = dav1d_msac_decode_bool(&ts->msac,
2329*c0909341SAndroid Build Coastguard Worker gather_top_partition_prob(pc, bl));
2330*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
2331*c0909341SAndroid Build Coastguard Worker printf("poc=%d,y=%d,x=%d,bl=%d,ctx=%d,bp=%d: r=%d\n",
2332*c0909341SAndroid Build Coastguard Worker f->frame_hdr->frame_offset, t->by, t->bx, bl, ctx,
2333*c0909341SAndroid Build Coastguard Worker is_split ? PARTITION_SPLIT : PARTITION_H, ts->msac.rng);
2334*c0909341SAndroid Build Coastguard Worker }
2335*c0909341SAndroid Build Coastguard Worker
2336*c0909341SAndroid Build Coastguard Worker assert(bl < BL_8X8);
2337*c0909341SAndroid Build Coastguard Worker if (is_split) {
2338*c0909341SAndroid Build Coastguard Worker bp = PARTITION_SPLIT;
2339*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 0))) return 1;
2340*c0909341SAndroid Build Coastguard Worker t->bx += hsz;
2341*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 1))) return 1;
2342*c0909341SAndroid Build Coastguard Worker t->bx -= hsz;
2343*c0909341SAndroid Build Coastguard Worker } else {
2344*c0909341SAndroid Build Coastguard Worker bp = PARTITION_H;
2345*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, dav1d_block_sizes[bl][PARTITION_H][0],
2346*c0909341SAndroid Build Coastguard Worker PARTITION_H, node->h[0]))
2347*c0909341SAndroid Build Coastguard Worker return -1;
2348*c0909341SAndroid Build Coastguard Worker }
2349*c0909341SAndroid Build Coastguard Worker } else {
2350*c0909341SAndroid Build Coastguard Worker assert(have_v_split);
2351*c0909341SAndroid Build Coastguard Worker unsigned is_split;
2352*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 2) {
2353*c0909341SAndroid Build Coastguard Worker const Av1Block *const b = &f->frame_thread.b[t->by * f->b4_stride + t->bx];
2354*c0909341SAndroid Build Coastguard Worker is_split = b->bl != bl;
2355*c0909341SAndroid Build Coastguard Worker } else {
2356*c0909341SAndroid Build Coastguard Worker is_split = dav1d_msac_decode_bool(&ts->msac,
2357*c0909341SAndroid Build Coastguard Worker gather_left_partition_prob(pc, bl));
2358*c0909341SAndroid Build Coastguard Worker if (f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I422 && !is_split)
2359*c0909341SAndroid Build Coastguard Worker return 1;
2360*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
2361*c0909341SAndroid Build Coastguard Worker printf("poc=%d,y=%d,x=%d,bl=%d,ctx=%d,bp=%d: r=%d\n",
2362*c0909341SAndroid Build Coastguard Worker f->frame_hdr->frame_offset, t->by, t->bx, bl, ctx,
2363*c0909341SAndroid Build Coastguard Worker is_split ? PARTITION_SPLIT : PARTITION_V, ts->msac.rng);
2364*c0909341SAndroid Build Coastguard Worker }
2365*c0909341SAndroid Build Coastguard Worker
2366*c0909341SAndroid Build Coastguard Worker assert(bl < BL_8X8);
2367*c0909341SAndroid Build Coastguard Worker if (is_split) {
2368*c0909341SAndroid Build Coastguard Worker bp = PARTITION_SPLIT;
2369*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 0))) return 1;
2370*c0909341SAndroid Build Coastguard Worker t->by += hsz;
2371*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, bl + 1, INTRA_EDGE_SPLIT(node, 2))) return 1;
2372*c0909341SAndroid Build Coastguard Worker t->by -= hsz;
2373*c0909341SAndroid Build Coastguard Worker } else {
2374*c0909341SAndroid Build Coastguard Worker bp = PARTITION_V;
2375*c0909341SAndroid Build Coastguard Worker if (decode_b(t, bl, dav1d_block_sizes[bl][PARTITION_V][0],
2376*c0909341SAndroid Build Coastguard Worker PARTITION_V, node->v[0]))
2377*c0909341SAndroid Build Coastguard Worker return -1;
2378*c0909341SAndroid Build Coastguard Worker }
2379*c0909341SAndroid Build Coastguard Worker }
2380*c0909341SAndroid Build Coastguard Worker
2381*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass != 2 && (bp != PARTITION_SPLIT || bl == BL_8X8)) {
2382*c0909341SAndroid Build Coastguard Worker #define set_ctx(rep_macro) \
2383*c0909341SAndroid Build Coastguard Worker rep_macro(t->a->partition, bx8, dav1d_al_part_ctx[0][bl][bp]); \
2384*c0909341SAndroid Build Coastguard Worker rep_macro(t->l.partition, by8, dav1d_al_part_ctx[1][bl][bp])
2385*c0909341SAndroid Build Coastguard Worker case_set_upto16(ulog2(hsz));
2386*c0909341SAndroid Build Coastguard Worker #undef set_ctx
2387*c0909341SAndroid Build Coastguard Worker }
2388*c0909341SAndroid Build Coastguard Worker
2389*c0909341SAndroid Build Coastguard Worker return 0;
2390*c0909341SAndroid Build Coastguard Worker }
2391*c0909341SAndroid Build Coastguard Worker
reset_context(BlockContext * const ctx,const int keyframe,const int pass)2392*c0909341SAndroid Build Coastguard Worker static void reset_context(BlockContext *const ctx, const int keyframe, const int pass) {
2393*c0909341SAndroid Build Coastguard Worker memset(ctx->intra, keyframe, sizeof(ctx->intra));
2394*c0909341SAndroid Build Coastguard Worker memset(ctx->uvmode, DC_PRED, sizeof(ctx->uvmode));
2395*c0909341SAndroid Build Coastguard Worker if (keyframe)
2396*c0909341SAndroid Build Coastguard Worker memset(ctx->mode, DC_PRED, sizeof(ctx->mode));
2397*c0909341SAndroid Build Coastguard Worker
2398*c0909341SAndroid Build Coastguard Worker if (pass == 2) return;
2399*c0909341SAndroid Build Coastguard Worker
2400*c0909341SAndroid Build Coastguard Worker memset(ctx->partition, 0, sizeof(ctx->partition));
2401*c0909341SAndroid Build Coastguard Worker memset(ctx->skip, 0, sizeof(ctx->skip));
2402*c0909341SAndroid Build Coastguard Worker memset(ctx->skip_mode, 0, sizeof(ctx->skip_mode));
2403*c0909341SAndroid Build Coastguard Worker memset(ctx->tx_lpf_y, 2, sizeof(ctx->tx_lpf_y));
2404*c0909341SAndroid Build Coastguard Worker memset(ctx->tx_lpf_uv, 1, sizeof(ctx->tx_lpf_uv));
2405*c0909341SAndroid Build Coastguard Worker memset(ctx->tx_intra, -1, sizeof(ctx->tx_intra));
2406*c0909341SAndroid Build Coastguard Worker memset(ctx->tx, TX_64X64, sizeof(ctx->tx));
2407*c0909341SAndroid Build Coastguard Worker if (!keyframe) {
2408*c0909341SAndroid Build Coastguard Worker memset(ctx->ref, -1, sizeof(ctx->ref));
2409*c0909341SAndroid Build Coastguard Worker memset(ctx->comp_type, 0, sizeof(ctx->comp_type));
2410*c0909341SAndroid Build Coastguard Worker memset(ctx->mode, NEARESTMV, sizeof(ctx->mode));
2411*c0909341SAndroid Build Coastguard Worker }
2412*c0909341SAndroid Build Coastguard Worker memset(ctx->lcoef, 0x40, sizeof(ctx->lcoef));
2413*c0909341SAndroid Build Coastguard Worker memset(ctx->ccoef, 0x40, sizeof(ctx->ccoef));
2414*c0909341SAndroid Build Coastguard Worker memset(ctx->filter, DAV1D_N_SWITCHABLE_FILTERS, sizeof(ctx->filter));
2415*c0909341SAndroid Build Coastguard Worker memset(ctx->seg_pred, 0, sizeof(ctx->seg_pred));
2416*c0909341SAndroid Build Coastguard Worker memset(ctx->pal_sz, 0, sizeof(ctx->pal_sz));
2417*c0909341SAndroid Build Coastguard Worker }
2418*c0909341SAndroid Build Coastguard Worker
2419*c0909341SAndroid Build Coastguard Worker // { Y+U+V, Y+U } * 4
2420*c0909341SAndroid Build Coastguard Worker static const uint8_t ss_size_mul[4][2] = {
2421*c0909341SAndroid Build Coastguard Worker [DAV1D_PIXEL_LAYOUT_I400] = { 4, 4 },
2422*c0909341SAndroid Build Coastguard Worker [DAV1D_PIXEL_LAYOUT_I420] = { 6, 5 },
2423*c0909341SAndroid Build Coastguard Worker [DAV1D_PIXEL_LAYOUT_I422] = { 8, 6 },
2424*c0909341SAndroid Build Coastguard Worker [DAV1D_PIXEL_LAYOUT_I444] = { 12, 8 },
2425*c0909341SAndroid Build Coastguard Worker };
2426*c0909341SAndroid Build Coastguard Worker
setup_tile(Dav1dTileState * const ts,const Dav1dFrameContext * const f,const uint8_t * const data,const size_t sz,const int tile_row,const int tile_col,const unsigned tile_start_off)2427*c0909341SAndroid Build Coastguard Worker static void setup_tile(Dav1dTileState *const ts,
2428*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f,
2429*c0909341SAndroid Build Coastguard Worker const uint8_t *const data, const size_t sz,
2430*c0909341SAndroid Build Coastguard Worker const int tile_row, const int tile_col,
2431*c0909341SAndroid Build Coastguard Worker const unsigned tile_start_off)
2432*c0909341SAndroid Build Coastguard Worker {
2433*c0909341SAndroid Build Coastguard Worker const int col_sb_start = f->frame_hdr->tiling.col_start_sb[tile_col];
2434*c0909341SAndroid Build Coastguard Worker const int col_sb128_start = col_sb_start >> !f->seq_hdr->sb128;
2435*c0909341SAndroid Build Coastguard Worker const int col_sb_end = f->frame_hdr->tiling.col_start_sb[tile_col + 1];
2436*c0909341SAndroid Build Coastguard Worker const int row_sb_start = f->frame_hdr->tiling.row_start_sb[tile_row];
2437*c0909341SAndroid Build Coastguard Worker const int row_sb_end = f->frame_hdr->tiling.row_start_sb[tile_row + 1];
2438*c0909341SAndroid Build Coastguard Worker const int sb_shift = f->sb_shift;
2439*c0909341SAndroid Build Coastguard Worker
2440*c0909341SAndroid Build Coastguard Worker const uint8_t *const size_mul = ss_size_mul[f->cur.p.layout];
2441*c0909341SAndroid Build Coastguard Worker for (int p = 0; p < 2; p++) {
2442*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].pal_idx = f->frame_thread.pal_idx ?
2443*c0909341SAndroid Build Coastguard Worker &f->frame_thread.pal_idx[(size_t)tile_start_off * size_mul[1] / 8] :
2444*c0909341SAndroid Build Coastguard Worker NULL;
2445*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].cbi = f->frame_thread.cbi ?
2446*c0909341SAndroid Build Coastguard Worker &f->frame_thread.cbi[(size_t)tile_start_off * size_mul[0] / 64] :
2447*c0909341SAndroid Build Coastguard Worker NULL;
2448*c0909341SAndroid Build Coastguard Worker ts->frame_thread[p].cf = f->frame_thread.cf ?
2449*c0909341SAndroid Build Coastguard Worker (uint8_t*)f->frame_thread.cf +
2450*c0909341SAndroid Build Coastguard Worker (((size_t)tile_start_off * size_mul[0]) >> !f->seq_hdr->hbd) :
2451*c0909341SAndroid Build Coastguard Worker NULL;
2452*c0909341SAndroid Build Coastguard Worker }
2453*c0909341SAndroid Build Coastguard Worker
2454*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_copy(&ts->cdf, &f->in_cdf);
2455*c0909341SAndroid Build Coastguard Worker ts->last_qidx = f->frame_hdr->quant.yac;
2456*c0909341SAndroid Build Coastguard Worker ts->last_delta_lf.u32 = 0;
2457*c0909341SAndroid Build Coastguard Worker
2458*c0909341SAndroid Build Coastguard Worker dav1d_msac_init(&ts->msac, data, sz, f->frame_hdr->disable_cdf_update);
2459*c0909341SAndroid Build Coastguard Worker
2460*c0909341SAndroid Build Coastguard Worker ts->tiling.row = tile_row;
2461*c0909341SAndroid Build Coastguard Worker ts->tiling.col = tile_col;
2462*c0909341SAndroid Build Coastguard Worker ts->tiling.col_start = col_sb_start << sb_shift;
2463*c0909341SAndroid Build Coastguard Worker ts->tiling.col_end = imin(col_sb_end << sb_shift, f->bw);
2464*c0909341SAndroid Build Coastguard Worker ts->tiling.row_start = row_sb_start << sb_shift;
2465*c0909341SAndroid Build Coastguard Worker ts->tiling.row_end = imin(row_sb_end << sb_shift, f->bh);
2466*c0909341SAndroid Build Coastguard Worker
2467*c0909341SAndroid Build Coastguard Worker // Reference Restoration Unit (used for exp coding)
2468*c0909341SAndroid Build Coastguard Worker int sb_idx, unit_idx;
2469*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != f->frame_hdr->width[1]) {
2470*c0909341SAndroid Build Coastguard Worker // vertical components only
2471*c0909341SAndroid Build Coastguard Worker sb_idx = (ts->tiling.row_start >> 5) * f->sr_sb128w;
2472*c0909341SAndroid Build Coastguard Worker unit_idx = (ts->tiling.row_start & 16) >> 3;
2473*c0909341SAndroid Build Coastguard Worker } else {
2474*c0909341SAndroid Build Coastguard Worker sb_idx = (ts->tiling.row_start >> 5) * f->sb128w + col_sb128_start;
2475*c0909341SAndroid Build Coastguard Worker unit_idx = ((ts->tiling.row_start & 16) >> 3) +
2476*c0909341SAndroid Build Coastguard Worker ((ts->tiling.col_start & 16) >> 4);
2477*c0909341SAndroid Build Coastguard Worker }
2478*c0909341SAndroid Build Coastguard Worker for (int p = 0; p < 3; p++) {
2479*c0909341SAndroid Build Coastguard Worker if (!((f->lf.restore_planes >> p) & 1U))
2480*c0909341SAndroid Build Coastguard Worker continue;
2481*c0909341SAndroid Build Coastguard Worker
2482*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != f->frame_hdr->width[1]) {
2483*c0909341SAndroid Build Coastguard Worker const int ss_hor = p && f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
2484*c0909341SAndroid Build Coastguard Worker const int d = f->frame_hdr->super_res.width_scale_denominator;
2485*c0909341SAndroid Build Coastguard Worker const int unit_size_log2 = f->frame_hdr->restoration.unit_size[!!p];
2486*c0909341SAndroid Build Coastguard Worker const int rnd = (8 << unit_size_log2) - 1, shift = unit_size_log2 + 3;
2487*c0909341SAndroid Build Coastguard Worker const int x = ((4 * ts->tiling.col_start * d >> ss_hor) + rnd) >> shift;
2488*c0909341SAndroid Build Coastguard Worker const int px_x = x << (unit_size_log2 + ss_hor);
2489*c0909341SAndroid Build Coastguard Worker const int u_idx = unit_idx + ((px_x & 64) >> 6);
2490*c0909341SAndroid Build Coastguard Worker const int sb128x = px_x >> 7;
2491*c0909341SAndroid Build Coastguard Worker if (sb128x >= f->sr_sb128w) continue;
2492*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p] = &f->lf.lr_mask[sb_idx + sb128x].lr[p][u_idx];
2493*c0909341SAndroid Build Coastguard Worker } else {
2494*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p] = &f->lf.lr_mask[sb_idx].lr[p][unit_idx];
2495*c0909341SAndroid Build Coastguard Worker }
2496*c0909341SAndroid Build Coastguard Worker
2497*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[0] = 3;
2498*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[1] = -7;
2499*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[2] = 15;
2500*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[0] = 3;
2501*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[1] = -7;
2502*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[2] = 15;
2503*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->sgr_weights[0] = -32;
2504*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->sgr_weights[1] = 31;
2505*c0909341SAndroid Build Coastguard Worker }
2506*c0909341SAndroid Build Coastguard Worker
2507*c0909341SAndroid Build Coastguard Worker if (f->c->n_tc > 1) {
2508*c0909341SAndroid Build Coastguard Worker for (int p = 0; p < 2; p++)
2509*c0909341SAndroid Build Coastguard Worker atomic_init(&ts->progress[p], row_sb_start);
2510*c0909341SAndroid Build Coastguard Worker }
2511*c0909341SAndroid Build Coastguard Worker }
2512*c0909341SAndroid Build Coastguard Worker
read_restoration_info(Dav1dTaskContext * const t,Av1RestorationUnit * const lr,const int p,const enum Dav1dRestorationType frame_type)2513*c0909341SAndroid Build Coastguard Worker static void read_restoration_info(Dav1dTaskContext *const t,
2514*c0909341SAndroid Build Coastguard Worker Av1RestorationUnit *const lr, const int p,
2515*c0909341SAndroid Build Coastguard Worker const enum Dav1dRestorationType frame_type)
2516*c0909341SAndroid Build Coastguard Worker {
2517*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
2518*c0909341SAndroid Build Coastguard Worker Dav1dTileState *const ts = t->ts;
2519*c0909341SAndroid Build Coastguard Worker
2520*c0909341SAndroid Build Coastguard Worker if (frame_type == DAV1D_RESTORATION_SWITCHABLE) {
2521*c0909341SAndroid Build Coastguard Worker const int filter = dav1d_msac_decode_symbol_adapt4(&ts->msac,
2522*c0909341SAndroid Build Coastguard Worker ts->cdf.m.restore_switchable, 2);
2523*c0909341SAndroid Build Coastguard Worker lr->type = filter + !!filter; /* NONE/WIENER/SGRPROJ */
2524*c0909341SAndroid Build Coastguard Worker } else {
2525*c0909341SAndroid Build Coastguard Worker const unsigned type =
2526*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_bool_adapt(&ts->msac,
2527*c0909341SAndroid Build Coastguard Worker frame_type == DAV1D_RESTORATION_WIENER ?
2528*c0909341SAndroid Build Coastguard Worker ts->cdf.m.restore_wiener : ts->cdf.m.restore_sgrproj);
2529*c0909341SAndroid Build Coastguard Worker lr->type = type ? frame_type : DAV1D_RESTORATION_NONE;
2530*c0909341SAndroid Build Coastguard Worker }
2531*c0909341SAndroid Build Coastguard Worker
2532*c0909341SAndroid Build Coastguard Worker if (lr->type == DAV1D_RESTORATION_WIENER) {
2533*c0909341SAndroid Build Coastguard Worker lr->filter_v[0] = p ? 0 :
2534*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2535*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[0] + 5, 16, 1) - 5;
2536*c0909341SAndroid Build Coastguard Worker lr->filter_v[1] =
2537*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2538*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[1] + 23, 32, 2) - 23;
2539*c0909341SAndroid Build Coastguard Worker lr->filter_v[2] =
2540*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2541*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_v[2] + 17, 64, 3) - 17;
2542*c0909341SAndroid Build Coastguard Worker
2543*c0909341SAndroid Build Coastguard Worker lr->filter_h[0] = p ? 0 :
2544*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2545*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[0] + 5, 16, 1) - 5;
2546*c0909341SAndroid Build Coastguard Worker lr->filter_h[1] =
2547*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2548*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[1] + 23, 32, 2) - 23;
2549*c0909341SAndroid Build Coastguard Worker lr->filter_h[2] =
2550*c0909341SAndroid Build Coastguard Worker dav1d_msac_decode_subexp(&ts->msac,
2551*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->filter_h[2] + 17, 64, 3) - 17;
2552*c0909341SAndroid Build Coastguard Worker memcpy(lr->sgr_weights, ts->lr_ref[p]->sgr_weights, sizeof(lr->sgr_weights));
2553*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p] = lr;
2554*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
2555*c0909341SAndroid Build Coastguard Worker printf("Post-lr_wiener[pl=%d,v[%d,%d,%d],h[%d,%d,%d]]: r=%d\n",
2556*c0909341SAndroid Build Coastguard Worker p, lr->filter_v[0], lr->filter_v[1],
2557*c0909341SAndroid Build Coastguard Worker lr->filter_v[2], lr->filter_h[0],
2558*c0909341SAndroid Build Coastguard Worker lr->filter_h[1], lr->filter_h[2], ts->msac.rng);
2559*c0909341SAndroid Build Coastguard Worker } else if (lr->type == DAV1D_RESTORATION_SGRPROJ) {
2560*c0909341SAndroid Build Coastguard Worker const unsigned idx = dav1d_msac_decode_bools(&ts->msac, 4);
2561*c0909341SAndroid Build Coastguard Worker const uint16_t *const sgr_params = dav1d_sgr_params[idx];
2562*c0909341SAndroid Build Coastguard Worker lr->type += idx;
2563*c0909341SAndroid Build Coastguard Worker lr->sgr_weights[0] = sgr_params[0] ? dav1d_msac_decode_subexp(&ts->msac,
2564*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->sgr_weights[0] + 96, 128, 4) - 96 : 0;
2565*c0909341SAndroid Build Coastguard Worker lr->sgr_weights[1] = sgr_params[1] ? dav1d_msac_decode_subexp(&ts->msac,
2566*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p]->sgr_weights[1] + 32, 128, 4) - 32 : 95;
2567*c0909341SAndroid Build Coastguard Worker memcpy(lr->filter_v, ts->lr_ref[p]->filter_v, sizeof(lr->filter_v));
2568*c0909341SAndroid Build Coastguard Worker memcpy(lr->filter_h, ts->lr_ref[p]->filter_h, sizeof(lr->filter_h));
2569*c0909341SAndroid Build Coastguard Worker ts->lr_ref[p] = lr;
2570*c0909341SAndroid Build Coastguard Worker if (DEBUG_BLOCK_INFO)
2571*c0909341SAndroid Build Coastguard Worker printf("Post-lr_sgrproj[pl=%d,idx=%d,w[%d,%d]]: r=%d\n",
2572*c0909341SAndroid Build Coastguard Worker p, idx, lr->sgr_weights[0],
2573*c0909341SAndroid Build Coastguard Worker lr->sgr_weights[1], ts->msac.rng);
2574*c0909341SAndroid Build Coastguard Worker }
2575*c0909341SAndroid Build Coastguard Worker }
2576*c0909341SAndroid Build Coastguard Worker
2577*c0909341SAndroid Build Coastguard Worker // modeled after the equivalent function in aomdec:decodeframe.c
check_trailing_bits_after_symbol_coder(const MsacContext * const msac)2578*c0909341SAndroid Build Coastguard Worker static int check_trailing_bits_after_symbol_coder(const MsacContext *const msac) {
2579*c0909341SAndroid Build Coastguard Worker // check marker bit (single 1), followed by zeroes
2580*c0909341SAndroid Build Coastguard Worker const int n_bits = -(msac->cnt + 14);
2581*c0909341SAndroid Build Coastguard Worker assert(n_bits <= 0); // this assumes we errored out when cnt <= -15 in caller
2582*c0909341SAndroid Build Coastguard Worker const int n_bytes = (n_bits + 7) >> 3;
2583*c0909341SAndroid Build Coastguard Worker const uint8_t *p = &msac->buf_pos[n_bytes];
2584*c0909341SAndroid Build Coastguard Worker const int pattern = 128 >> ((n_bits - 1) & 7);
2585*c0909341SAndroid Build Coastguard Worker if ((p[-1] & (2 * pattern - 1)) != pattern)
2586*c0909341SAndroid Build Coastguard Worker return 1;
2587*c0909341SAndroid Build Coastguard Worker
2588*c0909341SAndroid Build Coastguard Worker // check remainder zero bytes
2589*c0909341SAndroid Build Coastguard Worker for (; p < msac->buf_end; p++)
2590*c0909341SAndroid Build Coastguard Worker if (*p)
2591*c0909341SAndroid Build Coastguard Worker return 1;
2592*c0909341SAndroid Build Coastguard Worker
2593*c0909341SAndroid Build Coastguard Worker return 0;
2594*c0909341SAndroid Build Coastguard Worker }
2595*c0909341SAndroid Build Coastguard Worker
dav1d_decode_tile_sbrow(Dav1dTaskContext * const t)2596*c0909341SAndroid Build Coastguard Worker int dav1d_decode_tile_sbrow(Dav1dTaskContext *const t) {
2597*c0909341SAndroid Build Coastguard Worker const Dav1dFrameContext *const f = t->f;
2598*c0909341SAndroid Build Coastguard Worker const enum BlockLevel root_bl = f->seq_hdr->sb128 ? BL_128X128 : BL_64X64;
2599*c0909341SAndroid Build Coastguard Worker Dav1dTileState *const ts = t->ts;
2600*c0909341SAndroid Build Coastguard Worker const Dav1dContext *const c = f->c;
2601*c0909341SAndroid Build Coastguard Worker const int sb_step = f->sb_step;
2602*c0909341SAndroid Build Coastguard Worker const int tile_row = ts->tiling.row, tile_col = ts->tiling.col;
2603*c0909341SAndroid Build Coastguard Worker const int col_sb_start = f->frame_hdr->tiling.col_start_sb[tile_col];
2604*c0909341SAndroid Build Coastguard Worker const int col_sb128_start = col_sb_start >> !f->seq_hdr->sb128;
2605*c0909341SAndroid Build Coastguard Worker
2606*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) || f->frame_hdr->allow_intrabc) {
2607*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_tile_sbrow_init(&t->rt, &f->rf, ts->tiling.col_start,
2608*c0909341SAndroid Build Coastguard Worker ts->tiling.col_end, ts->tiling.row_start,
2609*c0909341SAndroid Build Coastguard Worker ts->tiling.row_end, t->by >> f->sb_shift,
2610*c0909341SAndroid Build Coastguard Worker ts->tiling.row, t->frame_thread.pass);
2611*c0909341SAndroid Build Coastguard Worker }
2612*c0909341SAndroid Build Coastguard Worker
2613*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) && c->n_fc > 1) {
2614*c0909341SAndroid Build Coastguard Worker const int sby = (t->by - ts->tiling.row_start) >> f->sb_shift;
2615*c0909341SAndroid Build Coastguard Worker int (*const lowest_px)[2] = ts->lowest_pixel[sby];
2616*c0909341SAndroid Build Coastguard Worker for (int n = 0; n < 7; n++)
2617*c0909341SAndroid Build Coastguard Worker for (int m = 0; m < 2; m++)
2618*c0909341SAndroid Build Coastguard Worker lowest_px[n][m] = INT_MIN;
2619*c0909341SAndroid Build Coastguard Worker }
2620*c0909341SAndroid Build Coastguard Worker
2621*c0909341SAndroid Build Coastguard Worker reset_context(&t->l, IS_KEY_OR_INTRA(f->frame_hdr), t->frame_thread.pass);
2622*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass == 2) {
2623*c0909341SAndroid Build Coastguard Worker const int off_2pass = c->n_tc > 1 ? f->sb128w * f->frame_hdr->tiling.rows : 0;
2624*c0909341SAndroid Build Coastguard Worker for (t->bx = ts->tiling.col_start,
2625*c0909341SAndroid Build Coastguard Worker t->a = f->a + off_2pass + col_sb128_start + tile_row * f->sb128w;
2626*c0909341SAndroid Build Coastguard Worker t->bx < ts->tiling.col_end; t->bx += sb_step)
2627*c0909341SAndroid Build Coastguard Worker {
2628*c0909341SAndroid Build Coastguard Worker if (atomic_load_explicit(c->flush, memory_order_acquire))
2629*c0909341SAndroid Build Coastguard Worker return 1;
2630*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, root_bl, dav1d_intra_edge_tree[root_bl]))
2631*c0909341SAndroid Build Coastguard Worker return 1;
2632*c0909341SAndroid Build Coastguard Worker if (t->bx & 16 || f->seq_hdr->sb128)
2633*c0909341SAndroid Build Coastguard Worker t->a++;
2634*c0909341SAndroid Build Coastguard Worker }
2635*c0909341SAndroid Build Coastguard Worker f->bd_fn.backup_ipred_edge(t);
2636*c0909341SAndroid Build Coastguard Worker return 0;
2637*c0909341SAndroid Build Coastguard Worker }
2638*c0909341SAndroid Build Coastguard Worker
2639*c0909341SAndroid Build Coastguard Worker if (f->c->n_tc > 1 && f->frame_hdr->use_ref_frame_mvs) {
2640*c0909341SAndroid Build Coastguard Worker f->c->refmvs_dsp.load_tmvs(&f->rf, ts->tiling.row,
2641*c0909341SAndroid Build Coastguard Worker ts->tiling.col_start >> 1, ts->tiling.col_end >> 1,
2642*c0909341SAndroid Build Coastguard Worker t->by >> 1, (t->by + sb_step) >> 1);
2643*c0909341SAndroid Build Coastguard Worker }
2644*c0909341SAndroid Build Coastguard Worker memset(t->pal_sz_uv[1], 0, sizeof(*t->pal_sz_uv));
2645*c0909341SAndroid Build Coastguard Worker const int sb128y = t->by >> 5;
2646*c0909341SAndroid Build Coastguard Worker for (t->bx = ts->tiling.col_start, t->a = f->a + col_sb128_start + tile_row * f->sb128w,
2647*c0909341SAndroid Build Coastguard Worker t->lf_mask = f->lf.mask + sb128y * f->sb128w + col_sb128_start;
2648*c0909341SAndroid Build Coastguard Worker t->bx < ts->tiling.col_end; t->bx += sb_step)
2649*c0909341SAndroid Build Coastguard Worker {
2650*c0909341SAndroid Build Coastguard Worker if (atomic_load_explicit(c->flush, memory_order_acquire))
2651*c0909341SAndroid Build Coastguard Worker return 1;
2652*c0909341SAndroid Build Coastguard Worker if (root_bl == BL_128X128) {
2653*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr = t->lf_mask->cdef_idx;
2654*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[0] = -1;
2655*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[1] = -1;
2656*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[2] = -1;
2657*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[3] = -1;
2658*c0909341SAndroid Build Coastguard Worker } else {
2659*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr =
2660*c0909341SAndroid Build Coastguard Worker &t->lf_mask->cdef_idx[((t->bx & 16) >> 4) +
2661*c0909341SAndroid Build Coastguard Worker ((t->by & 16) >> 3)];
2662*c0909341SAndroid Build Coastguard Worker t->cur_sb_cdef_idx_ptr[0] = -1;
2663*c0909341SAndroid Build Coastguard Worker }
2664*c0909341SAndroid Build Coastguard Worker // Restoration filter
2665*c0909341SAndroid Build Coastguard Worker for (int p = 0; p < 3; p++) {
2666*c0909341SAndroid Build Coastguard Worker if (!((f->lf.restore_planes >> p) & 1U))
2667*c0909341SAndroid Build Coastguard Worker continue;
2668*c0909341SAndroid Build Coastguard Worker
2669*c0909341SAndroid Build Coastguard Worker const int ss_ver = p && f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
2670*c0909341SAndroid Build Coastguard Worker const int ss_hor = p && f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
2671*c0909341SAndroid Build Coastguard Worker const int unit_size_log2 = f->frame_hdr->restoration.unit_size[!!p];
2672*c0909341SAndroid Build Coastguard Worker const int y = t->by * 4 >> ss_ver;
2673*c0909341SAndroid Build Coastguard Worker const int h = (f->cur.p.h + ss_ver) >> ss_ver;
2674*c0909341SAndroid Build Coastguard Worker
2675*c0909341SAndroid Build Coastguard Worker const int unit_size = 1 << unit_size_log2;
2676*c0909341SAndroid Build Coastguard Worker const unsigned mask = unit_size - 1;
2677*c0909341SAndroid Build Coastguard Worker if (y & mask) continue;
2678*c0909341SAndroid Build Coastguard Worker const int half_unit = unit_size >> 1;
2679*c0909341SAndroid Build Coastguard Worker // Round half up at frame boundaries, if there's more than one
2680*c0909341SAndroid Build Coastguard Worker // restoration unit
2681*c0909341SAndroid Build Coastguard Worker if (y && y + half_unit > h) continue;
2682*c0909341SAndroid Build Coastguard Worker
2683*c0909341SAndroid Build Coastguard Worker const enum Dav1dRestorationType frame_type = f->frame_hdr->restoration.type[p];
2684*c0909341SAndroid Build Coastguard Worker
2685*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != f->frame_hdr->width[1]) {
2686*c0909341SAndroid Build Coastguard Worker const int w = (f->sr_cur.p.p.w + ss_hor) >> ss_hor;
2687*c0909341SAndroid Build Coastguard Worker const int n_units = imax(1, (w + half_unit) >> unit_size_log2);
2688*c0909341SAndroid Build Coastguard Worker
2689*c0909341SAndroid Build Coastguard Worker const int d = f->frame_hdr->super_res.width_scale_denominator;
2690*c0909341SAndroid Build Coastguard Worker const int rnd = unit_size * 8 - 1, shift = unit_size_log2 + 3;
2691*c0909341SAndroid Build Coastguard Worker const int x0 = ((4 * t->bx * d >> ss_hor) + rnd) >> shift;
2692*c0909341SAndroid Build Coastguard Worker const int x1 = ((4 * (t->bx + sb_step) * d >> ss_hor) + rnd) >> shift;
2693*c0909341SAndroid Build Coastguard Worker
2694*c0909341SAndroid Build Coastguard Worker for (int x = x0; x < imin(x1, n_units); x++) {
2695*c0909341SAndroid Build Coastguard Worker const int px_x = x << (unit_size_log2 + ss_hor);
2696*c0909341SAndroid Build Coastguard Worker const int sb_idx = (t->by >> 5) * f->sr_sb128w + (px_x >> 7);
2697*c0909341SAndroid Build Coastguard Worker const int unit_idx = ((t->by & 16) >> 3) + ((px_x & 64) >> 6);
2698*c0909341SAndroid Build Coastguard Worker Av1RestorationUnit *const lr = &f->lf.lr_mask[sb_idx].lr[p][unit_idx];
2699*c0909341SAndroid Build Coastguard Worker
2700*c0909341SAndroid Build Coastguard Worker read_restoration_info(t, lr, p, frame_type);
2701*c0909341SAndroid Build Coastguard Worker }
2702*c0909341SAndroid Build Coastguard Worker } else {
2703*c0909341SAndroid Build Coastguard Worker const int x = 4 * t->bx >> ss_hor;
2704*c0909341SAndroid Build Coastguard Worker if (x & mask) continue;
2705*c0909341SAndroid Build Coastguard Worker const int w = (f->cur.p.w + ss_hor) >> ss_hor;
2706*c0909341SAndroid Build Coastguard Worker // Round half up at frame boundaries, if there's more than one
2707*c0909341SAndroid Build Coastguard Worker // restoration unit
2708*c0909341SAndroid Build Coastguard Worker if (x && x + half_unit > w) continue;
2709*c0909341SAndroid Build Coastguard Worker const int sb_idx = (t->by >> 5) * f->sr_sb128w + (t->bx >> 5);
2710*c0909341SAndroid Build Coastguard Worker const int unit_idx = ((t->by & 16) >> 3) + ((t->bx & 16) >> 4);
2711*c0909341SAndroid Build Coastguard Worker Av1RestorationUnit *const lr = &f->lf.lr_mask[sb_idx].lr[p][unit_idx];
2712*c0909341SAndroid Build Coastguard Worker
2713*c0909341SAndroid Build Coastguard Worker read_restoration_info(t, lr, p, frame_type);
2714*c0909341SAndroid Build Coastguard Worker }
2715*c0909341SAndroid Build Coastguard Worker }
2716*c0909341SAndroid Build Coastguard Worker if (decode_sb(t, root_bl, dav1d_intra_edge_tree[root_bl]))
2717*c0909341SAndroid Build Coastguard Worker return 1;
2718*c0909341SAndroid Build Coastguard Worker if (t->bx & 16 || f->seq_hdr->sb128) {
2719*c0909341SAndroid Build Coastguard Worker t->a++;
2720*c0909341SAndroid Build Coastguard Worker t->lf_mask++;
2721*c0909341SAndroid Build Coastguard Worker }
2722*c0909341SAndroid Build Coastguard Worker }
2723*c0909341SAndroid Build Coastguard Worker
2724*c0909341SAndroid Build Coastguard Worker if (f->seq_hdr->ref_frame_mvs && f->c->n_tc > 1 && IS_INTER_OR_SWITCH(f->frame_hdr)) {
2725*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_save_tmvs(&f->c->refmvs_dsp, &t->rt,
2726*c0909341SAndroid Build Coastguard Worker ts->tiling.col_start >> 1, ts->tiling.col_end >> 1,
2727*c0909341SAndroid Build Coastguard Worker t->by >> 1, (t->by + sb_step) >> 1);
2728*c0909341SAndroid Build Coastguard Worker }
2729*c0909341SAndroid Build Coastguard Worker
2730*c0909341SAndroid Build Coastguard Worker // backup pre-loopfilter pixels for intra prediction of the next sbrow
2731*c0909341SAndroid Build Coastguard Worker if (t->frame_thread.pass != 1)
2732*c0909341SAndroid Build Coastguard Worker f->bd_fn.backup_ipred_edge(t);
2733*c0909341SAndroid Build Coastguard Worker
2734*c0909341SAndroid Build Coastguard Worker // backup t->a/l.tx_lpf_y/uv at tile boundaries to use them to "fix"
2735*c0909341SAndroid Build Coastguard Worker // up the initial value in neighbour tiles when running the loopfilter
2736*c0909341SAndroid Build Coastguard Worker int align_h = (f->bh + 31) & ~31;
2737*c0909341SAndroid Build Coastguard Worker memcpy(&f->lf.tx_lpf_right_edge[0][align_h * tile_col + t->by],
2738*c0909341SAndroid Build Coastguard Worker &t->l.tx_lpf_y[t->by & 16], sb_step);
2739*c0909341SAndroid Build Coastguard Worker const int ss_ver = f->cur.p.layout == DAV1D_PIXEL_LAYOUT_I420;
2740*c0909341SAndroid Build Coastguard Worker align_h >>= ss_ver;
2741*c0909341SAndroid Build Coastguard Worker memcpy(&f->lf.tx_lpf_right_edge[1][align_h * tile_col + (t->by >> ss_ver)],
2742*c0909341SAndroid Build Coastguard Worker &t->l.tx_lpf_uv[(t->by & 16) >> ss_ver], sb_step >> ss_ver);
2743*c0909341SAndroid Build Coastguard Worker
2744*c0909341SAndroid Build Coastguard Worker // error out on symbol decoder overread
2745*c0909341SAndroid Build Coastguard Worker if (ts->msac.cnt <= -15) return 1;
2746*c0909341SAndroid Build Coastguard Worker
2747*c0909341SAndroid Build Coastguard Worker return c->strict_std_compliance &&
2748*c0909341SAndroid Build Coastguard Worker (t->by >> f->sb_shift) + 1 >= f->frame_hdr->tiling.row_start_sb[tile_row + 1] &&
2749*c0909341SAndroid Build Coastguard Worker check_trailing_bits_after_symbol_coder(&ts->msac);
2750*c0909341SAndroid Build Coastguard Worker }
2751*c0909341SAndroid Build Coastguard Worker
dav1d_decode_frame_init(Dav1dFrameContext * const f)2752*c0909341SAndroid Build Coastguard Worker int dav1d_decode_frame_init(Dav1dFrameContext *const f) {
2753*c0909341SAndroid Build Coastguard Worker const Dav1dContext *const c = f->c;
2754*c0909341SAndroid Build Coastguard Worker int retval = DAV1D_ERR(ENOMEM);
2755*c0909341SAndroid Build Coastguard Worker
2756*c0909341SAndroid Build Coastguard Worker if (f->sbh > f->lf.start_of_tile_row_sz) {
2757*c0909341SAndroid Build Coastguard Worker dav1d_free(f->lf.start_of_tile_row);
2758*c0909341SAndroid Build Coastguard Worker f->lf.start_of_tile_row = dav1d_malloc(ALLOC_TILE, f->sbh * sizeof(uint8_t));
2759*c0909341SAndroid Build Coastguard Worker if (!f->lf.start_of_tile_row) {
2760*c0909341SAndroid Build Coastguard Worker f->lf.start_of_tile_row_sz = 0;
2761*c0909341SAndroid Build Coastguard Worker goto error;
2762*c0909341SAndroid Build Coastguard Worker }
2763*c0909341SAndroid Build Coastguard Worker f->lf.start_of_tile_row_sz = f->sbh;
2764*c0909341SAndroid Build Coastguard Worker }
2765*c0909341SAndroid Build Coastguard Worker int sby = 0;
2766*c0909341SAndroid Build Coastguard Worker for (int tile_row = 0; tile_row < f->frame_hdr->tiling.rows; tile_row++) {
2767*c0909341SAndroid Build Coastguard Worker f->lf.start_of_tile_row[sby++] = tile_row;
2768*c0909341SAndroid Build Coastguard Worker while (sby < f->frame_hdr->tiling.row_start_sb[tile_row + 1])
2769*c0909341SAndroid Build Coastguard Worker f->lf.start_of_tile_row[sby++] = 0;
2770*c0909341SAndroid Build Coastguard Worker }
2771*c0909341SAndroid Build Coastguard Worker
2772*c0909341SAndroid Build Coastguard Worker const int n_ts = f->frame_hdr->tiling.cols * f->frame_hdr->tiling.rows;
2773*c0909341SAndroid Build Coastguard Worker if (n_ts != f->n_ts) {
2774*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1) {
2775*c0909341SAndroid Build Coastguard Worker dav1d_free(f->frame_thread.tile_start_off);
2776*c0909341SAndroid Build Coastguard Worker f->frame_thread.tile_start_off =
2777*c0909341SAndroid Build Coastguard Worker dav1d_malloc(ALLOC_TILE, sizeof(*f->frame_thread.tile_start_off) * n_ts);
2778*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.tile_start_off) {
2779*c0909341SAndroid Build Coastguard Worker f->n_ts = 0;
2780*c0909341SAndroid Build Coastguard Worker goto error;
2781*c0909341SAndroid Build Coastguard Worker }
2782*c0909341SAndroid Build Coastguard Worker }
2783*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->ts);
2784*c0909341SAndroid Build Coastguard Worker f->ts = dav1d_alloc_aligned(ALLOC_TILE, sizeof(*f->ts) * n_ts, 32);
2785*c0909341SAndroid Build Coastguard Worker if (!f->ts) goto error;
2786*c0909341SAndroid Build Coastguard Worker f->n_ts = n_ts;
2787*c0909341SAndroid Build Coastguard Worker }
2788*c0909341SAndroid Build Coastguard Worker
2789*c0909341SAndroid Build Coastguard Worker const int a_sz = f->sb128w * f->frame_hdr->tiling.rows * (1 + (c->n_fc > 1 && c->n_tc > 1));
2790*c0909341SAndroid Build Coastguard Worker if (a_sz != f->a_sz) {
2791*c0909341SAndroid Build Coastguard Worker dav1d_free(f->a);
2792*c0909341SAndroid Build Coastguard Worker f->a = dav1d_malloc(ALLOC_TILE, sizeof(*f->a) * a_sz);
2793*c0909341SAndroid Build Coastguard Worker if (!f->a) {
2794*c0909341SAndroid Build Coastguard Worker f->a_sz = 0;
2795*c0909341SAndroid Build Coastguard Worker goto error;
2796*c0909341SAndroid Build Coastguard Worker }
2797*c0909341SAndroid Build Coastguard Worker f->a_sz = a_sz;
2798*c0909341SAndroid Build Coastguard Worker }
2799*c0909341SAndroid Build Coastguard Worker
2800*c0909341SAndroid Build Coastguard Worker const int num_sb128 = f->sb128w * f->sb128h;
2801*c0909341SAndroid Build Coastguard Worker const uint8_t *const size_mul = ss_size_mul[f->cur.p.layout];
2802*c0909341SAndroid Build Coastguard Worker const int hbd = !!f->seq_hdr->hbd;
2803*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1) {
2804*c0909341SAndroid Build Coastguard Worker const unsigned sb_step4 = f->sb_step * 4;
2805*c0909341SAndroid Build Coastguard Worker int tile_idx = 0;
2806*c0909341SAndroid Build Coastguard Worker for (int tile_row = 0; tile_row < f->frame_hdr->tiling.rows; tile_row++) {
2807*c0909341SAndroid Build Coastguard Worker const unsigned row_off = f->frame_hdr->tiling.row_start_sb[tile_row] *
2808*c0909341SAndroid Build Coastguard Worker sb_step4 * f->sb128w * 128;
2809*c0909341SAndroid Build Coastguard Worker const unsigned b_diff = (f->frame_hdr->tiling.row_start_sb[tile_row + 1] -
2810*c0909341SAndroid Build Coastguard Worker f->frame_hdr->tiling.row_start_sb[tile_row]) * sb_step4;
2811*c0909341SAndroid Build Coastguard Worker for (int tile_col = 0; tile_col < f->frame_hdr->tiling.cols; tile_col++) {
2812*c0909341SAndroid Build Coastguard Worker f->frame_thread.tile_start_off[tile_idx++] = row_off + b_diff *
2813*c0909341SAndroid Build Coastguard Worker f->frame_hdr->tiling.col_start_sb[tile_col] * sb_step4;
2814*c0909341SAndroid Build Coastguard Worker }
2815*c0909341SAndroid Build Coastguard Worker }
2816*c0909341SAndroid Build Coastguard Worker
2817*c0909341SAndroid Build Coastguard Worker const int lowest_pixel_mem_sz = f->frame_hdr->tiling.cols * f->sbh;
2818*c0909341SAndroid Build Coastguard Worker if (lowest_pixel_mem_sz != f->tile_thread.lowest_pixel_mem_sz) {
2819*c0909341SAndroid Build Coastguard Worker dav1d_free(f->tile_thread.lowest_pixel_mem);
2820*c0909341SAndroid Build Coastguard Worker f->tile_thread.lowest_pixel_mem =
2821*c0909341SAndroid Build Coastguard Worker dav1d_malloc(ALLOC_TILE, lowest_pixel_mem_sz *
2822*c0909341SAndroid Build Coastguard Worker sizeof(*f->tile_thread.lowest_pixel_mem));
2823*c0909341SAndroid Build Coastguard Worker if (!f->tile_thread.lowest_pixel_mem) {
2824*c0909341SAndroid Build Coastguard Worker f->tile_thread.lowest_pixel_mem_sz = 0;
2825*c0909341SAndroid Build Coastguard Worker goto error;
2826*c0909341SAndroid Build Coastguard Worker }
2827*c0909341SAndroid Build Coastguard Worker f->tile_thread.lowest_pixel_mem_sz = lowest_pixel_mem_sz;
2828*c0909341SAndroid Build Coastguard Worker }
2829*c0909341SAndroid Build Coastguard Worker int (*lowest_pixel_ptr)[7][2] = f->tile_thread.lowest_pixel_mem;
2830*c0909341SAndroid Build Coastguard Worker for (int tile_row = 0, tile_row_base = 0; tile_row < f->frame_hdr->tiling.rows;
2831*c0909341SAndroid Build Coastguard Worker tile_row++, tile_row_base += f->frame_hdr->tiling.cols)
2832*c0909341SAndroid Build Coastguard Worker {
2833*c0909341SAndroid Build Coastguard Worker const int tile_row_sb_h = f->frame_hdr->tiling.row_start_sb[tile_row + 1] -
2834*c0909341SAndroid Build Coastguard Worker f->frame_hdr->tiling.row_start_sb[tile_row];
2835*c0909341SAndroid Build Coastguard Worker for (int tile_col = 0; tile_col < f->frame_hdr->tiling.cols; tile_col++) {
2836*c0909341SAndroid Build Coastguard Worker f->ts[tile_row_base + tile_col].lowest_pixel = lowest_pixel_ptr;
2837*c0909341SAndroid Build Coastguard Worker lowest_pixel_ptr += tile_row_sb_h;
2838*c0909341SAndroid Build Coastguard Worker }
2839*c0909341SAndroid Build Coastguard Worker }
2840*c0909341SAndroid Build Coastguard Worker
2841*c0909341SAndroid Build Coastguard Worker const int cbi_sz = num_sb128 * size_mul[0];
2842*c0909341SAndroid Build Coastguard Worker if (cbi_sz != f->frame_thread.cbi_sz) {
2843*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->frame_thread.cbi);
2844*c0909341SAndroid Build Coastguard Worker f->frame_thread.cbi =
2845*c0909341SAndroid Build Coastguard Worker dav1d_alloc_aligned(ALLOC_BLOCK, sizeof(*f->frame_thread.cbi) *
2846*c0909341SAndroid Build Coastguard Worker cbi_sz * 32 * 32 / 4, 64);
2847*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.cbi) {
2848*c0909341SAndroid Build Coastguard Worker f->frame_thread.cbi_sz = 0;
2849*c0909341SAndroid Build Coastguard Worker goto error;
2850*c0909341SAndroid Build Coastguard Worker }
2851*c0909341SAndroid Build Coastguard Worker f->frame_thread.cbi_sz = cbi_sz;
2852*c0909341SAndroid Build Coastguard Worker }
2853*c0909341SAndroid Build Coastguard Worker
2854*c0909341SAndroid Build Coastguard Worker const int cf_sz = (num_sb128 * size_mul[0]) << hbd;
2855*c0909341SAndroid Build Coastguard Worker if (cf_sz != f->frame_thread.cf_sz) {
2856*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->frame_thread.cf);
2857*c0909341SAndroid Build Coastguard Worker f->frame_thread.cf =
2858*c0909341SAndroid Build Coastguard Worker dav1d_alloc_aligned(ALLOC_COEF, (size_t)cf_sz * 128 * 128 / 2, 64);
2859*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.cf) {
2860*c0909341SAndroid Build Coastguard Worker f->frame_thread.cf_sz = 0;
2861*c0909341SAndroid Build Coastguard Worker goto error;
2862*c0909341SAndroid Build Coastguard Worker }
2863*c0909341SAndroid Build Coastguard Worker memset(f->frame_thread.cf, 0, (size_t)cf_sz * 128 * 128 / 2);
2864*c0909341SAndroid Build Coastguard Worker f->frame_thread.cf_sz = cf_sz;
2865*c0909341SAndroid Build Coastguard Worker }
2866*c0909341SAndroid Build Coastguard Worker
2867*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->allow_screen_content_tools) {
2868*c0909341SAndroid Build Coastguard Worker const int pal_sz = num_sb128 << hbd;
2869*c0909341SAndroid Build Coastguard Worker if (pal_sz != f->frame_thread.pal_sz) {
2870*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->frame_thread.pal);
2871*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal =
2872*c0909341SAndroid Build Coastguard Worker dav1d_alloc_aligned(ALLOC_PAL, sizeof(*f->frame_thread.pal) *
2873*c0909341SAndroid Build Coastguard Worker pal_sz * 16 * 16, 64);
2874*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.pal) {
2875*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_sz = 0;
2876*c0909341SAndroid Build Coastguard Worker goto error;
2877*c0909341SAndroid Build Coastguard Worker }
2878*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_sz = pal_sz;
2879*c0909341SAndroid Build Coastguard Worker }
2880*c0909341SAndroid Build Coastguard Worker
2881*c0909341SAndroid Build Coastguard Worker const int pal_idx_sz = num_sb128 * size_mul[1];
2882*c0909341SAndroid Build Coastguard Worker if (pal_idx_sz != f->frame_thread.pal_idx_sz) {
2883*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->frame_thread.pal_idx);
2884*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_idx =
2885*c0909341SAndroid Build Coastguard Worker dav1d_alloc_aligned(ALLOC_PAL, sizeof(*f->frame_thread.pal_idx) *
2886*c0909341SAndroid Build Coastguard Worker pal_idx_sz * 128 * 128 / 8, 64);
2887*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.pal_idx) {
2888*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_idx_sz = 0;
2889*c0909341SAndroid Build Coastguard Worker goto error;
2890*c0909341SAndroid Build Coastguard Worker }
2891*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_idx_sz = pal_idx_sz;
2892*c0909341SAndroid Build Coastguard Worker }
2893*c0909341SAndroid Build Coastguard Worker } else if (f->frame_thread.pal) {
2894*c0909341SAndroid Build Coastguard Worker dav1d_freep_aligned(&f->frame_thread.pal);
2895*c0909341SAndroid Build Coastguard Worker dav1d_freep_aligned(&f->frame_thread.pal_idx);
2896*c0909341SAndroid Build Coastguard Worker f->frame_thread.pal_sz = f->frame_thread.pal_idx_sz = 0;
2897*c0909341SAndroid Build Coastguard Worker }
2898*c0909341SAndroid Build Coastguard Worker }
2899*c0909341SAndroid Build Coastguard Worker
2900*c0909341SAndroid Build Coastguard Worker // update allocation of block contexts for above
2901*c0909341SAndroid Build Coastguard Worker ptrdiff_t y_stride = f->cur.stride[0], uv_stride = f->cur.stride[1];
2902*c0909341SAndroid Build Coastguard Worker const int has_resize = f->frame_hdr->width[0] != f->frame_hdr->width[1];
2903*c0909341SAndroid Build Coastguard Worker const int need_cdef_lpf_copy = c->n_tc > 1 && has_resize;
2904*c0909341SAndroid Build Coastguard Worker if (y_stride * f->sbh * 4 != f->lf.cdef_buf_plane_sz[0] ||
2905*c0909341SAndroid Build Coastguard Worker uv_stride * f->sbh * 8 != f->lf.cdef_buf_plane_sz[1] ||
2906*c0909341SAndroid Build Coastguard Worker need_cdef_lpf_copy != f->lf.need_cdef_lpf_copy ||
2907*c0909341SAndroid Build Coastguard Worker f->sbh != f->lf.cdef_buf_sbh)
2908*c0909341SAndroid Build Coastguard Worker {
2909*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->lf.cdef_line_buf);
2910*c0909341SAndroid Build Coastguard Worker size_t alloc_sz = 64;
2911*c0909341SAndroid Build Coastguard Worker alloc_sz += (size_t)llabs(y_stride) * 4 * f->sbh << need_cdef_lpf_copy;
2912*c0909341SAndroid Build Coastguard Worker alloc_sz += (size_t)llabs(uv_stride) * 8 * f->sbh << need_cdef_lpf_copy;
2913*c0909341SAndroid Build Coastguard Worker uint8_t *ptr = f->lf.cdef_line_buf = dav1d_alloc_aligned(ALLOC_CDEF, alloc_sz, 32);
2914*c0909341SAndroid Build Coastguard Worker if (!ptr) {
2915*c0909341SAndroid Build Coastguard Worker f->lf.cdef_buf_plane_sz[0] = f->lf.cdef_buf_plane_sz[1] = 0;
2916*c0909341SAndroid Build Coastguard Worker goto error;
2917*c0909341SAndroid Build Coastguard Worker }
2918*c0909341SAndroid Build Coastguard Worker
2919*c0909341SAndroid Build Coastguard Worker ptr += 32;
2920*c0909341SAndroid Build Coastguard Worker if (y_stride < 0) {
2921*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][0] = ptr - y_stride * (f->sbh * 4 - 1);
2922*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][0] = ptr - y_stride * (f->sbh * 4 - 3);
2923*c0909341SAndroid Build Coastguard Worker } else {
2924*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][0] = ptr + y_stride * 0;
2925*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][0] = ptr + y_stride * 2;
2926*c0909341SAndroid Build Coastguard Worker }
2927*c0909341SAndroid Build Coastguard Worker ptr += llabs(y_stride) * f->sbh * 4;
2928*c0909341SAndroid Build Coastguard Worker if (uv_stride < 0) {
2929*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][1] = ptr - uv_stride * (f->sbh * 8 - 1);
2930*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][2] = ptr - uv_stride * (f->sbh * 8 - 3);
2931*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][1] = ptr - uv_stride * (f->sbh * 8 - 5);
2932*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][2] = ptr - uv_stride * (f->sbh * 8 - 7);
2933*c0909341SAndroid Build Coastguard Worker } else {
2934*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][1] = ptr + uv_stride * 0;
2935*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[0][2] = ptr + uv_stride * 2;
2936*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][1] = ptr + uv_stride * 4;
2937*c0909341SAndroid Build Coastguard Worker f->lf.cdef_line[1][2] = ptr + uv_stride * 6;
2938*c0909341SAndroid Build Coastguard Worker }
2939*c0909341SAndroid Build Coastguard Worker
2940*c0909341SAndroid Build Coastguard Worker if (need_cdef_lpf_copy) {
2941*c0909341SAndroid Build Coastguard Worker ptr += llabs(uv_stride) * f->sbh * 8;
2942*c0909341SAndroid Build Coastguard Worker if (y_stride < 0)
2943*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[0] = ptr - y_stride * (f->sbh * 4 - 1);
2944*c0909341SAndroid Build Coastguard Worker else
2945*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[0] = ptr;
2946*c0909341SAndroid Build Coastguard Worker ptr += llabs(y_stride) * f->sbh * 4;
2947*c0909341SAndroid Build Coastguard Worker if (uv_stride < 0) {
2948*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[1] = ptr - uv_stride * (f->sbh * 4 - 1);
2949*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[2] = ptr - uv_stride * (f->sbh * 8 - 1);
2950*c0909341SAndroid Build Coastguard Worker } else {
2951*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[1] = ptr;
2952*c0909341SAndroid Build Coastguard Worker f->lf.cdef_lpf_line[2] = ptr + uv_stride * f->sbh * 4;
2953*c0909341SAndroid Build Coastguard Worker }
2954*c0909341SAndroid Build Coastguard Worker }
2955*c0909341SAndroid Build Coastguard Worker
2956*c0909341SAndroid Build Coastguard Worker f->lf.cdef_buf_plane_sz[0] = (int) y_stride * f->sbh * 4;
2957*c0909341SAndroid Build Coastguard Worker f->lf.cdef_buf_plane_sz[1] = (int) uv_stride * f->sbh * 8;
2958*c0909341SAndroid Build Coastguard Worker f->lf.need_cdef_lpf_copy = need_cdef_lpf_copy;
2959*c0909341SAndroid Build Coastguard Worker f->lf.cdef_buf_sbh = f->sbh;
2960*c0909341SAndroid Build Coastguard Worker }
2961*c0909341SAndroid Build Coastguard Worker
2962*c0909341SAndroid Build Coastguard Worker const int sb128 = f->seq_hdr->sb128;
2963*c0909341SAndroid Build Coastguard Worker const int num_lines = c->n_tc > 1 ? f->sbh * 4 << sb128 : 12;
2964*c0909341SAndroid Build Coastguard Worker y_stride = f->sr_cur.p.stride[0], uv_stride = f->sr_cur.p.stride[1];
2965*c0909341SAndroid Build Coastguard Worker if (y_stride * num_lines != f->lf.lr_buf_plane_sz[0] ||
2966*c0909341SAndroid Build Coastguard Worker uv_stride * num_lines * 2 != f->lf.lr_buf_plane_sz[1])
2967*c0909341SAndroid Build Coastguard Worker {
2968*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->lf.lr_line_buf);
2969*c0909341SAndroid Build Coastguard Worker // lr simd may overread the input, so slightly over-allocate the lpf buffer
2970*c0909341SAndroid Build Coastguard Worker size_t alloc_sz = 128;
2971*c0909341SAndroid Build Coastguard Worker alloc_sz += (size_t)llabs(y_stride) * num_lines;
2972*c0909341SAndroid Build Coastguard Worker alloc_sz += (size_t)llabs(uv_stride) * num_lines * 2;
2973*c0909341SAndroid Build Coastguard Worker uint8_t *ptr = f->lf.lr_line_buf = dav1d_alloc_aligned(ALLOC_LR, alloc_sz, 64);
2974*c0909341SAndroid Build Coastguard Worker if (!ptr) {
2975*c0909341SAndroid Build Coastguard Worker f->lf.lr_buf_plane_sz[0] = f->lf.lr_buf_plane_sz[1] = 0;
2976*c0909341SAndroid Build Coastguard Worker goto error;
2977*c0909341SAndroid Build Coastguard Worker }
2978*c0909341SAndroid Build Coastguard Worker
2979*c0909341SAndroid Build Coastguard Worker ptr += 64;
2980*c0909341SAndroid Build Coastguard Worker if (y_stride < 0)
2981*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[0] = ptr - y_stride * (num_lines - 1);
2982*c0909341SAndroid Build Coastguard Worker else
2983*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[0] = ptr;
2984*c0909341SAndroid Build Coastguard Worker ptr += llabs(y_stride) * num_lines;
2985*c0909341SAndroid Build Coastguard Worker if (uv_stride < 0) {
2986*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[1] = ptr - uv_stride * (num_lines * 1 - 1);
2987*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[2] = ptr - uv_stride * (num_lines * 2 - 1);
2988*c0909341SAndroid Build Coastguard Worker } else {
2989*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[1] = ptr;
2990*c0909341SAndroid Build Coastguard Worker f->lf.lr_lpf_line[2] = ptr + uv_stride * num_lines;
2991*c0909341SAndroid Build Coastguard Worker }
2992*c0909341SAndroid Build Coastguard Worker
2993*c0909341SAndroid Build Coastguard Worker f->lf.lr_buf_plane_sz[0] = (int) y_stride * num_lines;
2994*c0909341SAndroid Build Coastguard Worker f->lf.lr_buf_plane_sz[1] = (int) uv_stride * num_lines * 2;
2995*c0909341SAndroid Build Coastguard Worker }
2996*c0909341SAndroid Build Coastguard Worker
2997*c0909341SAndroid Build Coastguard Worker // update allocation for loopfilter masks
2998*c0909341SAndroid Build Coastguard Worker if (num_sb128 != f->lf.mask_sz) {
2999*c0909341SAndroid Build Coastguard Worker dav1d_free(f->lf.mask);
3000*c0909341SAndroid Build Coastguard Worker dav1d_free(f->lf.level);
3001*c0909341SAndroid Build Coastguard Worker f->lf.mask = dav1d_malloc(ALLOC_LF, sizeof(*f->lf.mask) * num_sb128);
3002*c0909341SAndroid Build Coastguard Worker // over-allocate by 3 bytes since some of the SIMD implementations
3003*c0909341SAndroid Build Coastguard Worker // index this from the level type and can thus over-read by up to 3
3004*c0909341SAndroid Build Coastguard Worker f->lf.level = dav1d_malloc(ALLOC_LF, sizeof(*f->lf.level) * num_sb128 * 32 * 32 + 3);
3005*c0909341SAndroid Build Coastguard Worker if (!f->lf.mask || !f->lf.level) {
3006*c0909341SAndroid Build Coastguard Worker f->lf.mask_sz = 0;
3007*c0909341SAndroid Build Coastguard Worker goto error;
3008*c0909341SAndroid Build Coastguard Worker }
3009*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1) {
3010*c0909341SAndroid Build Coastguard Worker dav1d_free(f->frame_thread.b);
3011*c0909341SAndroid Build Coastguard Worker f->frame_thread.b = dav1d_malloc(ALLOC_BLOCK, sizeof(*f->frame_thread.b) *
3012*c0909341SAndroid Build Coastguard Worker num_sb128 * 32 * 32);
3013*c0909341SAndroid Build Coastguard Worker if (!f->frame_thread.b) {
3014*c0909341SAndroid Build Coastguard Worker f->lf.mask_sz = 0;
3015*c0909341SAndroid Build Coastguard Worker goto error;
3016*c0909341SAndroid Build Coastguard Worker }
3017*c0909341SAndroid Build Coastguard Worker }
3018*c0909341SAndroid Build Coastguard Worker f->lf.mask_sz = num_sb128;
3019*c0909341SAndroid Build Coastguard Worker }
3020*c0909341SAndroid Build Coastguard Worker
3021*c0909341SAndroid Build Coastguard Worker f->sr_sb128w = (f->sr_cur.p.p.w + 127) >> 7;
3022*c0909341SAndroid Build Coastguard Worker const int lr_mask_sz = f->sr_sb128w * f->sb128h;
3023*c0909341SAndroid Build Coastguard Worker if (lr_mask_sz != f->lf.lr_mask_sz) {
3024*c0909341SAndroid Build Coastguard Worker dav1d_free(f->lf.lr_mask);
3025*c0909341SAndroid Build Coastguard Worker f->lf.lr_mask = dav1d_malloc(ALLOC_LR, sizeof(*f->lf.lr_mask) * lr_mask_sz);
3026*c0909341SAndroid Build Coastguard Worker if (!f->lf.lr_mask) {
3027*c0909341SAndroid Build Coastguard Worker f->lf.lr_mask_sz = 0;
3028*c0909341SAndroid Build Coastguard Worker goto error;
3029*c0909341SAndroid Build Coastguard Worker }
3030*c0909341SAndroid Build Coastguard Worker f->lf.lr_mask_sz = lr_mask_sz;
3031*c0909341SAndroid Build Coastguard Worker }
3032*c0909341SAndroid Build Coastguard Worker f->lf.restore_planes =
3033*c0909341SAndroid Build Coastguard Worker ((f->frame_hdr->restoration.type[0] != DAV1D_RESTORATION_NONE) << 0) +
3034*c0909341SAndroid Build Coastguard Worker ((f->frame_hdr->restoration.type[1] != DAV1D_RESTORATION_NONE) << 1) +
3035*c0909341SAndroid Build Coastguard Worker ((f->frame_hdr->restoration.type[2] != DAV1D_RESTORATION_NONE) << 2);
3036*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->loopfilter.sharpness != f->lf.last_sharpness) {
3037*c0909341SAndroid Build Coastguard Worker dav1d_calc_eih(&f->lf.lim_lut, f->frame_hdr->loopfilter.sharpness);
3038*c0909341SAndroid Build Coastguard Worker f->lf.last_sharpness = f->frame_hdr->loopfilter.sharpness;
3039*c0909341SAndroid Build Coastguard Worker }
3040*c0909341SAndroid Build Coastguard Worker dav1d_calc_lf_values(f->lf.lvl, f->frame_hdr, (int8_t[4]) { 0, 0, 0, 0 });
3041*c0909341SAndroid Build Coastguard Worker memset(f->lf.mask, 0, sizeof(*f->lf.mask) * num_sb128);
3042*c0909341SAndroid Build Coastguard Worker
3043*c0909341SAndroid Build Coastguard Worker const int ipred_edge_sz = f->sbh * f->sb128w << hbd;
3044*c0909341SAndroid Build Coastguard Worker if (ipred_edge_sz != f->ipred_edge_sz) {
3045*c0909341SAndroid Build Coastguard Worker dav1d_free_aligned(f->ipred_edge[0]);
3046*c0909341SAndroid Build Coastguard Worker uint8_t *ptr = f->ipred_edge[0] =
3047*c0909341SAndroid Build Coastguard Worker dav1d_alloc_aligned(ALLOC_IPRED, ipred_edge_sz * 128 * 3, 64);
3048*c0909341SAndroid Build Coastguard Worker if (!ptr) {
3049*c0909341SAndroid Build Coastguard Worker f->ipred_edge_sz = 0;
3050*c0909341SAndroid Build Coastguard Worker goto error;
3051*c0909341SAndroid Build Coastguard Worker }
3052*c0909341SAndroid Build Coastguard Worker f->ipred_edge[1] = ptr + ipred_edge_sz * 128 * 1;
3053*c0909341SAndroid Build Coastguard Worker f->ipred_edge[2] = ptr + ipred_edge_sz * 128 * 2;
3054*c0909341SAndroid Build Coastguard Worker f->ipred_edge_sz = ipred_edge_sz;
3055*c0909341SAndroid Build Coastguard Worker }
3056*c0909341SAndroid Build Coastguard Worker
3057*c0909341SAndroid Build Coastguard Worker const int re_sz = f->sb128h * f->frame_hdr->tiling.cols;
3058*c0909341SAndroid Build Coastguard Worker if (re_sz != f->lf.re_sz) {
3059*c0909341SAndroid Build Coastguard Worker dav1d_free(f->lf.tx_lpf_right_edge[0]);
3060*c0909341SAndroid Build Coastguard Worker f->lf.tx_lpf_right_edge[0] = dav1d_malloc(ALLOC_LF, re_sz * 32 * 2);
3061*c0909341SAndroid Build Coastguard Worker if (!f->lf.tx_lpf_right_edge[0]) {
3062*c0909341SAndroid Build Coastguard Worker f->lf.re_sz = 0;
3063*c0909341SAndroid Build Coastguard Worker goto error;
3064*c0909341SAndroid Build Coastguard Worker }
3065*c0909341SAndroid Build Coastguard Worker f->lf.tx_lpf_right_edge[1] = f->lf.tx_lpf_right_edge[0] + re_sz * 32;
3066*c0909341SAndroid Build Coastguard Worker f->lf.re_sz = re_sz;
3067*c0909341SAndroid Build Coastguard Worker }
3068*c0909341SAndroid Build Coastguard Worker
3069*c0909341SAndroid Build Coastguard Worker // init ref mvs
3070*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) || f->frame_hdr->allow_intrabc) {
3071*c0909341SAndroid Build Coastguard Worker const int ret =
3072*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_init_frame(&f->rf, f->seq_hdr, f->frame_hdr,
3073*c0909341SAndroid Build Coastguard Worker f->refpoc, f->mvs, f->refrefpoc, f->ref_mvs,
3074*c0909341SAndroid Build Coastguard Worker f->c->n_tc, f->c->n_fc);
3075*c0909341SAndroid Build Coastguard Worker if (ret < 0) goto error;
3076*c0909341SAndroid Build Coastguard Worker }
3077*c0909341SAndroid Build Coastguard Worker
3078*c0909341SAndroid Build Coastguard Worker // setup dequant tables
3079*c0909341SAndroid Build Coastguard Worker init_quant_tables(f->seq_hdr, f->frame_hdr, f->frame_hdr->quant.yac, f->dq);
3080*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->quant.qm)
3081*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < N_RECT_TX_SIZES; i++) {
3082*c0909341SAndroid Build Coastguard Worker f->qm[i][0] = dav1d_qm_tbl[f->frame_hdr->quant.qm_y][0][i];
3083*c0909341SAndroid Build Coastguard Worker f->qm[i][1] = dav1d_qm_tbl[f->frame_hdr->quant.qm_u][1][i];
3084*c0909341SAndroid Build Coastguard Worker f->qm[i][2] = dav1d_qm_tbl[f->frame_hdr->quant.qm_v][1][i];
3085*c0909341SAndroid Build Coastguard Worker }
3086*c0909341SAndroid Build Coastguard Worker else
3087*c0909341SAndroid Build Coastguard Worker memset(f->qm, 0, sizeof(f->qm));
3088*c0909341SAndroid Build Coastguard Worker
3089*c0909341SAndroid Build Coastguard Worker // setup jnt_comp weights
3090*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->switchable_comp_refs) {
3091*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++) {
3092*c0909341SAndroid Build Coastguard Worker const unsigned ref0poc = f->refp[i].p.frame_hdr->frame_offset;
3093*c0909341SAndroid Build Coastguard Worker
3094*c0909341SAndroid Build Coastguard Worker for (int j = i + 1; j < 7; j++) {
3095*c0909341SAndroid Build Coastguard Worker const unsigned ref1poc = f->refp[j].p.frame_hdr->frame_offset;
3096*c0909341SAndroid Build Coastguard Worker
3097*c0909341SAndroid Build Coastguard Worker const unsigned d1 =
3098*c0909341SAndroid Build Coastguard Worker imin(abs(get_poc_diff(f->seq_hdr->order_hint_n_bits, ref0poc,
3099*c0909341SAndroid Build Coastguard Worker f->cur.frame_hdr->frame_offset)), 31);
3100*c0909341SAndroid Build Coastguard Worker const unsigned d0 =
3101*c0909341SAndroid Build Coastguard Worker imin(abs(get_poc_diff(f->seq_hdr->order_hint_n_bits, ref1poc,
3102*c0909341SAndroid Build Coastguard Worker f->cur.frame_hdr->frame_offset)), 31);
3103*c0909341SAndroid Build Coastguard Worker const int order = d0 <= d1;
3104*c0909341SAndroid Build Coastguard Worker
3105*c0909341SAndroid Build Coastguard Worker static const uint8_t quant_dist_weight[3][2] = {
3106*c0909341SAndroid Build Coastguard Worker { 2, 3 }, { 2, 5 }, { 2, 7 }
3107*c0909341SAndroid Build Coastguard Worker };
3108*c0909341SAndroid Build Coastguard Worker static const uint8_t quant_dist_lookup_table[4][2] = {
3109*c0909341SAndroid Build Coastguard Worker { 9, 7 }, { 11, 5 }, { 12, 4 }, { 13, 3 }
3110*c0909341SAndroid Build Coastguard Worker };
3111*c0909341SAndroid Build Coastguard Worker
3112*c0909341SAndroid Build Coastguard Worker int k;
3113*c0909341SAndroid Build Coastguard Worker for (k = 0; k < 3; k++) {
3114*c0909341SAndroid Build Coastguard Worker const int c0 = quant_dist_weight[k][order];
3115*c0909341SAndroid Build Coastguard Worker const int c1 = quant_dist_weight[k][!order];
3116*c0909341SAndroid Build Coastguard Worker const int d0_c0 = d0 * c0;
3117*c0909341SAndroid Build Coastguard Worker const int d1_c1 = d1 * c1;
3118*c0909341SAndroid Build Coastguard Worker if ((d0 > d1 && d0_c0 < d1_c1) || (d0 <= d1 && d0_c0 > d1_c1)) break;
3119*c0909341SAndroid Build Coastguard Worker }
3120*c0909341SAndroid Build Coastguard Worker
3121*c0909341SAndroid Build Coastguard Worker f->jnt_weights[i][j] = quant_dist_lookup_table[k][order];
3122*c0909341SAndroid Build Coastguard Worker }
3123*c0909341SAndroid Build Coastguard Worker }
3124*c0909341SAndroid Build Coastguard Worker }
3125*c0909341SAndroid Build Coastguard Worker
3126*c0909341SAndroid Build Coastguard Worker /* Init loopfilter pointers. Increasing NULL pointers is technically UB,
3127*c0909341SAndroid Build Coastguard Worker * so just point the chroma pointers in 4:0:0 to the luma plane here to
3128*c0909341SAndroid Build Coastguard Worker * avoid having additional in-loop branches in various places. We never
3129*c0909341SAndroid Build Coastguard Worker * dereference those pointers so it doesn't really matter what they
3130*c0909341SAndroid Build Coastguard Worker * point at, as long as the pointers are valid. */
3131*c0909341SAndroid Build Coastguard Worker const int has_chroma = f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I400;
3132*c0909341SAndroid Build Coastguard Worker f->lf.p[0] = f->cur.data[0];
3133*c0909341SAndroid Build Coastguard Worker f->lf.p[1] = f->cur.data[has_chroma ? 1 : 0];
3134*c0909341SAndroid Build Coastguard Worker f->lf.p[2] = f->cur.data[has_chroma ? 2 : 0];
3135*c0909341SAndroid Build Coastguard Worker f->lf.sr_p[0] = f->sr_cur.p.data[0];
3136*c0909341SAndroid Build Coastguard Worker f->lf.sr_p[1] = f->sr_cur.p.data[has_chroma ? 1 : 0];
3137*c0909341SAndroid Build Coastguard Worker f->lf.sr_p[2] = f->sr_cur.p.data[has_chroma ? 2 : 0];
3138*c0909341SAndroid Build Coastguard Worker
3139*c0909341SAndroid Build Coastguard Worker retval = 0;
3140*c0909341SAndroid Build Coastguard Worker error:
3141*c0909341SAndroid Build Coastguard Worker return retval;
3142*c0909341SAndroid Build Coastguard Worker }
3143*c0909341SAndroid Build Coastguard Worker
dav1d_decode_frame_init_cdf(Dav1dFrameContext * const f)3144*c0909341SAndroid Build Coastguard Worker int dav1d_decode_frame_init_cdf(Dav1dFrameContext *const f) {
3145*c0909341SAndroid Build Coastguard Worker const Dav1dContext *const c = f->c;
3146*c0909341SAndroid Build Coastguard Worker int retval = DAV1D_ERR(EINVAL);
3147*c0909341SAndroid Build Coastguard Worker
3148*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->refresh_context)
3149*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_copy(f->out_cdf.data.cdf, &f->in_cdf);
3150*c0909341SAndroid Build Coastguard Worker
3151*c0909341SAndroid Build Coastguard Worker // parse individual tiles per tile group
3152*c0909341SAndroid Build Coastguard Worker int tile_row = 0, tile_col = 0;
3153*c0909341SAndroid Build Coastguard Worker f->task_thread.update_set = 0;
3154*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < f->n_tile_data; i++) {
3155*c0909341SAndroid Build Coastguard Worker const uint8_t *data = f->tile[i].data.data;
3156*c0909341SAndroid Build Coastguard Worker size_t size = f->tile[i].data.sz;
3157*c0909341SAndroid Build Coastguard Worker
3158*c0909341SAndroid Build Coastguard Worker for (int j = f->tile[i].start; j <= f->tile[i].end; j++) {
3159*c0909341SAndroid Build Coastguard Worker size_t tile_sz;
3160*c0909341SAndroid Build Coastguard Worker if (j == f->tile[i].end) {
3161*c0909341SAndroid Build Coastguard Worker tile_sz = size;
3162*c0909341SAndroid Build Coastguard Worker } else {
3163*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->tiling.n_bytes > size) goto error;
3164*c0909341SAndroid Build Coastguard Worker tile_sz = 0;
3165*c0909341SAndroid Build Coastguard Worker for (unsigned k = 0; k < f->frame_hdr->tiling.n_bytes; k++)
3166*c0909341SAndroid Build Coastguard Worker tile_sz |= (unsigned)*data++ << (k * 8);
3167*c0909341SAndroid Build Coastguard Worker tile_sz++;
3168*c0909341SAndroid Build Coastguard Worker size -= f->frame_hdr->tiling.n_bytes;
3169*c0909341SAndroid Build Coastguard Worker if (tile_sz > size) goto error;
3170*c0909341SAndroid Build Coastguard Worker }
3171*c0909341SAndroid Build Coastguard Worker
3172*c0909341SAndroid Build Coastguard Worker setup_tile(&f->ts[j], f, data, tile_sz, tile_row, tile_col++,
3173*c0909341SAndroid Build Coastguard Worker c->n_fc > 1 ? f->frame_thread.tile_start_off[j] : 0);
3174*c0909341SAndroid Build Coastguard Worker
3175*c0909341SAndroid Build Coastguard Worker if (tile_col == f->frame_hdr->tiling.cols) {
3176*c0909341SAndroid Build Coastguard Worker tile_col = 0;
3177*c0909341SAndroid Build Coastguard Worker tile_row++;
3178*c0909341SAndroid Build Coastguard Worker }
3179*c0909341SAndroid Build Coastguard Worker if (j == f->frame_hdr->tiling.update && f->frame_hdr->refresh_context)
3180*c0909341SAndroid Build Coastguard Worker f->task_thread.update_set = 1;
3181*c0909341SAndroid Build Coastguard Worker data += tile_sz;
3182*c0909341SAndroid Build Coastguard Worker size -= tile_sz;
3183*c0909341SAndroid Build Coastguard Worker }
3184*c0909341SAndroid Build Coastguard Worker }
3185*c0909341SAndroid Build Coastguard Worker
3186*c0909341SAndroid Build Coastguard Worker if (c->n_tc > 1) {
3187*c0909341SAndroid Build Coastguard Worker const int uses_2pass = c->n_fc > 1;
3188*c0909341SAndroid Build Coastguard Worker for (int n = 0; n < f->sb128w * f->frame_hdr->tiling.rows * (1 + uses_2pass); n++)
3189*c0909341SAndroid Build Coastguard Worker reset_context(&f->a[n], IS_KEY_OR_INTRA(f->frame_hdr),
3190*c0909341SAndroid Build Coastguard Worker uses_2pass ? 1 + (n >= f->sb128w * f->frame_hdr->tiling.rows) : 0);
3191*c0909341SAndroid Build Coastguard Worker }
3192*c0909341SAndroid Build Coastguard Worker
3193*c0909341SAndroid Build Coastguard Worker retval = 0;
3194*c0909341SAndroid Build Coastguard Worker error:
3195*c0909341SAndroid Build Coastguard Worker return retval;
3196*c0909341SAndroid Build Coastguard Worker }
3197*c0909341SAndroid Build Coastguard Worker
dav1d_decode_frame_main(Dav1dFrameContext * const f)3198*c0909341SAndroid Build Coastguard Worker int dav1d_decode_frame_main(Dav1dFrameContext *const f) {
3199*c0909341SAndroid Build Coastguard Worker const Dav1dContext *const c = f->c;
3200*c0909341SAndroid Build Coastguard Worker int retval = DAV1D_ERR(EINVAL);
3201*c0909341SAndroid Build Coastguard Worker
3202*c0909341SAndroid Build Coastguard Worker assert(f->c->n_tc == 1);
3203*c0909341SAndroid Build Coastguard Worker
3204*c0909341SAndroid Build Coastguard Worker Dav1dTaskContext *const t = &c->tc[f - c->fc];
3205*c0909341SAndroid Build Coastguard Worker t->f = f;
3206*c0909341SAndroid Build Coastguard Worker t->frame_thread.pass = 0;
3207*c0909341SAndroid Build Coastguard Worker
3208*c0909341SAndroid Build Coastguard Worker for (int n = 0; n < f->sb128w * f->frame_hdr->tiling.rows; n++)
3209*c0909341SAndroid Build Coastguard Worker reset_context(&f->a[n], IS_KEY_OR_INTRA(f->frame_hdr), 0);
3210*c0909341SAndroid Build Coastguard Worker
3211*c0909341SAndroid Build Coastguard Worker // no threading - we explicitly interleave tile/sbrow decoding
3212*c0909341SAndroid Build Coastguard Worker // and post-filtering, so that the full process runs in-line
3213*c0909341SAndroid Build Coastguard Worker for (int tile_row = 0; tile_row < f->frame_hdr->tiling.rows; tile_row++) {
3214*c0909341SAndroid Build Coastguard Worker const int sbh_end =
3215*c0909341SAndroid Build Coastguard Worker imin(f->frame_hdr->tiling.row_start_sb[tile_row + 1], f->sbh);
3216*c0909341SAndroid Build Coastguard Worker for (int sby = f->frame_hdr->tiling.row_start_sb[tile_row];
3217*c0909341SAndroid Build Coastguard Worker sby < sbh_end; sby++)
3218*c0909341SAndroid Build Coastguard Worker {
3219*c0909341SAndroid Build Coastguard Worker t->by = sby << (4 + f->seq_hdr->sb128);
3220*c0909341SAndroid Build Coastguard Worker const int by_end = (t->by + f->sb_step) >> 1;
3221*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->use_ref_frame_mvs) {
3222*c0909341SAndroid Build Coastguard Worker f->c->refmvs_dsp.load_tmvs(&f->rf, tile_row,
3223*c0909341SAndroid Build Coastguard Worker 0, f->bw >> 1, t->by >> 1, by_end);
3224*c0909341SAndroid Build Coastguard Worker }
3225*c0909341SAndroid Build Coastguard Worker for (int tile_col = 0; tile_col < f->frame_hdr->tiling.cols; tile_col++) {
3226*c0909341SAndroid Build Coastguard Worker t->ts = &f->ts[tile_row * f->frame_hdr->tiling.cols + tile_col];
3227*c0909341SAndroid Build Coastguard Worker if (dav1d_decode_tile_sbrow(t)) goto error;
3228*c0909341SAndroid Build Coastguard Worker }
3229*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr)) {
3230*c0909341SAndroid Build Coastguard Worker dav1d_refmvs_save_tmvs(&f->c->refmvs_dsp, &t->rt,
3231*c0909341SAndroid Build Coastguard Worker 0, f->bw >> 1, t->by >> 1, by_end);
3232*c0909341SAndroid Build Coastguard Worker }
3233*c0909341SAndroid Build Coastguard Worker
3234*c0909341SAndroid Build Coastguard Worker // loopfilter + cdef + restoration
3235*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow(f, sby);
3236*c0909341SAndroid Build Coastguard Worker }
3237*c0909341SAndroid Build Coastguard Worker }
3238*c0909341SAndroid Build Coastguard Worker
3239*c0909341SAndroid Build Coastguard Worker retval = 0;
3240*c0909341SAndroid Build Coastguard Worker error:
3241*c0909341SAndroid Build Coastguard Worker return retval;
3242*c0909341SAndroid Build Coastguard Worker }
3243*c0909341SAndroid Build Coastguard Worker
dav1d_decode_frame_exit(Dav1dFrameContext * const f,int retval)3244*c0909341SAndroid Build Coastguard Worker void dav1d_decode_frame_exit(Dav1dFrameContext *const f, int retval) {
3245*c0909341SAndroid Build Coastguard Worker const Dav1dContext *const c = f->c;
3246*c0909341SAndroid Build Coastguard Worker
3247*c0909341SAndroid Build Coastguard Worker if (f->sr_cur.p.data[0])
3248*c0909341SAndroid Build Coastguard Worker atomic_init(&f->task_thread.error, 0);
3249*c0909341SAndroid Build Coastguard Worker
3250*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1 && retval && f->frame_thread.cf) {
3251*c0909341SAndroid Build Coastguard Worker memset(f->frame_thread.cf, 0,
3252*c0909341SAndroid Build Coastguard Worker (size_t)f->frame_thread.cf_sz * 128 * 128 / 2);
3253*c0909341SAndroid Build Coastguard Worker }
3254*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++) {
3255*c0909341SAndroid Build Coastguard Worker if (f->refp[i].p.frame_hdr) {
3256*c0909341SAndroid Build Coastguard Worker if (!retval && c->n_fc > 1 && c->strict_std_compliance &&
3257*c0909341SAndroid Build Coastguard Worker atomic_load(&f->refp[i].progress[1]) == FRAME_ERROR)
3258*c0909341SAndroid Build Coastguard Worker {
3259*c0909341SAndroid Build Coastguard Worker retval = DAV1D_ERR(EINVAL);
3260*c0909341SAndroid Build Coastguard Worker atomic_store(&f->task_thread.error, 1);
3261*c0909341SAndroid Build Coastguard Worker atomic_store(&f->sr_cur.progress[1], FRAME_ERROR);
3262*c0909341SAndroid Build Coastguard Worker }
3263*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&f->refp[i]);
3264*c0909341SAndroid Build Coastguard Worker }
3265*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->ref_mvs_ref[i]);
3266*c0909341SAndroid Build Coastguard Worker }
3267*c0909341SAndroid Build Coastguard Worker
3268*c0909341SAndroid Build Coastguard Worker dav1d_picture_unref_internal(&f->cur);
3269*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&f->sr_cur);
3270*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&f->in_cdf);
3271*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr && f->frame_hdr->refresh_context) {
3272*c0909341SAndroid Build Coastguard Worker if (f->out_cdf.progress)
3273*c0909341SAndroid Build Coastguard Worker atomic_store(f->out_cdf.progress, retval == 0 ? 1 : TILE_ERROR);
3274*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&f->out_cdf);
3275*c0909341SAndroid Build Coastguard Worker }
3276*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->cur_segmap_ref);
3277*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->prev_segmap_ref);
3278*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->mvs_ref);
3279*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->seq_hdr_ref);
3280*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->frame_hdr_ref);
3281*c0909341SAndroid Build Coastguard Worker
3282*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < f->n_tile_data; i++)
3283*c0909341SAndroid Build Coastguard Worker dav1d_data_unref_internal(&f->tile[i].data);
3284*c0909341SAndroid Build Coastguard Worker f->task_thread.retval = retval;
3285*c0909341SAndroid Build Coastguard Worker }
3286*c0909341SAndroid Build Coastguard Worker
dav1d_decode_frame(Dav1dFrameContext * const f)3287*c0909341SAndroid Build Coastguard Worker int dav1d_decode_frame(Dav1dFrameContext *const f) {
3288*c0909341SAndroid Build Coastguard Worker assert(f->c->n_fc == 1);
3289*c0909341SAndroid Build Coastguard Worker // if n_tc > 1 (but n_fc == 1), we could run init/exit in the task
3290*c0909341SAndroid Build Coastguard Worker // threads also. Not sure it makes a measurable difference.
3291*c0909341SAndroid Build Coastguard Worker int res = dav1d_decode_frame_init(f);
3292*c0909341SAndroid Build Coastguard Worker if (!res) res = dav1d_decode_frame_init_cdf(f);
3293*c0909341SAndroid Build Coastguard Worker // wait until all threads have completed
3294*c0909341SAndroid Build Coastguard Worker if (!res) {
3295*c0909341SAndroid Build Coastguard Worker if (f->c->n_tc > 1) {
3296*c0909341SAndroid Build Coastguard Worker res = dav1d_task_create_tile_sbrow(f, 0, 1);
3297*c0909341SAndroid Build Coastguard Worker pthread_mutex_lock(&f->task_thread.ttd->lock);
3298*c0909341SAndroid Build Coastguard Worker pthread_cond_signal(&f->task_thread.ttd->cond);
3299*c0909341SAndroid Build Coastguard Worker if (!res) {
3300*c0909341SAndroid Build Coastguard Worker while (!f->task_thread.done[0] ||
3301*c0909341SAndroid Build Coastguard Worker atomic_load(&f->task_thread.task_counter) > 0)
3302*c0909341SAndroid Build Coastguard Worker {
3303*c0909341SAndroid Build Coastguard Worker pthread_cond_wait(&f->task_thread.cond,
3304*c0909341SAndroid Build Coastguard Worker &f->task_thread.ttd->lock);
3305*c0909341SAndroid Build Coastguard Worker }
3306*c0909341SAndroid Build Coastguard Worker }
3307*c0909341SAndroid Build Coastguard Worker pthread_mutex_unlock(&f->task_thread.ttd->lock);
3308*c0909341SAndroid Build Coastguard Worker res = f->task_thread.retval;
3309*c0909341SAndroid Build Coastguard Worker } else {
3310*c0909341SAndroid Build Coastguard Worker res = dav1d_decode_frame_main(f);
3311*c0909341SAndroid Build Coastguard Worker if (!res && f->frame_hdr->refresh_context && f->task_thread.update_set) {
3312*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_update(f->frame_hdr, f->out_cdf.data.cdf,
3313*c0909341SAndroid Build Coastguard Worker &f->ts[f->frame_hdr->tiling.update].cdf);
3314*c0909341SAndroid Build Coastguard Worker }
3315*c0909341SAndroid Build Coastguard Worker }
3316*c0909341SAndroid Build Coastguard Worker }
3317*c0909341SAndroid Build Coastguard Worker dav1d_decode_frame_exit(f, res);
3318*c0909341SAndroid Build Coastguard Worker res = f->task_thread.retval;
3319*c0909341SAndroid Build Coastguard Worker f->n_tile_data = 0;
3320*c0909341SAndroid Build Coastguard Worker return res;
3321*c0909341SAndroid Build Coastguard Worker }
3322*c0909341SAndroid Build Coastguard Worker
get_upscale_x0(const int in_w,const int out_w,const int step)3323*c0909341SAndroid Build Coastguard Worker static int get_upscale_x0(const int in_w, const int out_w, const int step) {
3324*c0909341SAndroid Build Coastguard Worker const int err = out_w * step - (in_w << 14);
3325*c0909341SAndroid Build Coastguard Worker const int x0 = (-((out_w - in_w) << 13) + (out_w >> 1)) / out_w + 128 - (err / 2);
3326*c0909341SAndroid Build Coastguard Worker return x0 & 0x3fff;
3327*c0909341SAndroid Build Coastguard Worker }
3328*c0909341SAndroid Build Coastguard Worker
dav1d_submit_frame(Dav1dContext * const c)3329*c0909341SAndroid Build Coastguard Worker int dav1d_submit_frame(Dav1dContext *const c) {
3330*c0909341SAndroid Build Coastguard Worker Dav1dFrameContext *f;
3331*c0909341SAndroid Build Coastguard Worker int res = -1;
3332*c0909341SAndroid Build Coastguard Worker
3333*c0909341SAndroid Build Coastguard Worker // wait for c->out_delayed[next] and move into c->out if visible
3334*c0909341SAndroid Build Coastguard Worker Dav1dThreadPicture *out_delayed;
3335*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1) {
3336*c0909341SAndroid Build Coastguard Worker pthread_mutex_lock(&c->task_thread.lock);
3337*c0909341SAndroid Build Coastguard Worker const unsigned next = c->frame_thread.next++;
3338*c0909341SAndroid Build Coastguard Worker if (c->frame_thread.next == c->n_fc)
3339*c0909341SAndroid Build Coastguard Worker c->frame_thread.next = 0;
3340*c0909341SAndroid Build Coastguard Worker
3341*c0909341SAndroid Build Coastguard Worker f = &c->fc[next];
3342*c0909341SAndroid Build Coastguard Worker while (f->n_tile_data > 0)
3343*c0909341SAndroid Build Coastguard Worker pthread_cond_wait(&f->task_thread.cond,
3344*c0909341SAndroid Build Coastguard Worker &c->task_thread.lock);
3345*c0909341SAndroid Build Coastguard Worker out_delayed = &c->frame_thread.out_delayed[next];
3346*c0909341SAndroid Build Coastguard Worker if (out_delayed->p.data[0] || atomic_load(&f->task_thread.error)) {
3347*c0909341SAndroid Build Coastguard Worker unsigned first = atomic_load(&c->task_thread.first);
3348*c0909341SAndroid Build Coastguard Worker if (first + 1U < c->n_fc)
3349*c0909341SAndroid Build Coastguard Worker atomic_fetch_add(&c->task_thread.first, 1U);
3350*c0909341SAndroid Build Coastguard Worker else
3351*c0909341SAndroid Build Coastguard Worker atomic_store(&c->task_thread.first, 0);
3352*c0909341SAndroid Build Coastguard Worker atomic_compare_exchange_strong(&c->task_thread.reset_task_cur,
3353*c0909341SAndroid Build Coastguard Worker &first, UINT_MAX);
3354*c0909341SAndroid Build Coastguard Worker if (c->task_thread.cur && c->task_thread.cur < c->n_fc)
3355*c0909341SAndroid Build Coastguard Worker c->task_thread.cur--;
3356*c0909341SAndroid Build Coastguard Worker }
3357*c0909341SAndroid Build Coastguard Worker const int error = f->task_thread.retval;
3358*c0909341SAndroid Build Coastguard Worker if (error) {
3359*c0909341SAndroid Build Coastguard Worker f->task_thread.retval = 0;
3360*c0909341SAndroid Build Coastguard Worker c->cached_error = error;
3361*c0909341SAndroid Build Coastguard Worker dav1d_data_props_copy(&c->cached_error_props, &out_delayed->p.m);
3362*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(out_delayed);
3363*c0909341SAndroid Build Coastguard Worker } else if (out_delayed->p.data[0]) {
3364*c0909341SAndroid Build Coastguard Worker const unsigned progress = atomic_load_explicit(&out_delayed->progress[1],
3365*c0909341SAndroid Build Coastguard Worker memory_order_relaxed);
3366*c0909341SAndroid Build Coastguard Worker if ((out_delayed->visible || c->output_invisible_frames) &&
3367*c0909341SAndroid Build Coastguard Worker progress != FRAME_ERROR)
3368*c0909341SAndroid Build Coastguard Worker {
3369*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_ref(&c->out, out_delayed);
3370*c0909341SAndroid Build Coastguard Worker c->event_flags |= dav1d_picture_get_event_flags(out_delayed);
3371*c0909341SAndroid Build Coastguard Worker }
3372*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(out_delayed);
3373*c0909341SAndroid Build Coastguard Worker }
3374*c0909341SAndroid Build Coastguard Worker } else {
3375*c0909341SAndroid Build Coastguard Worker f = c->fc;
3376*c0909341SAndroid Build Coastguard Worker }
3377*c0909341SAndroid Build Coastguard Worker
3378*c0909341SAndroid Build Coastguard Worker f->seq_hdr = c->seq_hdr;
3379*c0909341SAndroid Build Coastguard Worker f->seq_hdr_ref = c->seq_hdr_ref;
3380*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->seq_hdr_ref);
3381*c0909341SAndroid Build Coastguard Worker f->frame_hdr = c->frame_hdr;
3382*c0909341SAndroid Build Coastguard Worker f->frame_hdr_ref = c->frame_hdr_ref;
3383*c0909341SAndroid Build Coastguard Worker c->frame_hdr = NULL;
3384*c0909341SAndroid Build Coastguard Worker c->frame_hdr_ref = NULL;
3385*c0909341SAndroid Build Coastguard Worker f->dsp = &c->dsp[f->seq_hdr->hbd];
3386*c0909341SAndroid Build Coastguard Worker
3387*c0909341SAndroid Build Coastguard Worker const int bpc = 8 + 2 * f->seq_hdr->hbd;
3388*c0909341SAndroid Build Coastguard Worker
3389*c0909341SAndroid Build Coastguard Worker if (!f->dsp->ipred.intra_pred[DC_PRED]) {
3390*c0909341SAndroid Build Coastguard Worker Dav1dDSPContext *const dsp = &c->dsp[f->seq_hdr->hbd];
3391*c0909341SAndroid Build Coastguard Worker
3392*c0909341SAndroid Build Coastguard Worker switch (bpc) {
3393*c0909341SAndroid Build Coastguard Worker #define assign_bitdepth_case(bd) \
3394*c0909341SAndroid Build Coastguard Worker dav1d_cdef_dsp_init_##bd##bpc(&dsp->cdef); \
3395*c0909341SAndroid Build Coastguard Worker dav1d_intra_pred_dsp_init_##bd##bpc(&dsp->ipred); \
3396*c0909341SAndroid Build Coastguard Worker dav1d_itx_dsp_init_##bd##bpc(&dsp->itx, bpc); \
3397*c0909341SAndroid Build Coastguard Worker dav1d_loop_filter_dsp_init_##bd##bpc(&dsp->lf); \
3398*c0909341SAndroid Build Coastguard Worker dav1d_loop_restoration_dsp_init_##bd##bpc(&dsp->lr, bpc); \
3399*c0909341SAndroid Build Coastguard Worker dav1d_mc_dsp_init_##bd##bpc(&dsp->mc); \
3400*c0909341SAndroid Build Coastguard Worker dav1d_film_grain_dsp_init_##bd##bpc(&dsp->fg); \
3401*c0909341SAndroid Build Coastguard Worker break
3402*c0909341SAndroid Build Coastguard Worker #if CONFIG_8BPC
3403*c0909341SAndroid Build Coastguard Worker case 8:
3404*c0909341SAndroid Build Coastguard Worker assign_bitdepth_case(8);
3405*c0909341SAndroid Build Coastguard Worker #endif
3406*c0909341SAndroid Build Coastguard Worker #if CONFIG_16BPC
3407*c0909341SAndroid Build Coastguard Worker case 10:
3408*c0909341SAndroid Build Coastguard Worker case 12:
3409*c0909341SAndroid Build Coastguard Worker assign_bitdepth_case(16);
3410*c0909341SAndroid Build Coastguard Worker #endif
3411*c0909341SAndroid Build Coastguard Worker #undef assign_bitdepth_case
3412*c0909341SAndroid Build Coastguard Worker default:
3413*c0909341SAndroid Build Coastguard Worker dav1d_log(c, "Compiled without support for %d-bit decoding\n",
3414*c0909341SAndroid Build Coastguard Worker 8 + 2 * f->seq_hdr->hbd);
3415*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(ENOPROTOOPT);
3416*c0909341SAndroid Build Coastguard Worker goto error;
3417*c0909341SAndroid Build Coastguard Worker }
3418*c0909341SAndroid Build Coastguard Worker }
3419*c0909341SAndroid Build Coastguard Worker
3420*c0909341SAndroid Build Coastguard Worker #define assign_bitdepth_case(bd) \
3421*c0909341SAndroid Build Coastguard Worker f->bd_fn.recon_b_inter = dav1d_recon_b_inter_##bd##bpc; \
3422*c0909341SAndroid Build Coastguard Worker f->bd_fn.recon_b_intra = dav1d_recon_b_intra_##bd##bpc; \
3423*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow = dav1d_filter_sbrow_##bd##bpc; \
3424*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow_deblock_cols = dav1d_filter_sbrow_deblock_cols_##bd##bpc; \
3425*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow_deblock_rows = dav1d_filter_sbrow_deblock_rows_##bd##bpc; \
3426*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow_cdef = dav1d_filter_sbrow_cdef_##bd##bpc; \
3427*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow_resize = dav1d_filter_sbrow_resize_##bd##bpc; \
3428*c0909341SAndroid Build Coastguard Worker f->bd_fn.filter_sbrow_lr = dav1d_filter_sbrow_lr_##bd##bpc; \
3429*c0909341SAndroid Build Coastguard Worker f->bd_fn.backup_ipred_edge = dav1d_backup_ipred_edge_##bd##bpc; \
3430*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_coef_blocks = dav1d_read_coef_blocks_##bd##bpc; \
3431*c0909341SAndroid Build Coastguard Worker f->bd_fn.copy_pal_block_y = dav1d_copy_pal_block_y_##bd##bpc; \
3432*c0909341SAndroid Build Coastguard Worker f->bd_fn.copy_pal_block_uv = dav1d_copy_pal_block_uv_##bd##bpc; \
3433*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_pal_plane = dav1d_read_pal_plane_##bd##bpc; \
3434*c0909341SAndroid Build Coastguard Worker f->bd_fn.read_pal_uv = dav1d_read_pal_uv_##bd##bpc
3435*c0909341SAndroid Build Coastguard Worker if (!f->seq_hdr->hbd) {
3436*c0909341SAndroid Build Coastguard Worker #if CONFIG_8BPC
3437*c0909341SAndroid Build Coastguard Worker assign_bitdepth_case(8);
3438*c0909341SAndroid Build Coastguard Worker #endif
3439*c0909341SAndroid Build Coastguard Worker } else {
3440*c0909341SAndroid Build Coastguard Worker #if CONFIG_16BPC
3441*c0909341SAndroid Build Coastguard Worker assign_bitdepth_case(16);
3442*c0909341SAndroid Build Coastguard Worker #endif
3443*c0909341SAndroid Build Coastguard Worker }
3444*c0909341SAndroid Build Coastguard Worker #undef assign_bitdepth_case
3445*c0909341SAndroid Build Coastguard Worker
3446*c0909341SAndroid Build Coastguard Worker int ref_coded_width[7];
3447*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr)) {
3448*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->primary_ref_frame != DAV1D_PRIMARY_REF_NONE) {
3449*c0909341SAndroid Build Coastguard Worker const int pri_ref = f->frame_hdr->refidx[f->frame_hdr->primary_ref_frame];
3450*c0909341SAndroid Build Coastguard Worker if (!c->refs[pri_ref].p.p.data[0]) {
3451*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(EINVAL);
3452*c0909341SAndroid Build Coastguard Worker goto error;
3453*c0909341SAndroid Build Coastguard Worker }
3454*c0909341SAndroid Build Coastguard Worker }
3455*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++) {
3456*c0909341SAndroid Build Coastguard Worker const int refidx = f->frame_hdr->refidx[i];
3457*c0909341SAndroid Build Coastguard Worker if (!c->refs[refidx].p.p.data[0] ||
3458*c0909341SAndroid Build Coastguard Worker f->frame_hdr->width[0] * 2 < c->refs[refidx].p.p.p.w ||
3459*c0909341SAndroid Build Coastguard Worker f->frame_hdr->height * 2 < c->refs[refidx].p.p.p.h ||
3460*c0909341SAndroid Build Coastguard Worker f->frame_hdr->width[0] > c->refs[refidx].p.p.p.w * 16 ||
3461*c0909341SAndroid Build Coastguard Worker f->frame_hdr->height > c->refs[refidx].p.p.p.h * 16 ||
3462*c0909341SAndroid Build Coastguard Worker f->seq_hdr->layout != c->refs[refidx].p.p.p.layout ||
3463*c0909341SAndroid Build Coastguard Worker bpc != c->refs[refidx].p.p.p.bpc)
3464*c0909341SAndroid Build Coastguard Worker {
3465*c0909341SAndroid Build Coastguard Worker for (int j = 0; j < i; j++)
3466*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&f->refp[j]);
3467*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(EINVAL);
3468*c0909341SAndroid Build Coastguard Worker goto error;
3469*c0909341SAndroid Build Coastguard Worker }
3470*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_ref(&f->refp[i], &c->refs[refidx].p);
3471*c0909341SAndroid Build Coastguard Worker ref_coded_width[i] = c->refs[refidx].p.p.frame_hdr->width[0];
3472*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != c->refs[refidx].p.p.p.w ||
3473*c0909341SAndroid Build Coastguard Worker f->frame_hdr->height != c->refs[refidx].p.p.p.h)
3474*c0909341SAndroid Build Coastguard Worker {
3475*c0909341SAndroid Build Coastguard Worker #define scale_fac(ref_sz, this_sz) \
3476*c0909341SAndroid Build Coastguard Worker ((((ref_sz) << 14) + ((this_sz) >> 1)) / (this_sz))
3477*c0909341SAndroid Build Coastguard Worker f->svc[i][0].scale = scale_fac(c->refs[refidx].p.p.p.w,
3478*c0909341SAndroid Build Coastguard Worker f->frame_hdr->width[0]);
3479*c0909341SAndroid Build Coastguard Worker f->svc[i][1].scale = scale_fac(c->refs[refidx].p.p.p.h,
3480*c0909341SAndroid Build Coastguard Worker f->frame_hdr->height);
3481*c0909341SAndroid Build Coastguard Worker f->svc[i][0].step = (f->svc[i][0].scale + 8) >> 4;
3482*c0909341SAndroid Build Coastguard Worker f->svc[i][1].step = (f->svc[i][1].scale + 8) >> 4;
3483*c0909341SAndroid Build Coastguard Worker } else {
3484*c0909341SAndroid Build Coastguard Worker f->svc[i][0].scale = f->svc[i][1].scale = 0;
3485*c0909341SAndroid Build Coastguard Worker }
3486*c0909341SAndroid Build Coastguard Worker f->gmv_warp_allowed[i] = f->frame_hdr->gmv[i].type > DAV1D_WM_TYPE_TRANSLATION &&
3487*c0909341SAndroid Build Coastguard Worker !f->frame_hdr->force_integer_mv &&
3488*c0909341SAndroid Build Coastguard Worker !dav1d_get_shear_params(&f->frame_hdr->gmv[i]) &&
3489*c0909341SAndroid Build Coastguard Worker !f->svc[i][0].scale;
3490*c0909341SAndroid Build Coastguard Worker }
3491*c0909341SAndroid Build Coastguard Worker }
3492*c0909341SAndroid Build Coastguard Worker
3493*c0909341SAndroid Build Coastguard Worker // setup entropy
3494*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->primary_ref_frame == DAV1D_PRIMARY_REF_NONE) {
3495*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_init_static(&f->in_cdf, f->frame_hdr->quant.yac);
3496*c0909341SAndroid Build Coastguard Worker } else {
3497*c0909341SAndroid Build Coastguard Worker const int pri_ref = f->frame_hdr->refidx[f->frame_hdr->primary_ref_frame];
3498*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_ref(&f->in_cdf, &c->cdf[pri_ref]);
3499*c0909341SAndroid Build Coastguard Worker }
3500*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->refresh_context) {
3501*c0909341SAndroid Build Coastguard Worker res = dav1d_cdf_thread_alloc(c, &f->out_cdf, c->n_fc > 1);
3502*c0909341SAndroid Build Coastguard Worker if (res < 0) goto error;
3503*c0909341SAndroid Build Coastguard Worker }
3504*c0909341SAndroid Build Coastguard Worker
3505*c0909341SAndroid Build Coastguard Worker // FIXME qsort so tiles are in order (for frame threading)
3506*c0909341SAndroid Build Coastguard Worker if (f->n_tile_data_alloc < c->n_tile_data) {
3507*c0909341SAndroid Build Coastguard Worker dav1d_free(f->tile);
3508*c0909341SAndroid Build Coastguard Worker assert(c->n_tile_data < INT_MAX / (int)sizeof(*f->tile));
3509*c0909341SAndroid Build Coastguard Worker f->tile = dav1d_malloc(ALLOC_TILE, c->n_tile_data * sizeof(*f->tile));
3510*c0909341SAndroid Build Coastguard Worker if (!f->tile) {
3511*c0909341SAndroid Build Coastguard Worker f->n_tile_data_alloc = f->n_tile_data = 0;
3512*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(ENOMEM);
3513*c0909341SAndroid Build Coastguard Worker goto error;
3514*c0909341SAndroid Build Coastguard Worker }
3515*c0909341SAndroid Build Coastguard Worker f->n_tile_data_alloc = c->n_tile_data;
3516*c0909341SAndroid Build Coastguard Worker }
3517*c0909341SAndroid Build Coastguard Worker memcpy(f->tile, c->tile, c->n_tile_data * sizeof(*f->tile));
3518*c0909341SAndroid Build Coastguard Worker memset(c->tile, 0, c->n_tile_data * sizeof(*c->tile));
3519*c0909341SAndroid Build Coastguard Worker f->n_tile_data = c->n_tile_data;
3520*c0909341SAndroid Build Coastguard Worker c->n_tile_data = 0;
3521*c0909341SAndroid Build Coastguard Worker
3522*c0909341SAndroid Build Coastguard Worker // allocate frame
3523*c0909341SAndroid Build Coastguard Worker res = dav1d_thread_picture_alloc(c, f, bpc);
3524*c0909341SAndroid Build Coastguard Worker if (res < 0) goto error;
3525*c0909341SAndroid Build Coastguard Worker
3526*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != f->frame_hdr->width[1]) {
3527*c0909341SAndroid Build Coastguard Worker res = dav1d_picture_alloc_copy(c, &f->cur, f->frame_hdr->width[0], &f->sr_cur.p);
3528*c0909341SAndroid Build Coastguard Worker if (res < 0) goto error;
3529*c0909341SAndroid Build Coastguard Worker } else {
3530*c0909341SAndroid Build Coastguard Worker dav1d_picture_ref(&f->cur, &f->sr_cur.p);
3531*c0909341SAndroid Build Coastguard Worker }
3532*c0909341SAndroid Build Coastguard Worker
3533*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->width[0] != f->frame_hdr->width[1]) {
3534*c0909341SAndroid Build Coastguard Worker f->resize_step[0] = scale_fac(f->cur.p.w, f->sr_cur.p.p.w);
3535*c0909341SAndroid Build Coastguard Worker const int ss_hor = f->cur.p.layout != DAV1D_PIXEL_LAYOUT_I444;
3536*c0909341SAndroid Build Coastguard Worker const int in_cw = (f->cur.p.w + ss_hor) >> ss_hor;
3537*c0909341SAndroid Build Coastguard Worker const int out_cw = (f->sr_cur.p.p.w + ss_hor) >> ss_hor;
3538*c0909341SAndroid Build Coastguard Worker f->resize_step[1] = scale_fac(in_cw, out_cw);
3539*c0909341SAndroid Build Coastguard Worker #undef scale_fac
3540*c0909341SAndroid Build Coastguard Worker f->resize_start[0] = get_upscale_x0(f->cur.p.w, f->sr_cur.p.p.w, f->resize_step[0]);
3541*c0909341SAndroid Build Coastguard Worker f->resize_start[1] = get_upscale_x0(in_cw, out_cw, f->resize_step[1]);
3542*c0909341SAndroid Build Coastguard Worker }
3543*c0909341SAndroid Build Coastguard Worker
3544*c0909341SAndroid Build Coastguard Worker // move f->cur into output queue
3545*c0909341SAndroid Build Coastguard Worker if (c->n_fc == 1) {
3546*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->show_frame || c->output_invisible_frames) {
3547*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_ref(&c->out, &f->sr_cur);
3548*c0909341SAndroid Build Coastguard Worker c->event_flags |= dav1d_picture_get_event_flags(&f->sr_cur);
3549*c0909341SAndroid Build Coastguard Worker }
3550*c0909341SAndroid Build Coastguard Worker } else {
3551*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_ref(out_delayed, &f->sr_cur);
3552*c0909341SAndroid Build Coastguard Worker }
3553*c0909341SAndroid Build Coastguard Worker
3554*c0909341SAndroid Build Coastguard Worker f->w4 = (f->frame_hdr->width[0] + 3) >> 2;
3555*c0909341SAndroid Build Coastguard Worker f->h4 = (f->frame_hdr->height + 3) >> 2;
3556*c0909341SAndroid Build Coastguard Worker f->bw = ((f->frame_hdr->width[0] + 7) >> 3) << 1;
3557*c0909341SAndroid Build Coastguard Worker f->bh = ((f->frame_hdr->height + 7) >> 3) << 1;
3558*c0909341SAndroid Build Coastguard Worker f->sb128w = (f->bw + 31) >> 5;
3559*c0909341SAndroid Build Coastguard Worker f->sb128h = (f->bh + 31) >> 5;
3560*c0909341SAndroid Build Coastguard Worker f->sb_shift = 4 + f->seq_hdr->sb128;
3561*c0909341SAndroid Build Coastguard Worker f->sb_step = 16 << f->seq_hdr->sb128;
3562*c0909341SAndroid Build Coastguard Worker f->sbh = (f->bh + f->sb_step - 1) >> f->sb_shift;
3563*c0909341SAndroid Build Coastguard Worker f->b4_stride = (f->bw + 31) & ~31;
3564*c0909341SAndroid Build Coastguard Worker f->bitdepth_max = (1 << f->cur.p.bpc) - 1;
3565*c0909341SAndroid Build Coastguard Worker atomic_init(&f->task_thread.error, 0);
3566*c0909341SAndroid Build Coastguard Worker const int uses_2pass = c->n_fc > 1;
3567*c0909341SAndroid Build Coastguard Worker const int cols = f->frame_hdr->tiling.cols;
3568*c0909341SAndroid Build Coastguard Worker const int rows = f->frame_hdr->tiling.rows;
3569*c0909341SAndroid Build Coastguard Worker atomic_store(&f->task_thread.task_counter,
3570*c0909341SAndroid Build Coastguard Worker (cols * rows + f->sbh) << uses_2pass);
3571*c0909341SAndroid Build Coastguard Worker
3572*c0909341SAndroid Build Coastguard Worker // ref_mvs
3573*c0909341SAndroid Build Coastguard Worker if (IS_INTER_OR_SWITCH(f->frame_hdr) || f->frame_hdr->allow_intrabc) {
3574*c0909341SAndroid Build Coastguard Worker f->mvs_ref = dav1d_ref_create_using_pool(c->refmvs_pool,
3575*c0909341SAndroid Build Coastguard Worker sizeof(*f->mvs) * f->sb128h * 16 * (f->b4_stride >> 1));
3576*c0909341SAndroid Build Coastguard Worker if (!f->mvs_ref) {
3577*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(ENOMEM);
3578*c0909341SAndroid Build Coastguard Worker goto error;
3579*c0909341SAndroid Build Coastguard Worker }
3580*c0909341SAndroid Build Coastguard Worker f->mvs = f->mvs_ref->data;
3581*c0909341SAndroid Build Coastguard Worker if (!f->frame_hdr->allow_intrabc) {
3582*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++)
3583*c0909341SAndroid Build Coastguard Worker f->refpoc[i] = f->refp[i].p.frame_hdr->frame_offset;
3584*c0909341SAndroid Build Coastguard Worker } else {
3585*c0909341SAndroid Build Coastguard Worker memset(f->refpoc, 0, sizeof(f->refpoc));
3586*c0909341SAndroid Build Coastguard Worker }
3587*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->use_ref_frame_mvs) {
3588*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++) {
3589*c0909341SAndroid Build Coastguard Worker const int refidx = f->frame_hdr->refidx[i];
3590*c0909341SAndroid Build Coastguard Worker const int ref_w = ((ref_coded_width[i] + 7) >> 3) << 1;
3591*c0909341SAndroid Build Coastguard Worker const int ref_h = ((f->refp[i].p.p.h + 7) >> 3) << 1;
3592*c0909341SAndroid Build Coastguard Worker if (c->refs[refidx].refmvs != NULL &&
3593*c0909341SAndroid Build Coastguard Worker ref_w == f->bw && ref_h == f->bh)
3594*c0909341SAndroid Build Coastguard Worker {
3595*c0909341SAndroid Build Coastguard Worker f->ref_mvs_ref[i] = c->refs[refidx].refmvs;
3596*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->ref_mvs_ref[i]);
3597*c0909341SAndroid Build Coastguard Worker f->ref_mvs[i] = c->refs[refidx].refmvs->data;
3598*c0909341SAndroid Build Coastguard Worker } else {
3599*c0909341SAndroid Build Coastguard Worker f->ref_mvs[i] = NULL;
3600*c0909341SAndroid Build Coastguard Worker f->ref_mvs_ref[i] = NULL;
3601*c0909341SAndroid Build Coastguard Worker }
3602*c0909341SAndroid Build Coastguard Worker memcpy(f->refrefpoc[i], c->refs[refidx].refpoc,
3603*c0909341SAndroid Build Coastguard Worker sizeof(*f->refrefpoc));
3604*c0909341SAndroid Build Coastguard Worker }
3605*c0909341SAndroid Build Coastguard Worker } else {
3606*c0909341SAndroid Build Coastguard Worker memset(f->ref_mvs_ref, 0, sizeof(f->ref_mvs_ref));
3607*c0909341SAndroid Build Coastguard Worker }
3608*c0909341SAndroid Build Coastguard Worker } else {
3609*c0909341SAndroid Build Coastguard Worker f->mvs_ref = NULL;
3610*c0909341SAndroid Build Coastguard Worker memset(f->ref_mvs_ref, 0, sizeof(f->ref_mvs_ref));
3611*c0909341SAndroid Build Coastguard Worker }
3612*c0909341SAndroid Build Coastguard Worker
3613*c0909341SAndroid Build Coastguard Worker // segmap
3614*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.enabled) {
3615*c0909341SAndroid Build Coastguard Worker // By default, the previous segmentation map is not initialised.
3616*c0909341SAndroid Build Coastguard Worker f->prev_segmap_ref = NULL;
3617*c0909341SAndroid Build Coastguard Worker f->prev_segmap = NULL;
3618*c0909341SAndroid Build Coastguard Worker
3619*c0909341SAndroid Build Coastguard Worker // We might need a previous frame's segmentation map. This
3620*c0909341SAndroid Build Coastguard Worker // happens if there is either no update or a temporal update.
3621*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.temporal || !f->frame_hdr->segmentation.update_map) {
3622*c0909341SAndroid Build Coastguard Worker const int pri_ref = f->frame_hdr->primary_ref_frame;
3623*c0909341SAndroid Build Coastguard Worker assert(pri_ref != DAV1D_PRIMARY_REF_NONE);
3624*c0909341SAndroid Build Coastguard Worker const int ref_w = ((ref_coded_width[pri_ref] + 7) >> 3) << 1;
3625*c0909341SAndroid Build Coastguard Worker const int ref_h = ((f->refp[pri_ref].p.p.h + 7) >> 3) << 1;
3626*c0909341SAndroid Build Coastguard Worker if (ref_w == f->bw && ref_h == f->bh) {
3627*c0909341SAndroid Build Coastguard Worker f->prev_segmap_ref = c->refs[f->frame_hdr->refidx[pri_ref]].segmap;
3628*c0909341SAndroid Build Coastguard Worker if (f->prev_segmap_ref) {
3629*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->prev_segmap_ref);
3630*c0909341SAndroid Build Coastguard Worker f->prev_segmap = f->prev_segmap_ref->data;
3631*c0909341SAndroid Build Coastguard Worker }
3632*c0909341SAndroid Build Coastguard Worker }
3633*c0909341SAndroid Build Coastguard Worker }
3634*c0909341SAndroid Build Coastguard Worker
3635*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->segmentation.update_map) {
3636*c0909341SAndroid Build Coastguard Worker // We're updating an existing map, but need somewhere to
3637*c0909341SAndroid Build Coastguard Worker // put the new values. Allocate them here (the data
3638*c0909341SAndroid Build Coastguard Worker // actually gets set elsewhere)
3639*c0909341SAndroid Build Coastguard Worker f->cur_segmap_ref = dav1d_ref_create_using_pool(c->segmap_pool,
3640*c0909341SAndroid Build Coastguard Worker sizeof(*f->cur_segmap) * f->b4_stride * 32 * f->sb128h);
3641*c0909341SAndroid Build Coastguard Worker if (!f->cur_segmap_ref) {
3642*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->prev_segmap_ref);
3643*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(ENOMEM);
3644*c0909341SAndroid Build Coastguard Worker goto error;
3645*c0909341SAndroid Build Coastguard Worker }
3646*c0909341SAndroid Build Coastguard Worker f->cur_segmap = f->cur_segmap_ref->data;
3647*c0909341SAndroid Build Coastguard Worker } else if (f->prev_segmap_ref) {
3648*c0909341SAndroid Build Coastguard Worker // We're not updating an existing map, and we have a valid
3649*c0909341SAndroid Build Coastguard Worker // reference. Use that.
3650*c0909341SAndroid Build Coastguard Worker f->cur_segmap_ref = f->prev_segmap_ref;
3651*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->cur_segmap_ref);
3652*c0909341SAndroid Build Coastguard Worker f->cur_segmap = f->prev_segmap_ref->data;
3653*c0909341SAndroid Build Coastguard Worker } else {
3654*c0909341SAndroid Build Coastguard Worker // We need to make a new map. Allocate one here and zero it out.
3655*c0909341SAndroid Build Coastguard Worker const size_t segmap_size = sizeof(*f->cur_segmap) * f->b4_stride * 32 * f->sb128h;
3656*c0909341SAndroid Build Coastguard Worker f->cur_segmap_ref = dav1d_ref_create_using_pool(c->segmap_pool, segmap_size);
3657*c0909341SAndroid Build Coastguard Worker if (!f->cur_segmap_ref) {
3658*c0909341SAndroid Build Coastguard Worker res = DAV1D_ERR(ENOMEM);
3659*c0909341SAndroid Build Coastguard Worker goto error;
3660*c0909341SAndroid Build Coastguard Worker }
3661*c0909341SAndroid Build Coastguard Worker f->cur_segmap = f->cur_segmap_ref->data;
3662*c0909341SAndroid Build Coastguard Worker memset(f->cur_segmap, 0, segmap_size);
3663*c0909341SAndroid Build Coastguard Worker }
3664*c0909341SAndroid Build Coastguard Worker } else {
3665*c0909341SAndroid Build Coastguard Worker f->cur_segmap = NULL;
3666*c0909341SAndroid Build Coastguard Worker f->cur_segmap_ref = NULL;
3667*c0909341SAndroid Build Coastguard Worker f->prev_segmap_ref = NULL;
3668*c0909341SAndroid Build Coastguard Worker }
3669*c0909341SAndroid Build Coastguard Worker
3670*c0909341SAndroid Build Coastguard Worker // update references etc.
3671*c0909341SAndroid Build Coastguard Worker const unsigned refresh_frame_flags = f->frame_hdr->refresh_frame_flags;
3672*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 8; i++) {
3673*c0909341SAndroid Build Coastguard Worker if (refresh_frame_flags & (1 << i)) {
3674*c0909341SAndroid Build Coastguard Worker if (c->refs[i].p.p.frame_hdr)
3675*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&c->refs[i].p);
3676*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_ref(&c->refs[i].p, &f->sr_cur);
3677*c0909341SAndroid Build Coastguard Worker
3678*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&c->cdf[i]);
3679*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->refresh_context) {
3680*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_ref(&c->cdf[i], &f->out_cdf);
3681*c0909341SAndroid Build Coastguard Worker } else {
3682*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_ref(&c->cdf[i], &f->in_cdf);
3683*c0909341SAndroid Build Coastguard Worker }
3684*c0909341SAndroid Build Coastguard Worker
3685*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&c->refs[i].segmap);
3686*c0909341SAndroid Build Coastguard Worker c->refs[i].segmap = f->cur_segmap_ref;
3687*c0909341SAndroid Build Coastguard Worker if (f->cur_segmap_ref)
3688*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->cur_segmap_ref);
3689*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&c->refs[i].refmvs);
3690*c0909341SAndroid Build Coastguard Worker if (!f->frame_hdr->allow_intrabc) {
3691*c0909341SAndroid Build Coastguard Worker c->refs[i].refmvs = f->mvs_ref;
3692*c0909341SAndroid Build Coastguard Worker if (f->mvs_ref)
3693*c0909341SAndroid Build Coastguard Worker dav1d_ref_inc(f->mvs_ref);
3694*c0909341SAndroid Build Coastguard Worker }
3695*c0909341SAndroid Build Coastguard Worker memcpy(c->refs[i].refpoc, f->refpoc, sizeof(f->refpoc));
3696*c0909341SAndroid Build Coastguard Worker }
3697*c0909341SAndroid Build Coastguard Worker }
3698*c0909341SAndroid Build Coastguard Worker
3699*c0909341SAndroid Build Coastguard Worker if (c->n_fc == 1) {
3700*c0909341SAndroid Build Coastguard Worker if ((res = dav1d_decode_frame(f)) < 0) {
3701*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&c->out);
3702*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 8; i++) {
3703*c0909341SAndroid Build Coastguard Worker if (refresh_frame_flags & (1 << i)) {
3704*c0909341SAndroid Build Coastguard Worker if (c->refs[i].p.p.frame_hdr)
3705*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&c->refs[i].p);
3706*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&c->cdf[i]);
3707*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&c->refs[i].segmap);
3708*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&c->refs[i].refmvs);
3709*c0909341SAndroid Build Coastguard Worker }
3710*c0909341SAndroid Build Coastguard Worker }
3711*c0909341SAndroid Build Coastguard Worker goto error;
3712*c0909341SAndroid Build Coastguard Worker }
3713*c0909341SAndroid Build Coastguard Worker } else {
3714*c0909341SAndroid Build Coastguard Worker dav1d_task_frame_init(f);
3715*c0909341SAndroid Build Coastguard Worker pthread_mutex_unlock(&c->task_thread.lock);
3716*c0909341SAndroid Build Coastguard Worker }
3717*c0909341SAndroid Build Coastguard Worker
3718*c0909341SAndroid Build Coastguard Worker return 0;
3719*c0909341SAndroid Build Coastguard Worker error:
3720*c0909341SAndroid Build Coastguard Worker atomic_init(&f->task_thread.error, 1);
3721*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&f->in_cdf);
3722*c0909341SAndroid Build Coastguard Worker if (f->frame_hdr->refresh_context)
3723*c0909341SAndroid Build Coastguard Worker dav1d_cdf_thread_unref(&f->out_cdf);
3724*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < 7; i++) {
3725*c0909341SAndroid Build Coastguard Worker if (f->refp[i].p.frame_hdr)
3726*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&f->refp[i]);
3727*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->ref_mvs_ref[i]);
3728*c0909341SAndroid Build Coastguard Worker }
3729*c0909341SAndroid Build Coastguard Worker if (c->n_fc == 1)
3730*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&c->out);
3731*c0909341SAndroid Build Coastguard Worker else
3732*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(out_delayed);
3733*c0909341SAndroid Build Coastguard Worker dav1d_picture_unref_internal(&f->cur);
3734*c0909341SAndroid Build Coastguard Worker dav1d_thread_picture_unref(&f->sr_cur);
3735*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->mvs_ref);
3736*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->seq_hdr_ref);
3737*c0909341SAndroid Build Coastguard Worker dav1d_ref_dec(&f->frame_hdr_ref);
3738*c0909341SAndroid Build Coastguard Worker dav1d_data_props_copy(&c->cached_error_props, &c->in.m);
3739*c0909341SAndroid Build Coastguard Worker
3740*c0909341SAndroid Build Coastguard Worker for (int i = 0; i < f->n_tile_data; i++)
3741*c0909341SAndroid Build Coastguard Worker dav1d_data_unref_internal(&f->tile[i].data);
3742*c0909341SAndroid Build Coastguard Worker f->n_tile_data = 0;
3743*c0909341SAndroid Build Coastguard Worker
3744*c0909341SAndroid Build Coastguard Worker if (c->n_fc > 1)
3745*c0909341SAndroid Build Coastguard Worker pthread_mutex_unlock(&c->task_thread.lock);
3746*c0909341SAndroid Build Coastguard Worker
3747*c0909341SAndroid Build Coastguard Worker return res;
3748*c0909341SAndroid Build Coastguard Worker }
3749