1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // VP8Iterator: block iterator
11*b2055c35SXin Li //
12*b2055c35SXin Li // Author: Skal ([email protected])
13*b2055c35SXin Li
14*b2055c35SXin Li #include <string.h>
15*b2055c35SXin Li
16*b2055c35SXin Li #include "src/enc/vp8i_enc.h"
17*b2055c35SXin Li
18*b2055c35SXin Li //------------------------------------------------------------------------------
19*b2055c35SXin Li // VP8Iterator
20*b2055c35SXin Li //------------------------------------------------------------------------------
21*b2055c35SXin Li
// Resets the left-border samples of the iterator to their default values.
// The 16 luma and 8 + 8 chroma left samples are filled with 129. The top-left
// corner sample of each plane (index -1) is 129 too, except on the first
// macroblock row (it->y_ == 0) where it is 127.
// Also clears slot #8 of the left non-zero context and, when it->top_derr_ is
// set, zeroes it->left_derr_.
static void InitLeft(VP8EncIterator* const it) {
  const int corner = (it->y_ > 0) ? 129 : 127;

  // Top-left corner samples.
  it->v_left_[-1] = corner;
  it->u_left_[-1] = corner;
  it->y_left_[-1] = corner;

  // Left columns.
  memset(it->v_left_, 129, 8);
  memset(it->u_left_, 129, 8);
  memset(it->y_left_, 129, 16);

  it->left_nz_[8] = 0;
  if (it->top_derr_ != NULL) {
    memset(&it->left_derr_, 0, sizeof(it->left_derr_));
  }
}
33*b2055c35SXin Li
// Resets the encoder-wide 'top' state shared by all macroblocks of a row:
//  - 2 * 16 * mb_w_ bytes starting at enc->y_top_ are set to 127
//    (presumably this also covers the chroma top samples stored right after
//    the luma ones -- confirm against the allocation of y_top_ / uv_top_),
//  - the mb_w_ entries of enc->nz_ are zeroed,
//  - the mb_w_ entries of enc->top_derr_ are zeroed, if that buffer exists.
static void InitTop(VP8EncIterator* const it) {
  const VP8Encoder* const enc = it->enc_;
  const size_t luma_row_bytes = enc->mb_w_ * 16;
  const size_t nz_bytes = enc->mb_w_ * sizeof(*enc->nz_);

  if (enc->top_derr_ != NULL) {
    memset(enc->top_derr_, 0, enc->mb_w_ * sizeof(*enc->top_derr_));
  }
  memset(enc->nz_, 0, nz_bytes);
  memset(enc->y_top_, 127, luma_row_bytes + luma_row_bytes);
}
43*b2055c35SXin Li
// Positions the iterator on the first macroblock (x_ = 0) of row 'y'.
// All per-row cursors (bit writer, prediction modes, macroblock info,
// non-zero contexts, top samples) are rewound accordingly and the left
// border is reset.
void VP8IteratorSetRow(VP8EncIterator* const it, int y) {
  VP8Encoder* const enc = it->enc_;

  // Position. Must be set before InitLeft(), which reads it->y_.
  it->y_ = y;
  it->x_ = 0;

  // Cursors that depend on the row index.
  // The partition is picked with a mask, which presumably relies on
  // num_parts_ being a power of two -- confirm.
  it->bw_ = enc->parts_ + (y & (enc->num_parts_ - 1));
  it->preds_ = &enc->preds_[y * 4 * enc->preds_w_];
  it->mb_ = &enc->mb_info_[y * enc->mb_w_];

  // Cursors that restart from the beginning of the shared per-row buffers.
  it->nz_ = enc->nz_;
  it->y_top_ = enc->y_top_;
  it->uv_top_ = enc->uv_top_;

  InitLeft(it);
}
56*b2055c35SXin Li
// Rewinds the iterator to the first macroblock of the picture: row 0, a
// count-down covering all mb_w_ * mb_h_ macroblocks, default top samples,
// cleared bit counters and trellis turned off.
void VP8IteratorReset(VP8EncIterator* const it) {
  VP8Encoder* const enc = it->enc_;
  const int total_mbs = enc->mb_w_ * enc->mb_h_;

  it->do_trellis_ = 0;
  memset(it->bit_count_, 0, sizeof(it->bit_count_));

  VP8IteratorSetRow(it, 0);
  VP8IteratorSetCountDown(it, total_mbs);  // default: visit every macroblock
  InitTop(it);
}
65*b2055c35SXin Li
// Sets the number of macroblocks left to visit. The initial value is kept in
// count_down0_ so that progress can later be computed relative to it.
void VP8IteratorSetCountDown(VP8EncIterator* const it, int count_down) {
  it->count_down0_ = count_down;
  it->count_down_ = it->count_down0_;
}
69*b2055c35SXin Li
VP8IteratorIsDone(const VP8EncIterator * const it)70*b2055c35SXin Li int VP8IteratorIsDone(const VP8EncIterator* const it) {
71*b2055c35SXin Li return (it->count_down_ <= 0);
72*b2055c35SXin Li }
73*b2055c35SXin Li
// Binds iterator 'it' to encoder 'enc' and sets up its working buffers, then
// resets it to the start of the picture.
//
// Sample caches: four consecutive areas of YUV_SIZE_ENC bytes each, carved
// out of the aligned it->yuv_mem_ storage, in the order
// yuv_in_, yuv_out_, yuv_out2_, yuv_p_.
//
// Left samples: y_left_ starts at the aligned address of yuv_left_mem_ + 1,
// which leaves room for the top-left sample at index -1. u_left_ lies 32
// bytes after y_left_ and v_left_ 16 bytes after u_left_.
void VP8IteratorInit(VP8Encoder* const enc, VP8EncIterator* const it) {
  uint8_t* const in = (uint8_t*)WEBP_ALIGN(it->yuv_mem_);
  uint8_t* const out = in + YUV_SIZE_ENC;
  uint8_t* const out2 = out + YUV_SIZE_ENC;
  uint8_t* const left = (uint8_t*)WEBP_ALIGN(it->yuv_left_mem_ + 1);

  it->enc_ = enc;

  it->yuv_in_ = in;
  it->yuv_out_ = out;
  it->yuv_out2_ = out2;
  it->yuv_p_ = out2 + YUV_SIZE_ENC;

  it->y_left_ = left;
  it->u_left_ = left + 32;
  it->v_left_ = it->u_left_ + 16;

  // State inherited from the encoder.
  it->lf_stats_ = enc->lf_stats_;
  it->percent0_ = enc->percent_;
  it->top_derr_ = enc->top_derr_;

  VP8IteratorReset(it);
}
88*b2055c35SXin Li
VP8IteratorProgress(const VP8EncIterator * const it,int delta)89*b2055c35SXin Li int VP8IteratorProgress(const VP8EncIterator* const it, int delta) {
90*b2055c35SXin Li VP8Encoder* const enc = it->enc_;
91*b2055c35SXin Li if (delta && enc->pic_->progress_hook != NULL) {
92*b2055c35SXin Li const int done = it->count_down0_ - it->count_down_;
93*b2055c35SXin Li const int percent = (it->count_down0_ <= 0)
94*b2055c35SXin Li ? it->percent0_
95*b2055c35SXin Li : it->percent0_ + delta * done / it->count_down0_;
96*b2055c35SXin Li return WebPReportProgress(enc->pic_, percent, &enc->percent_);
97*b2055c35SXin Li }
98*b2055c35SXin Li return 1;
99*b2055c35SXin Li }
100*b2055c35SXin Li
101*b2055c35SXin Li //------------------------------------------------------------------------------
102*b2055c35SXin Li // Import the source samples into the cache. Takes care of replicating
103*b2055c35SXin Li // boundary pixels if necessary.
104*b2055c35SXin Li
MinSize(int a,int b)105*b2055c35SXin Li static WEBP_INLINE int MinSize(int a, int b) { return (a < b) ? a : b; }
106*b2055c35SXin Li
ImportBlock(const uint8_t * src,int src_stride,uint8_t * dst,int w,int h,int size)107*b2055c35SXin Li static void ImportBlock(const uint8_t* src, int src_stride,
108*b2055c35SXin Li uint8_t* dst, int w, int h, int size) {
109*b2055c35SXin Li int i;
110*b2055c35SXin Li for (i = 0; i < h; ++i) {
111*b2055c35SXin Li memcpy(dst, src, w);
112*b2055c35SXin Li if (w < size) {
113*b2055c35SXin Li memset(dst + w, dst[w - 1], size - w);
114*b2055c35SXin Li }
115*b2055c35SXin Li dst += BPS;
116*b2055c35SXin Li src += src_stride;
117*b2055c35SXin Li }
118*b2055c35SXin Li for (i = h; i < size; ++i) {
119*b2055c35SXin Li memcpy(dst, dst - BPS, size);
120*b2055c35SXin Li dst += BPS;
121*b2055c35SXin Li }
122*b2055c35SXin Li }
123*b2055c35SXin Li
// Gathers 'len' samples from 'src', stepping by 'src_stride' bytes between
// samples, into the contiguous array 'dst'. The remaining entries up to
// 'total_len' are filled with the last gathered sample.
static void ImportLine(const uint8_t* src, int src_stride,
                       uint8_t* dst, int len, int total_len) {
  int pos = 0;
  while (pos < len) {
    dst[pos++] = *src;
    src += src_stride;
  }
  while (pos < total_len) {
    dst[pos++] = dst[len - 1];
  }
}
130*b2055c35SXin Li
// Loads the source samples of the current macroblock into it->yuv_in_,
// replicating edge samples when the macroblock extends past the picture.
//
// If 'tmp_32' is not NULL, the prediction borders are additionally taken from
// the source (uncompressed) picture:
//  - the left columns and top-left corners go to y_left_ / u_left_ / v_left_,
//  - the top rows go to 'tmp_32' (16 luma, then 8 U, then 8 V samples), and
//    it->y_top_ / it->uv_top_ are redirected to point into it.
// Outside the picture the defaults apply: InitLeft() values on the first
// column, 127 for the top row and for the corners on the first row.
void VP8IteratorImport(VP8EncIterator* const it, uint8_t* const tmp_32) {
  const VP8Encoder* const enc = it->enc_;
  const WebPPicture* const pic = enc->pic_;
  const int mb_x = it->x_, mb_y = it->y_;
  const int y_stride = pic->y_stride;
  const int uv_stride = pic->uv_stride;
  const uint8_t* const ysrc = pic->y + (mb_y * y_stride + mb_x) * 16;
  const uint8_t* const usrc = pic->u + (mb_y * uv_stride + mb_x) * 8;
  const uint8_t* const vsrc = pic->v + (mb_y * uv_stride + mb_x) * 8;
  // Visible part of the macroblock, in luma and chroma samples.
  const int w = MinSize(pic->width - mb_x * 16, 16);
  const int h = MinSize(pic->height - mb_y * 16, 16);
  const int uv_w = (w + 1) >> 1;
  const int uv_h = (h + 1) >> 1;
  uint8_t* const yuv_in = it->yuv_in_;

  ImportBlock(ysrc, y_stride, yuv_in + Y_OFF_ENC, w, h, 16);
  ImportBlock(usrc, uv_stride, yuv_in + U_OFF_ENC, uv_w, uv_h, 8);
  ImportBlock(vsrc, uv_stride, yuv_in + V_OFF_ENC, uv_w, uv_h, 8);

  if (tmp_32 == NULL) return;

  // Left border, from the source picture.
  if (mb_x != 0) {
    if (mb_y != 0) {
      // Corner = sample located one row up and one column left.
      it->y_left_[-1] = ysrc[-1 - y_stride];
      it->u_left_[-1] = usrc[-1 - uv_stride];
      it->v_left_[-1] = vsrc[-1 - uv_stride];
    } else {
      it->y_left_[-1] = it->u_left_[-1] = it->v_left_[-1] = 127;
    }
    ImportLine(ysrc - 1, y_stride, it->y_left_, h, 16);
    ImportLine(usrc - 1, uv_stride, it->u_left_, uv_h, 8);
    ImportLine(vsrc - 1, uv_stride, it->v_left_, uv_h, 8);
  } else {
    InitLeft(it);
  }

  // Top border, from the source picture, stored in the caller's scratch area.
  it->y_top_ = tmp_32;
  it->uv_top_ = tmp_32 + 16;
  if (mb_y != 0) {
    ImportLine(ysrc - y_stride, 1, tmp_32, w, 16);
    ImportLine(usrc - uv_stride, 1, tmp_32 + 16, uv_w, 8);
    ImportLine(vsrc - uv_stride, 1, tmp_32 + 16 + 8, uv_w, 8);
  } else {
    memset(tmp_32, 127, 32 * sizeof(*tmp_32));
  }
}
175*b2055c35SXin Li
176*b2055c35SXin Li //------------------------------------------------------------------------------
177*b2055c35SXin Li // Copy back the compressed samples into user space if requested.
178*b2055c35SXin Li
ExportBlock(const uint8_t * src,uint8_t * dst,int dst_stride,int w,int h)179*b2055c35SXin Li static void ExportBlock(const uint8_t* src, uint8_t* dst, int dst_stride,
180*b2055c35SXin Li int w, int h) {
181*b2055c35SXin Li while (h-- > 0) {
182*b2055c35SXin Li memcpy(dst, src, w);
183*b2055c35SXin Li dst += dst_stride;
184*b2055c35SXin Li src += BPS;
185*b2055c35SXin Li }
186*b2055c35SXin Li }
187*b2055c35SXin Li
VP8IteratorExport(const VP8EncIterator * const it)188*b2055c35SXin Li void VP8IteratorExport(const VP8EncIterator* const it) {
189*b2055c35SXin Li const VP8Encoder* const enc = it->enc_;
190*b2055c35SXin Li if (enc->config_->show_compressed) {
191*b2055c35SXin Li const int x = it->x_, y = it->y_;
192*b2055c35SXin Li const uint8_t* const ysrc = it->yuv_out_ + Y_OFF_ENC;
193*b2055c35SXin Li const uint8_t* const usrc = it->yuv_out_ + U_OFF_ENC;
194*b2055c35SXin Li const uint8_t* const vsrc = it->yuv_out_ + V_OFF_ENC;
195*b2055c35SXin Li const WebPPicture* const pic = enc->pic_;
196*b2055c35SXin Li uint8_t* const ydst = pic->y + (y * pic->y_stride + x) * 16;
197*b2055c35SXin Li uint8_t* const udst = pic->u + (y * pic->uv_stride + x) * 8;
198*b2055c35SXin Li uint8_t* const vdst = pic->v + (y * pic->uv_stride + x) * 8;
199*b2055c35SXin Li int w = (pic->width - x * 16);
200*b2055c35SXin Li int h = (pic->height - y * 16);
201*b2055c35SXin Li
202*b2055c35SXin Li if (w > 16) w = 16;
203*b2055c35SXin Li if (h > 16) h = 16;
204*b2055c35SXin Li
205*b2055c35SXin Li // Luma plane
206*b2055c35SXin Li ExportBlock(ysrc, ydst, pic->y_stride, w, h);
207*b2055c35SXin Li
208*b2055c35SXin Li { // U/V planes
209*b2055c35SXin Li const int uv_w = (w + 1) >> 1;
210*b2055c35SXin Li const int uv_h = (h + 1) >> 1;
211*b2055c35SXin Li ExportBlock(usrc, udst, pic->uv_stride, uv_w, uv_h);
212*b2055c35SXin Li ExportBlock(vsrc, vdst, pic->uv_stride, uv_w, uv_h);
213*b2055c35SXin Li }
214*b2055c35SXin Li }
215*b2055c35SXin Li }
216*b2055c35SXin Li
217*b2055c35SXin Li //------------------------------------------------------------------------------
218*b2055c35SXin Li // Non-zero contexts setup/teardown
219*b2055c35SXin Li
220*b2055c35SXin Li // Nz bits:
221*b2055c35SXin Li // 0 1 2 3 Y
222*b2055c35SXin Li // 4 5 6 7
223*b2055c35SXin Li // 8 9 10 11
224*b2055c35SXin Li // 12 13 14 15
225*b2055c35SXin Li // 16 17 U
226*b2055c35SXin Li // 18 19
227*b2055c35SXin Li // 20 21 V
228*b2055c35SXin Li // 22 23
229*b2055c35SXin Li // 24 DC-intra16
230*b2055c35SXin Li
231*b2055c35SXin Li // Convert packed context to byte array
232*b2055c35SXin Li #define BIT(nz, n) (!!((nz) & (1 << (n))))
233*b2055c35SXin Li
VP8IteratorNzToBytes(VP8EncIterator * const it)234*b2055c35SXin Li void VP8IteratorNzToBytes(VP8EncIterator* const it) {
235*b2055c35SXin Li const int tnz = it->nz_[0], lnz = it->nz_[-1];
236*b2055c35SXin Li int* const top_nz = it->top_nz_;
237*b2055c35SXin Li int* const left_nz = it->left_nz_;
238*b2055c35SXin Li
239*b2055c35SXin Li // Top-Y
240*b2055c35SXin Li top_nz[0] = BIT(tnz, 12);
241*b2055c35SXin Li top_nz[1] = BIT(tnz, 13);
242*b2055c35SXin Li top_nz[2] = BIT(tnz, 14);
243*b2055c35SXin Li top_nz[3] = BIT(tnz, 15);
244*b2055c35SXin Li // Top-U
245*b2055c35SXin Li top_nz[4] = BIT(tnz, 18);
246*b2055c35SXin Li top_nz[5] = BIT(tnz, 19);
247*b2055c35SXin Li // Top-V
248*b2055c35SXin Li top_nz[6] = BIT(tnz, 22);
249*b2055c35SXin Li top_nz[7] = BIT(tnz, 23);
250*b2055c35SXin Li // DC
251*b2055c35SXin Li top_nz[8] = BIT(tnz, 24);
252*b2055c35SXin Li
253*b2055c35SXin Li // left-Y
254*b2055c35SXin Li left_nz[0] = BIT(lnz, 3);
255*b2055c35SXin Li left_nz[1] = BIT(lnz, 7);
256*b2055c35SXin Li left_nz[2] = BIT(lnz, 11);
257*b2055c35SXin Li left_nz[3] = BIT(lnz, 15);
258*b2055c35SXin Li // left-U
259*b2055c35SXin Li left_nz[4] = BIT(lnz, 17);
260*b2055c35SXin Li left_nz[5] = BIT(lnz, 19);
261*b2055c35SXin Li // left-V
262*b2055c35SXin Li left_nz[6] = BIT(lnz, 21);
263*b2055c35SXin Li left_nz[7] = BIT(lnz, 23);
264*b2055c35SXin Li // left-DC is special, iterated separately
265*b2055c35SXin Li }
266*b2055c35SXin Li
// Packs the iterator's top_nz_[] / left_nz_[] flags into a single word and
// stores it at *it->nz_.
// left_nz_[3], left_nz_[5] and left_nz_[7] are not packed: their bit
// positions (15, 19, 23) are the ones already written from top_nz_[3],
// top_nz_[5] and top_nz_[7].
void VP8IteratorBytesToNz(VP8EncIterator* const it) {
  // Bit positions for top_nz_[0..8]: Y (4), U (2), V (2), then DC.
  static const uint8_t kTopBit[9] = { 12, 13, 14, 15, 18, 19, 22, 23, 24 };
  const int* const top_nz = it->top_nz_;
  const int* const left_nz = it->left_nz_;
  uint32_t nz = 0;
  int i;

  // top (entry #8 propagates the _top_ DC bit, esp. for intra4)
  for (i = 0; i < 9; ++i) {
    nz |= (top_nz[i] << kTopBit[i]);
  }
  // left
  nz |= (left_nz[0] << 3);
  nz |= (left_nz[1] << 7);
  nz |= (left_nz[2] << 11);
  nz |= (left_nz[4] << 17);
  nz |= (left_nz[6] << 21);

  *it->nz_ = nz;
}
284*b2055c35SXin Li
285*b2055c35SXin Li #undef BIT
286*b2055c35SXin Li
287*b2055c35SXin Li //------------------------------------------------------------------------------
288*b2055c35SXin Li // Advance to the next position, doing the bookkeeping.
289*b2055c35SXin Li
// Saves the borders of the macroblock held in it->yuv_out_ so that they can
// serve as prediction context for the following macroblocks:
//  - unless this is the last macroblock of the row, its rightmost column
//    becomes the 'left' samples, and the last 'top' samples become the
//    top-left corners;
//  - unless this is the last row, its bottom row becomes the 'top' samples.
// The corners must be read before the 'top' samples are overwritten.
void VP8IteratorSaveBoundary(VP8EncIterator* const it) {
  VP8Encoder* const enc = it->enc_;
  const int mb_x = it->x_, mb_y = it->y_;
  const uint8_t* const ysrc = it->yuv_out_ + Y_OFF_ENC;
  const uint8_t* const uvsrc = it->yuv_out_ + U_OFF_ENC;

  if (mb_x < enc->mb_w_ - 1) {   // left
    int row;
    for (row = 0; row < 16; ++row) {
      const uint8_t* const y_row = ysrc + row * BPS;
      it->y_left_[row] = y_row[15];
    }
    // U occupies columns 0..7 and V columns 8..15 of the same cache rows.
    for (row = 0; row < 8; ++row) {
      const uint8_t* const uv_row = uvsrc + row * BPS;
      it->u_left_[row] = uv_row[7];
      it->v_left_[row] = uv_row[15];
    }
    // top-left (before 'top'!)
    it->y_left_[-1] = it->y_top_[15];
    it->u_left_[-1] = it->uv_top_[7];
    it->v_left_[-1] = it->uv_top_[15];
  }
  if (mb_y < enc->mb_h_ - 1) {   // top
    memcpy(it->y_top_, ysrc + 15 * BPS, 16);
    memcpy(it->uv_top_, uvsrc + 7 * BPS, 8 + 8);
  }
}
314*b2055c35SXin Li
// Moves the iterator to the next macroblock in raster order and decrements
// the count-down. Reaching the end of a row switches to the start of the
// next one. Returns 1 while macroblocks remain to be visited, 0 otherwise.
int VP8IteratorNext(VP8EncIterator* const it) {
  it->x_ += 1;
  if (it->x_ != it->enc_->mb_w_) {
    // Same row: step every per-macroblock cursor.
    it->mb_ += 1;
    it->nz_ += 1;
    it->preds_ += 4;
    it->y_top_ += 16;
    it->uv_top_ += 16;
  } else {
    // End of row: restart at the beginning of the next one.
    VP8IteratorSetRow(it, it->y_ + 1);
  }
  it->count_down_ -= 1;
  return (it->count_down_ > 0);
}
327*b2055c35SXin Li
328*b2055c35SXin Li //------------------------------------------------------------------------------
329*b2055c35SXin Li // Helper function to set mode properties
330*b2055c35SXin Li
VP8SetIntra16Mode(const VP8EncIterator * const it,int mode)331*b2055c35SXin Li void VP8SetIntra16Mode(const VP8EncIterator* const it, int mode) {
332*b2055c35SXin Li uint8_t* preds = it->preds_;
333*b2055c35SXin Li int y;
334*b2055c35SXin Li for (y = 0; y < 4; ++y) {
335*b2055c35SXin Li memset(preds, mode, 4);
336*b2055c35SXin Li preds += it->enc_->preds_w_;
337*b2055c35SXin Li }
338*b2055c35SXin Li it->mb_->type_ = 1;
339*b2055c35SXin Li }
340*b2055c35SXin Li
VP8SetIntra4Mode(const VP8EncIterator * const it,const uint8_t * modes)341*b2055c35SXin Li void VP8SetIntra4Mode(const VP8EncIterator* const it, const uint8_t* modes) {
342*b2055c35SXin Li uint8_t* preds = it->preds_;
343*b2055c35SXin Li int y;
344*b2055c35SXin Li for (y = 4; y > 0; --y) {
345*b2055c35SXin Li memcpy(preds, modes, 4 * sizeof(*modes));
346*b2055c35SXin Li preds += it->enc_->preds_w_;
347*b2055c35SXin Li modes += 4;
348*b2055c35SXin Li }
349*b2055c35SXin Li it->mb_->type_ = 0;
350*b2055c35SXin Li }
351*b2055c35SXin Li
VP8SetIntraUVMode(const VP8EncIterator * const it,int mode)352*b2055c35SXin Li void VP8SetIntraUVMode(const VP8EncIterator* const it, int mode) {
353*b2055c35SXin Li it->mb_->uv_mode_ = mode;
354*b2055c35SXin Li }
355*b2055c35SXin Li
VP8SetSkip(const VP8EncIterator * const it,int skip)356*b2055c35SXin Li void VP8SetSkip(const VP8EncIterator* const it, int skip) {
357*b2055c35SXin Li it->mb_->skip_ = skip;
358*b2055c35SXin Li }
359*b2055c35SXin Li
VP8SetSegment(const VP8EncIterator * const it,int segment)360*b2055c35SXin Li void VP8SetSegment(const VP8EncIterator* const it, int segment) {
361*b2055c35SXin Li it->mb_->segment_ = segment;
362*b2055c35SXin Li }
363*b2055c35SXin Li
364*b2055c35SXin Li //------------------------------------------------------------------------------
365*b2055c35SXin Li // Intra4x4 sub-blocks iteration
366*b2055c35SXin Li //
367*b2055c35SXin Li // We store and update the boundary samples into an array of 37 pixels. They
368*b2055c35SXin Li // are updated as we iterate and reconstruct each intra4x4 block in turn.
369*b2055c35SXin Li // The position of the samples has the following snake pattern:
370*b2055c35SXin Li //
371*b2055c35SXin Li // 16|17 18 19 20|21 22 23 24|25 26 27 28|29 30 31 32|33 34 35 36 <- Top-right
372*b2055c35SXin Li // --+-----------+-----------+-----------+-----------+
373*b2055c35SXin Li // 15| 19| 23| 27| 31|
374*b2055c35SXin Li // 14| 18| 22| 26| 30|
375*b2055c35SXin Li // 13| 17| 21| 25| 29|
376*b2055c35SXin Li // 12|13 14 15 16|17 18 19 20|21 22 23 24|25 26 27 28|
377*b2055c35SXin Li // --+-----------+-----------+-----------+-----------+
378*b2055c35SXin Li // 11| 15| 19| 23| 27|
379*b2055c35SXin Li // 10| 14| 18| 22| 26|
380*b2055c35SXin Li // 9| 13| 17| 21| 25|
381*b2055c35SXin Li // 8| 9 10 11 12|13 14 15 16|17 18 19 20|21 22 23 24|
382*b2055c35SXin Li // --+-----------+-----------+-----------+-----------+
383*b2055c35SXin Li // 7| 11| 15| 19| 23|
384*b2055c35SXin Li // 6| 10| 14| 18| 22|
385*b2055c35SXin Li // 5| 9| 13| 17| 21|
386*b2055c35SXin Li // 4| 5 6 7 8| 9 10 11 12|13 14 15 16|17 18 19 20|
387*b2055c35SXin Li // --+-----------+-----------+-----------+-----------+
388*b2055c35SXin Li // 3| 7| 11| 15| 19|
389*b2055c35SXin Li // 2| 6| 10| 14| 18|
390*b2055c35SXin Li // 1| 5| 9| 13| 17|
391*b2055c35SXin Li // 0| 1 2 3 4| 5 6 7 8| 9 10 11 12|13 14 15 16|
392*b2055c35SXin Li // --+-----------+-----------+-----------+-----------+
393*b2055c35SXin Li
// For each of the 16 intra4x4 sub-blocks (raster order), index in the
// boundary array of the first 'top' sample to pass to the prediction
// functions in dsp.c. Moving one sub-block to the right adds 4 to the index;
// moving one sub-block down subtracts 4.
static const uint8_t VP8TopLeftI4[16] = {
  17, 21, 25, 29,   // sub-blocks  0 ..  3
  13, 17, 21, 25,   // sub-blocks  4 ..  7
   9, 13, 17, 21,   // sub-blocks  8 .. 11
   5,  9, 13, 17    // sub-blocks 12 .. 15
};
402*b2055c35SXin Li
// Prepares the iteration over the 16 intra4x4 sub-blocks of the current
// macroblock: selects sub-block #0, fills the 37-sample boundary array from
// the macroblock's left / top-left / top / top-right samples, and imports the
// non-zero context.
// Boundary layout: [0..15] left samples stored bottom-up, [16] top-left,
// [17..32] top, [33..36] top-right.
void VP8IteratorStartI4(VP8EncIterator* const it) {
  const VP8Encoder* const enc = it->enc_;
  uint8_t* const boundary = it->i4_boundary_;
  uint8_t* const top = boundary + 17;
  int k;

  it->i4_ = 0;    // first 4x4 sub-block
  it->i4_top_ = boundary + VP8TopLeftI4[0];

  // Left column and top-left corner (k == -1), in reverse order.
  for (k = -1; k < 16; ++k) {
    boundary[15 - k] = it->y_left_[k];
  }
  // Top row.
  memcpy(top, it->y_top_, 16);
  // Top-right samples have a special case on the far right of the picture.
  if (it->x_ < enc->mb_w_ - 1) {
    memcpy(top + 16, it->y_top_ + 16, 4);
  } else {    // else, replicate the last valid pixel four times
    memset(top + 16, top[15], 4);
  }
  VP8IteratorNzToBytes(it);   // import the non-zero context
}
429*b2055c35SXin Li
// Updates the intra4x4 boundary array with the samples of the sub-block that
// was just reconstructed in 'yuv_out', then moves on to the next sub-block.
// Returns 0 once all 16 sub-blocks have been visited, 1 otherwise.
int VP8IteratorRotateI4(VP8EncIterator* const it,
                        const uint8_t* const yuv_out) {
  const uint8_t* const blk = yuv_out + VP8Scan[it->i4_];
  uint8_t* const top = it->i4_top_;
  const int is_last_column = ((it->i4_ & 3) == 3);  // sub-blocks #3,#7,#11,#15

  // Update the cache with 7 fresh samples.
  // The bottom row of the sub-block: future top samples.
  memcpy(top - 4, blk + 3 * BPS, 4);
  if (is_last_column) {
    // Replicate the top-right samples, as the specs say.
    memcpy(top, top + 4, 4);
  } else {
    // The right column (minus its last sample), bottom-up: future left samples.
    top[0] = blk[3 + 2 * BPS];
    top[1] = blk[3 + 1 * BPS];
    top[2] = blk[3 + 0 * BPS];
  }

  // Move to the next sub-block.
  it->i4_ += 1;
  if (it->i4_ != 16) {
    it->i4_top_ = it->i4_boundary_ + VP8TopLeftI4[it->i4_];
    return 1;
  }
  return 0;   // we're done
}
458*b2055c35SXin Li
459*b2055c35SXin Li //------------------------------------------------------------------------------
460