xref: /aosp_15_r20/external/webp/src/dec/io_dec.c (revision b2055c353e87c8814eb2b6b1b11112a1562253bd)
1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // functions for sample output.
11*b2055c35SXin Li //
12*b2055c35SXin Li // Author: Skal ([email protected])
13*b2055c35SXin Li 
14*b2055c35SXin Li #include <assert.h>
15*b2055c35SXin Li #include <stdlib.h>
16*b2055c35SXin Li #include "src/dec/vp8i_dec.h"
17*b2055c35SXin Li #include "src/dec/webpi_dec.h"
18*b2055c35SXin Li #include "src/dsp/dsp.h"
19*b2055c35SXin Li #include "src/dsp/yuv.h"
20*b2055c35SXin Li #include "src/utils/utils.h"
21*b2055c35SXin Li 
22*b2055c35SXin Li //------------------------------------------------------------------------------
23*b2055c35SXin Li // Main YUV<->RGB conversion functions
24*b2055c35SXin Li 
// Copies the current batch of decoded Y, U and V rows into the caller's YUVA
// output buffer without any colorspace conversion.
// Returns the number of luma rows written (io->mb_h).
static int EmitYUV(const VP8Io* const io, WebPDecParams* const p) {
  const WebPYUVABuffer* const yuva = &p->output->u.YUVA;
  const int width = io->mb_w;
  const int height = io->mb_h;
  // The chroma planes hold half as many samples in each direction, rounded up.
  const int chroma_width = (width + 1) / 2;
  const int chroma_height = (height + 1) / 2;
  const size_t luma_row = (size_t)io->mb_y;
  const size_t chroma_row = (size_t)(io->mb_y >> 1);

  WebPCopyPlane(io->y, io->y_stride,
                yuva->y + luma_row * yuva->y_stride, yuva->y_stride,
                width, height);
  WebPCopyPlane(io->u, io->uv_stride,
                yuva->u + chroma_row * yuva->u_stride, yuva->u_stride,
                chroma_width, chroma_height);
  WebPCopyPlane(io->v, io->uv_stride,
                yuva->v + chroma_row * yuva->v_stride, yuva->v_stride,
                chroma_width, chroma_height);
  return height;
}
40*b2055c35SXin Li 
41*b2055c35SXin Li // Point-sampling U/V sampler.
EmitSampledRGB(const VP8Io * const io,WebPDecParams * const p)42*b2055c35SXin Li static int EmitSampledRGB(const VP8Io* const io, WebPDecParams* const p) {
43*b2055c35SXin Li   WebPDecBuffer* const output = p->output;
44*b2055c35SXin Li   WebPRGBABuffer* const buf = &output->u.RGBA;
45*b2055c35SXin Li   uint8_t* const dst = buf->rgba + (size_t)io->mb_y * buf->stride;
46*b2055c35SXin Li   WebPSamplerProcessPlane(io->y, io->y_stride,
47*b2055c35SXin Li                           io->u, io->v, io->uv_stride,
48*b2055c35SXin Li                           dst, buf->stride, io->mb_w, io->mb_h,
49*b2055c35SXin Li                           WebPSamplers[output->colorspace]);
50*b2055c35SXin Li   return io->mb_h;
51*b2055c35SXin Li }
52*b2055c35SXin Li 
53*b2055c35SXin Li //------------------------------------------------------------------------------
54*b2055c35SXin Li // Fancy upsampling
55*b2055c35SXin Li 
56*b2055c35SXin Li #ifdef FANCY_UPSAMPLING
// Converts the current batch of YUV rows to RGB(A) with the line-pair
// upsampler registered for the output colorspace.
// The upsampler works on pairs of rows, so the last luma row of a batch is
// kept in p->tmp_y / p->tmp_u / p->tmp_v and finished during the next call,
// unless this batch reaches the bottom of the cropped area.
// Returns io->mb_h, plus one when a row left over from the previous call was
// completed, minus one when a row is left pending for the next call.
static int EmitFancyRGB(const VP8Io* const io, WebPDecParams* const p) {
  const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
  const WebPUpsampleLinePairFunc upsample_pair =
      WebPUpsamplers[p->output->colorspace];
  const int width = io->mb_w;
  const int chroma_width = (width + 1) / 2;
  const int row_end = io->mb_y + io->mb_h;
  // True when this batch reaches (or passes) the bottom of the cropped area.
  const int is_last_batch = (io->crop_top + row_end >= io->crop_bottom);
  const uint8_t* y_row = io->y;
  const uint8_t* u_row = io->u;
  const uint8_t* v_row = io->v;
  uint8_t* out_row = rgba->rgba + (size_t)io->mb_y * rgba->stride;
  int lines_out = io->mb_h;   // adjusted below
  int row;

  if (io->mb_y == 0) {
    // Very first row of the picture: there is no row above, so the u/v
    // samples are mirrored at the boundary.
    upsample_pair(y_row, NULL, u_row, v_row, u_row, v_row,
                  out_row, NULL, width);
  } else {
    // Finish the row that the previous call had to leave pending.
    upsample_pair(p->tmp_y, y_row, p->tmp_u, p->tmp_v, u_row, v_row,
                  out_row - rgba->stride, out_row, width);
    ++lines_out;
  }

  // Process the remaining rows two at a time.
  for (row = io->mb_y; row + 2 < row_end; row += 2) {
    const uint8_t* const above_u = u_row;
    const uint8_t* const above_v = v_row;
    u_row += io->uv_stride;
    v_row += io->uv_stride;
    out_row += 2 * rgba->stride;
    y_row += 2 * io->y_stride;
    upsample_pair(y_row - io->y_stride, y_row,
                  above_u, above_v, u_row, v_row,
                  out_row - rgba->stride, out_row, width);
  }

  // Step to the last luma row of this batch.
  y_row += io->y_stride;
  if (!is_last_batch) {
    // More rows will follow: stash the unfinished samples for the next call.
    memcpy(p->tmp_y, y_row, width * sizeof(*p->tmp_y));
    memcpy(p->tmp_u, u_row, chroma_width * sizeof(*p->tmp_u));
    memcpy(p->tmp_v, v_row, chroma_width * sizeof(*p->tmp_v));
    // One row stays pending, so one fewer row is reported.
    --lines_out;
  } else if ((row_end & 1) == 0) {
    // Last row of an even-sized picture: emit it with mirrored u/v samples.
    upsample_pair(y_row, NULL, u_row, v_row, u_row, v_row,
                  out_row + rgba->stride, NULL, width);
  }
  return lines_out;
}
112*b2055c35SXin Li 
113*b2055c35SXin Li #endif    /* FANCY_UPSAMPLING */
114*b2055c35SXin Li 
115*b2055c35SXin Li //------------------------------------------------------------------------------
116*b2055c35SXin Li 
// Sets 'h' rows of 'w' bytes each to 0xff (fully opaque), starting at 'dst'
// and advancing by 'stride' bytes from one row to the next.
static void FillAlphaPlane(uint8_t* dst, int w, int h, int stride) {
  int rows_left;
  for (rows_left = h; rows_left > 0; --rows_left) {
    memset(dst, 0xff, w * sizeof(*dst));
    dst += stride;
  }
}
124*b2055c35SXin Li 
// Writes the alpha rows of the current batch into the 'a' plane of the YUVA
// output buffer. When the bitstream carries no alpha (io->a is NULL) but the
// output has an alpha plane, that plane is filled with opaque values instead.
// 'expected_num_lines_out' is only checked by an assertion. Always returns 0.
static int EmitAlphaYUV(const VP8Io* const io, WebPDecParams* const p,
                        int expected_num_lines_out) {
  const WebPYUVABuffer* const yuva = &p->output->u.YUVA;
  const int width = io->mb_w;
  const int height = io->mb_h;
  uint8_t* out_row = yuva->a + (size_t)io->mb_y * yuva->a_stride;
  (void)expected_num_lines_out;
  assert(expected_num_lines_out == height);
  if (io->a == NULL) {
    if (yuva->a != NULL) {
      // Alpha was requested but the picture has none: make it opaque.
      FillAlphaPlane(out_row, width, height, yuva->a_stride);
    }
  } else {
    const uint8_t* src_row = io->a;
    int rows_left;
    // Source alpha rows are io->width bytes apart.
    for (rows_left = height; rows_left > 0; --rows_left) {
      memcpy(out_row, src_row, width * sizeof(*out_row));
      src_row += io->width;
      out_row += yuva->a_stride;
    }
  }
  return 0;
}
147*b2055c35SXin Li 
GetAlphaSourceRow(const VP8Io * const io,const uint8_t ** alpha,int * const num_rows)148*b2055c35SXin Li static int GetAlphaSourceRow(const VP8Io* const io,
149*b2055c35SXin Li                              const uint8_t** alpha, int* const num_rows) {
150*b2055c35SXin Li   int start_y = io->mb_y;
151*b2055c35SXin Li   *num_rows = io->mb_h;
152*b2055c35SXin Li 
153*b2055c35SXin Li   // Compensate for the 1-line delay of the fancy upscaler.
154*b2055c35SXin Li   // This is similar to EmitFancyRGB().
155*b2055c35SXin Li   if (io->fancy_upsampling) {
156*b2055c35SXin Li     if (start_y == 0) {
157*b2055c35SXin Li       // We don't process the last row yet. It'll be done during the next call.
158*b2055c35SXin Li       --*num_rows;
159*b2055c35SXin Li     } else {
160*b2055c35SXin Li       --start_y;
161*b2055c35SXin Li       // Fortunately, *alpha data is persistent, so we can go back
162*b2055c35SXin Li       // one row and finish alpha blending, now that the fancy upscaler
163*b2055c35SXin Li       // completed the YUV->RGB interpolation.
164*b2055c35SXin Li       *alpha -= io->width;
165*b2055c35SXin Li     }
166*b2055c35SXin Li     if (io->crop_top + io->mb_y + io->mb_h == io->crop_bottom) {
167*b2055c35SXin Li       // If it's the very last call, we process all the remaining rows!
168*b2055c35SXin Li       *num_rows = io->crop_bottom - io->crop_top - start_y;
169*b2055c35SXin Li     }
170*b2055c35SXin Li   }
171*b2055c35SXin Li   return start_y;
172*b2055c35SXin Li }
173*b2055c35SXin Li 
// Writes the alpha values of the current batch into the alpha channel of the
// RGBA output buffer and, for premultiplied colorspaces, multiplies the color
// samples by alpha when some non-trivial alpha was written.
// Does nothing when the picture has no alpha (io->a is NULL).
// 'expected_num_lines_out' is only checked by an assertion. Always returns 0.
static int EmitAlphaRGB(const VP8Io* const io, WebPDecParams* const p,
                        int expected_num_lines_out) {
  const uint8_t* alpha_src = io->a;
  (void)expected_num_lines_out;
  if (alpha_src != NULL) {
    const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
    const WEBP_CSP_MODE mode = p->output->colorspace;
    // The alpha byte comes first for ARGB-ordered modes, at offset 3 otherwise.
    const int alpha_first = (mode == MODE_ARGB) || (mode == MODE_Argb);
    const int alpha_offset = alpha_first ? 0 : 3;
    const int width = io->mb_w;
    int num_rows;
    const size_t first_row = GetAlphaSourceRow(io, &alpha_src, &num_rows);
    uint8_t* const row_base = rgba->rgba + first_row * rgba->stride;
    // Non-zero if there is non-trivial alpha to premultiply with.
    const int needs_premultiply =
        WebPDispatchAlpha(alpha_src, io->width, width, num_rows,
                          row_base + alpha_offset, rgba->stride);
    assert(expected_num_lines_out == num_rows);
    if (needs_premultiply && WebPIsPremultipliedMode(mode)) {
      WebPApplyAlphaMultiply(row_base, alpha_first,
                             width, num_rows, rgba->stride);
    }
  }
  return 0;
}
199*b2055c35SXin Li 
// Same purpose as EmitAlphaRGB(), for the 16-bit RGBA4444 output layouts:
// stores the top 4 bits of every alpha sample into the low nibble of the byte
// that holds alpha, then premultiplies if the colorspace asks for it and at
// least one sample was not fully opaque.
// Does nothing when the picture has no alpha (io->a is NULL).
// 'expected_num_lines_out' is only checked by an assertion. Always returns 0.
static int EmitAlphaRGBA4444(const VP8Io* const io, WebPDecParams* const p,
                             int expected_num_lines_out) {
  const uint8_t* src_row = io->a;
  (void)expected_num_lines_out;
  if (src_row != NULL) {
    const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
    const WEBP_CSP_MODE mode = p->output->colorspace;
    const int width = io->mb_w;
    int num_rows;
    const size_t first_row = GetAlphaSourceRow(io, &src_row, &num_rows);
    uint8_t* const row_base = rgba->rgba + first_row * rgba->stride;
    // Which byte of each 2-byte pixel carries alpha depends on the byte swap.
#if (WEBP_SWAP_16BIT_CSP == 1)
    uint8_t* out_row = row_base;
#else
    uint8_t* out_row = row_base + 1;
#endif
    // Stays 0x0f only while every alpha nibble seen so far is 0x0f (opaque).
    uint32_t opaque_mask = 0x0f;
    int x, y;
    for (y = 0; y < num_rows; ++y) {
      for (x = 0; x < width; ++x) {
        uint8_t* const px = out_row + 2 * x;
        // Keep the high nibble, replace the low one with 4-bit alpha.
        const uint32_t alpha4 = src_row[x] >> 4;
        *px = (*px & 0xf0) | alpha4;
        opaque_mask &= alpha4;
      }
      src_row += io->width;
      out_row += rgba->stride;
    }
    assert(expected_num_lines_out == num_rows);
    if (opaque_mask != 0x0f && WebPIsPremultipliedMode(mode)) {
      WebPApplyAlphaMultiply4444(row_base, width, num_rows, rgba->stride);
    }
  }
  return 0;
}
235*b2055c35SXin Li 
236*b2055c35SXin Li //------------------------------------------------------------------------------
237*b2055c35SXin Li // YUV rescaling (no final RGB conversion needed)
238*b2055c35SXin Li 
239*b2055c35SXin Li #if !defined(WEBP_REDUCE_SIZE)
// Feeds 'new_lines' source rows (starting at 'src', 'src_stride' bytes apart)
// into the rescaler 'wrk', exporting output rows as they become available.
// Returns the total number of output rows exported.
static int Rescale(const uint8_t* src, int src_stride,
                   int new_lines, WebPRescaler* const wrk) {
  int num_lines_out = 0;
  while (new_lines > 0) {    // import new contributions of source rows.
    const int lines_in = WebPRescalerImport(wrk, new_lines, src, src_stride);
    // Widen before multiplying so the byte offset is not computed in 'int'.
    src += (int64_t)lines_in * src_stride;
    new_lines -= lines_in;
    num_lines_out += WebPRescalerExport(wrk);    // emit output row(s)
  }
  return num_lines_out;
}
251*b2055c35SXin Li 
// Pushes the current batch of Y, U and V rows through their rescalers, which
// write into the YUVA output buffer.
// Returns the number of luma rows produced by the Y rescaler.
static int EmitRescaledYUV(const VP8Io* const io, WebPDecParams* const p) {
  const int luma_rows = io->mb_h;
  const int chroma_rows = (luma_rows + 1) >> 1;
  WebPRescaler* const luma_scaler = p->scaler_y;
  int luma_lines_out;

  if (WebPIsAlphaMode(p->output->colorspace) && io->a != NULL) {
    // Premultiply the luma in place, inside the decoder's io->y buffer,
    // before rescaling. This is fine because these samples are not used for
    // intra-prediction (the top samples are saved in cache_y_/u_/v_), but it
    // requires casting the const away.
    WebPMultRows((uint8_t*)io->y, io->y_stride,
                 io->a, io->width, io->mb_w, luma_rows, 0);
  }
  luma_lines_out = Rescale(io->y, io->y_stride, luma_rows, luma_scaler);
  Rescale(io->u, io->uv_stride, chroma_rows, p->scaler_u);
  Rescale(io->v, io->uv_stride, chroma_rows, p->scaler_v);
  return luma_lines_out;
}
270*b2055c35SXin Li 
// Rescales the alpha rows of the current batch into the 'a' plane of the YUVA
// output (starting at row p->last_y) and then un-multiplies the luma rows
// that EmitRescaledYUV() premultiplied. When the picture has no alpha but the
// output has an alpha plane, that plane is filled with opaque values instead.
// Always returns 0.
static int EmitRescaledAlphaYUV(const VP8Io* const io, WebPDecParams* const p,
                                int expected_num_lines_out) {
  const WebPYUVABuffer* const yuva = &p->output->u.YUVA;
  const size_t first_row = (size_t)p->last_y;
  uint8_t* const alpha_out = yuva->a + first_row * yuva->a_stride;

  if (io->a == NULL) {
    if (yuva->a != NULL) {
      // Alpha was requested but the picture has none: make it opaque.
      assert(p->last_y + expected_num_lines_out <= io->scaled_height);
      FillAlphaPlane(alpha_out, io->scaled_width, expected_num_lines_out,
                     yuva->a_stride);
    }
  } else {
    uint8_t* const luma_out = yuva->y + first_row * yuva->y_stride;
    const int lines = Rescale(io->a, io->width, io->mb_h, p->scaler_a);
    assert(expected_num_lines_out == lines);
    if (lines > 0) {   // unmultiply the Y
      WebPMultRows(luma_out, yuva->y_stride, alpha_out, yuva->a_stride,
                   p->scaler_a->dst_width, lines, 1);
    }
  }
  return 0;
}
291*b2055c35SXin Li 
// Allocates and initializes the Y, U and V rescalers (plus an alpha rescaler
// when the output colorspace has alpha) so that decoded rows are scaled
// straight into the YUVA output buffer, then installs EmitRescaledYUV and,
// with alpha, EmitRescaledAlphaYUV as the emit callbacks.
//
// A single allocation (p->memory) holds, in order:
//   - the rescaler_t work areas: luma, u, v and (optionally) alpha,
//   - the aligned array of WebPRescaler objects at the tail.
//
// Returns 1 on success; 0 if the total size overflows, if the allocation
// fails or if a rescaler cannot be initialized.
// NOTE(review): when WebPRescalerInit() fails, p->memory stays allocated;
// presumably the teardown path releases it -- confirm against the caller.
static int InitYUVRescaler(const VP8Io* const io, WebPDecParams* const p) {
  const int has_alpha = WebPIsAlphaMode(p->output->colorspace);
  const WebPYUVABuffer* const buf = &p->output->u.YUVA;
  const int out_width  = io->scaled_width;
  const int out_height = io->scaled_height;
  const int uv_out_width  = (out_width + 1) >> 1;
  const int uv_out_height = (out_height + 1) >> 1;
  const int uv_in_width  = (io->mb_w + 1) >> 1;
  const int uv_in_height = (io->mb_h + 1) >> 1;
  // scratch memory for luma rescaler
  const size_t work_size = 2 * (size_t)out_width;
  // and for each u/v ones. Widen before multiplying, as done for 'work_size',
  // so that the product is never evaluated in 'int'.
  const size_t uv_work_size = 2 * (size_t)uv_out_width;
  uint64_t total_size;
  size_t rescaler_size;
  rescaler_t* work;
  WebPRescaler* scalers;
  const int num_rescalers = has_alpha ? 4 : 3;

  total_size = ((uint64_t)work_size + 2 * uv_work_size) * sizeof(*work);
  if (has_alpha) {
    // The alpha rescaler needs a work area as large as the luma one.
    total_size += (uint64_t)work_size * sizeof(*work);
  }
  // Room for the rescaler objects themselves, plus slack for alignment.
  rescaler_size = num_rescalers * sizeof(*p->scaler_y) + WEBP_ALIGN_CST;
  total_size += rescaler_size;
  if (!CheckSizeOverflow(total_size)) {
    return 0;
  }

  p->memory = WebPSafeMalloc(1ULL, (size_t)total_size);
  if (p->memory == NULL) {
    return 0;   // memory error
  }
  work = (rescaler_t*)p->memory;

  // The rescaler objects live in the last 'rescaler_size' bytes, aligned up.
  scalers = (WebPRescaler*)WEBP_ALIGN(
      (const uint8_t*)work + total_size - rescaler_size);
  p->scaler_y = &scalers[0];
  p->scaler_u = &scalers[1];
  p->scaler_v = &scalers[2];
  p->scaler_a = has_alpha ? &scalers[3] : NULL;

  if (!WebPRescalerInit(p->scaler_y, io->mb_w, io->mb_h,
                        buf->y, out_width, out_height, buf->y_stride, 1,
                        work) ||
      !WebPRescalerInit(p->scaler_u, uv_in_width, uv_in_height,
                        buf->u, uv_out_width, uv_out_height, buf->u_stride, 1,
                        work + work_size) ||
      !WebPRescalerInit(p->scaler_v, uv_in_width, uv_in_height,
                        buf->v, uv_out_width, uv_out_height, buf->v_stride, 1,
                        work + work_size + uv_work_size)) {
    return 0;
  }
  p->emit = EmitRescaledYUV;

  if (has_alpha) {
    if (!WebPRescalerInit(p->scaler_a, io->mb_w, io->mb_h,
                          buf->a, out_width, out_height, buf->a_stride, 1,
                          work + work_size + 2 * uv_work_size)) {
      return 0;
    }
    p->emit_alpha = EmitRescaledAlphaYUV;
    WebPInitAlphaProcessing();
  }
  return 1;
}
357*b2055c35SXin Li 
358*b2055c35SXin Li //------------------------------------------------------------------------------
359*b2055c35SXin Li // RGBA rescaling
360*b2055c35SXin Li 
// Exports every row that both the Y and U rescalers have pending, converts
// each exported Y/U/V row triple to the output colorspace and stores it in the
// RGBA buffer, starting at output row 'y_pos'.
// Returns the number of rows written.
static int ExportRGB(WebPDecParams* const p, int y_pos) {
  const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
  const WebPYUV444Converter to_rgb =
      WebPYUV444Converters[p->output->colorspace];
  uint8_t* out_row = rgba->rgba + (size_t)y_pos * rgba->stride;
  int lines = 0;
  // Because of the YUV420 layout, the U/V scan position can be one line ahead
  // of or behind the Y one, hence the test on both rescalers.
  while (WebPRescalerHasPendingOutput(p->scaler_y) &&
         WebPRescalerHasPendingOutput(p->scaler_u)) {
    assert(y_pos + lines < p->output->height);
    assert(p->scaler_u->y_accum == p->scaler_v->y_accum);
    WebPRescalerExportRow(p->scaler_y);
    WebPRescalerExportRow(p->scaler_u);
    WebPRescalerExportRow(p->scaler_v);
    to_rgb(p->scaler_y->dst, p->scaler_u->dst, p->scaler_v->dst,
           out_row, p->scaler_y->dst_width);
    out_row += rgba->stride;
    lines += 1;
  }
  return lines;
}
383*b2055c35SXin Li 
// Feeds the current batch of Y, U and V rows into their rescalers and writes
// out, through ExportRGB(), every RGB row that becomes available, starting at
// output row p->last_y.
// Returns the number of output rows written.
static int EmitRescaledRGB(const VP8Io* const io, WebPDecParams* const p) {
  const int luma_rows = io->mb_h;
  const int chroma_rows = (luma_rows + 1) >> 1;
  int luma_done = 0;
  int chroma_done = 0;
  int lines_out = 0;

  while (luma_done < luma_rows) {
    const int luma_in =
        WebPRescalerImport(p->scaler_y, luma_rows - luma_done,
                           io->y + (size_t)luma_done * io->y_stride,
                           io->y_stride);
    const int chroma_left = chroma_rows - chroma_done;
    luma_done += luma_in;
    if (WebPRescaleNeededLines(p->scaler_u, chroma_left)) {
      const size_t chroma_offset = (size_t)chroma_done * io->uv_stride;
      const int u_in = WebPRescalerImport(
          p->scaler_u, chroma_left, io->u + chroma_offset, io->uv_stride);
      const int v_in = WebPRescalerImport(
          p->scaler_v, chroma_left, io->v + chroma_offset, io->uv_stride);
      (void)v_in;   // remove a gcc warning
      assert(u_in == v_in);
      chroma_done += u_in;
    }
    lines_out += ExportRGB(p, p->last_y + lines_out);
  }
  return lines_out;
}
409*b2055c35SXin Li 
// Exports up to 'max_lines_out' pending rows from the alpha rescaler into the
// alpha channel of the RGBA output, starting at output row 'y_pos'. For
// premultiplied colorspaces, the written rows are then multiplied by alpha if
// WebPDispatchAlpha() reported a non-zero result for any of them.
// Returns the number of rows written.
static int ExportAlpha(WebPDecParams* const p, int y_pos, int max_lines_out) {
  const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
  const WEBP_CSP_MODE mode = p->output->colorspace;
  // The alpha byte comes first for ARGB-ordered modes, at offset 3 otherwise.
  const int alpha_first = (mode == MODE_ARGB) || (mode == MODE_Argb);
  const int premultiply = WebPIsPremultipliedMode(mode);
  const int row_width = p->scaler_a->dst_width;
  uint8_t* const first_row = rgba->rgba + (size_t)y_pos * rgba->stride;
  uint8_t* alpha_out = first_row + (alpha_first ? 0 : 3);
  uint32_t saw_non_opaque = 0;
  int lines = 0;

  while (WebPRescalerHasPendingOutput(p->scaler_a) &&
         lines < max_lines_out) {
    assert(y_pos + lines < p->output->height);
    WebPRescalerExportRow(p->scaler_a);
    // One row at a time, so both strides are passed as 0.
    saw_non_opaque |=
        WebPDispatchAlpha(p->scaler_a->dst, 0, row_width, 1, alpha_out, 0);
    alpha_out += rgba->stride;
    lines += 1;
  }
  if (premultiply && saw_non_opaque) {
    WebPApplyAlphaMultiply(first_row, alpha_first,
                           row_width, lines, rgba->stride);
  }
  return lines;
}
436*b2055c35SXin Li 
// Same purpose as ExportAlpha(), for the 16-bit RGBA4444 output layouts:
// exports up to 'max_lines_out' pending alpha rows and stores the top 4 bits
// of each sample into the low nibble of the byte that holds alpha, starting at
// output row 'y_pos'. Premultiplies afterwards when the colorspace asks for it
// and at least one sample was not fully opaque.
// Returns the number of rows written.
static int ExportAlphaRGBA4444(WebPDecParams* const p, int y_pos,
                               int max_lines_out) {
  const WebPRGBABuffer* const rgba = &p->output->u.RGBA;
  const WEBP_CSP_MODE mode = p->output->colorspace;
  const int premultiply = WebPIsPremultipliedMode(mode);
  const int row_width = p->scaler_a->dst_width;
  uint8_t* const first_row = rgba->rgba + (size_t)y_pos * rgba->stride;
  // Which byte of each 2-byte pixel carries alpha depends on the byte swap.
#if (WEBP_SWAP_16BIT_CSP == 1)
  uint8_t* out_row = first_row;
#else
  uint8_t* out_row = first_row + 1;
#endif
  // Stays 0x0f only while every alpha nibble seen so far is 0x0f (opaque).
  uint32_t opaque_mask = 0x0f;
  int lines = 0;

  while (WebPRescalerHasPendingOutput(p->scaler_a) &&
         lines < max_lines_out) {
    int x;
    assert(y_pos + lines < p->output->height);
    WebPRescalerExportRow(p->scaler_a);
    for (x = 0; x < row_width; ++x) {
      uint8_t* const px = out_row + 2 * x;
      // Keep the high nibble, replace the low one with 4-bit alpha.
      const uint32_t alpha4 = p->scaler_a->dst[x] >> 4;
      *px = (*px & 0xf0) | alpha4;
      opaque_mask &= alpha4;
    }
    out_row += rgba->stride;
    lines += 1;
  }
  if (premultiply && opaque_mask != 0x0f) {
    WebPApplyAlphaMultiply4444(first_row, row_width, lines, rgba->stride);
  }
  return lines;
}
471*b2055c35SXin Li 
// Feeds the alpha rows of the current batch into the alpha rescaler and lets
// p->emit_alpha_row write the rescaled rows into the RGBA output, starting at
// row p->last_y, until 'expected_num_out_lines' rows have been produced.
// Does nothing when the picture has no alpha (io->a is NULL).
// Always returns 0.
static int EmitRescaledAlphaRGB(const VP8Io* const io, WebPDecParams* const p,
                                int expected_num_out_lines) {
  WebPRescaler* scaler;
  int lines_left = expected_num_out_lines;
  int y_pos;

  if (io->a == NULL) {
    return 0;
  }
  scaler = p->scaler_a;
  y_pos = p->last_y;
  while (lines_left > 0) {
    // Resume importing at the first source row the rescaler has not consumed
    // yet, expressed relative to the start of this batch.
    const int64_t row_offset = (int64_t)scaler->src_y - io->mb_y;
    const int rows_available = io->mb_h + io->mb_y - scaler->src_y;
    int exported;
    WebPRescalerImport(scaler, rows_available,
                       io->a + row_offset * io->width, io->width);
    exported = p->emit_alpha_row(p, y_pos, lines_left);
    y_pos += exported;
    lines_left -= exported;
  }
  return 0;
}
487*b2055c35SXin Li 
// Allocates and initializes the Y, U and V rescalers (plus an alpha rescaler
// when the output colorspace has alpha) for RGB output, then installs
// EmitRescaledRGB and, with alpha, EmitRescaledAlphaRGB together with the
// matching per-row alpha exporter.
//
// All rescalers, chroma included, produce rows of io->scaled_width samples
// into a temporary buffer that is converted to RGB afterwards.
// A single allocation (p->memory) holds, in order:
//   - one rescaler_t work area per rescaler,
//   - one temporary output row per rescaler,
//   - the aligned array of WebPRescaler objects at the tail.
//
// Returns 1 on success; 0 if the total size overflows, if the allocation
// fails or if a rescaler cannot be initialized.
static int InitRGBRescaler(const VP8Io* const io, WebPDecParams* const p) {
  const WEBP_CSP_MODE mode = p->output->colorspace;
  const int has_alpha = WebPIsAlphaMode(mode);
  const int num_rescalers = has_alpha ? 4 : 3;
  const int dst_width  = io->scaled_width;
  const int dst_height = io->scaled_height;
  const int chroma_src_width  = (io->mb_w + 1) >> 1;
  const int chroma_src_height = (io->mb_h + 1) >> 1;
  // scratch memory for one rescaler
  const size_t work_size = 2 * (size_t)dst_width;
  const uint64_t all_work_size = (uint64_t)num_rescalers * work_size;
  const uint64_t all_rows_size = (uint64_t)num_rescalers * dst_width;
  // Room for the rescaler objects themselves, plus slack for alignment.
  const size_t rescaler_size =
      num_rescalers * sizeof(*p->scaler_y) + WEBP_ALIGN_CST;
  rescaler_t* work;   // rescalers work area
  uint8_t* rows;      // scaled YUV444 samples, before RGB conversion
  WebPRescaler* scalers;
  uint64_t total_size;

  total_size = all_work_size * sizeof(*work) + all_rows_size * sizeof(*rows);
  total_size += rescaler_size;
  if (!CheckSizeOverflow(total_size)) {
    return 0;
  }

  p->memory = WebPSafeMalloc(1ULL, (size_t)total_size);
  if (p->memory == NULL) {
    return 0;   // memory error
  }
  work = (rescaler_t*)p->memory;
  rows = (uint8_t*)(work + all_work_size);

  // The rescaler objects live in the last 'rescaler_size' bytes, aligned up.
  scalers = (WebPRescaler*)WEBP_ALIGN(
      (const uint8_t*)work + total_size - rescaler_size);
  p->scaler_y = &scalers[0];
  p->scaler_u = &scalers[1];
  p->scaler_v = &scalers[2];
  p->scaler_a = has_alpha ? &scalers[3] : NULL;

  if (!WebPRescalerInit(p->scaler_y, io->mb_w, io->mb_h,
                        rows + 0 * dst_width, dst_width, dst_height, 0, 1,
                        work + 0 * work_size) ||
      !WebPRescalerInit(p->scaler_u, chroma_src_width, chroma_src_height,
                        rows + 1 * dst_width, dst_width, dst_height, 0, 1,
                        work + 1 * work_size) ||
      !WebPRescalerInit(p->scaler_v, chroma_src_width, chroma_src_height,
                        rows + 2 * dst_width, dst_width, dst_height, 0, 1,
                        work + 2 * work_size)) {
    return 0;
  }
  p->emit = EmitRescaledRGB;
  WebPInitYUV444Converters();

  if (has_alpha) {
    const int is_4444 = (mode == MODE_RGBA_4444) || (mode == MODE_rgbA_4444);
    if (!WebPRescalerInit(p->scaler_a, io->mb_w, io->mb_h,
                          rows + 3 * dst_width, dst_width, dst_height, 0, 1,
                          work + 3 * work_size)) {
      return 0;
    }
    p->emit_alpha = EmitRescaledAlphaRGB;
    // The 16-bit 4444 layouts need their own alpha exporter.
    p->emit_alpha_row = is_4444 ? ExportAlphaRGBA4444 : ExportAlpha;
    WebPInitAlphaProcessing();
  }
  return 1;
}
557*b2055c35SXin Li 
558*b2055c35SXin Li #endif  // WEBP_REDUCE_SIZE
559*b2055c35SXin Li 
560*b2055c35SXin Li //------------------------------------------------------------------------------
561*b2055c35SXin Li // Default custom functions
562*b2055c35SXin Li 
// VP8Io 'setup' hook. Clears the per-decode fields of the WebPDecParams
// stored in io->opaque, calls WebPIoInitFromOptions() on 'io', then picks the
// emit / emit_alpha callbacks according to the output colorspace and to
// whether rescaling or fancy upsampling is requested.
// Returns 1 on success. Returns 0 if WebPIoInitFromOptions() fails, on memory
// error, or if rescaling is requested but was compiled out (WEBP_REDUCE_SIZE).
static int CustomSetup(VP8Io* io) {
  WebPDecParams* const params = (WebPDecParams*)io->opaque;
  const WEBP_CSP_MODE csp = params->output->colorspace;
  const int to_rgb = WebPIsRGBMode(csp);
  const int with_alpha = WebPIsAlphaMode(csp);

  // Start from a clean slate: no scratch memory, no callbacks.
  params->emit_alpha_row = NULL;
  params->emit_alpha = NULL;
  params->emit = NULL;
  params->memory = NULL;

  // NOTE(review): MODE_YUV is passed when alpha is wanted and MODE_YUVA when
  // it is not, which looks swapped. Kept as-is; confirm how
  // WebPIoInitFromOptions() uses this argument before touching it.
  if (!WebPIoInitFromOptions(params->options, io,
                             with_alpha ? MODE_YUV : MODE_YUVA)) {
    return 0;
  }
  if (with_alpha && WebPIsPremultipliedMode(csp)) {
    WebPInitUpsamplers();
  }

  if (io->use_scaling) {
#if !defined(WEBP_REDUCE_SIZE)
    // The rescaler initializers are responsible for the whole setup here.
    if (to_rgb) {
      if (!InitRGBRescaler(io, params)) {
        return 0;    // memory error
      }
    } else {
      if (!InitYUVRescaler(io, params)) {
        return 0;    // memory error
      }
    }
    return 1;
#else
    return 0;   // rescaling support not compiled
#endif
  }

  // No rescaling from here on: choose the color emitter.
  if (!to_rgb) {
    params->emit = EmitYUV;
  } else {
    WebPInitSamplers();
    params->emit = EmitSampledRGB;   // default, may be replaced just below
#ifdef FANCY_UPSAMPLING
    if (io->fancy_upsampling) {
      // One scratch buffer holding a luma row followed by two chroma rows.
      const int uv_width = (io->mb_w + 1) >> 1;
      params->memory =
          WebPSafeMalloc(1ULL, (size_t)(io->mb_w + 2 * uv_width));
      if (params->memory == NULL) {
        return 0;   // memory error.
      }
      params->tmp_y = (uint8_t*)params->memory;
      params->tmp_u = params->tmp_y + io->mb_w;
      params->tmp_v = params->tmp_u + uv_width;
      params->emit = EmitFancyRGB;
      WebPInitUpsamplers();
    }
#endif
  }

  if (with_alpha) {  // need transparency output
    if (csp == MODE_RGBA_4444 || csp == MODE_rgbA_4444) {
      params->emit_alpha = EmitAlphaRGBA4444;
    } else if (to_rgb) {
      params->emit_alpha = EmitAlphaRGB;
    } else {
      params->emit_alpha = EmitAlphaYUV;
    }
    if (to_rgb) {
      WebPInitAlphaProcessing();
    }
  }

  return 1;
}
623*b2055c35SXin Li 
624*b2055c35SXin Li //------------------------------------------------------------------------------
625*b2055c35SXin Li 
CustomPut(const VP8Io * io)626*b2055c35SXin Li static int CustomPut(const VP8Io* io) {
627*b2055c35SXin Li   WebPDecParams* const p = (WebPDecParams*)io->opaque;
628*b2055c35SXin Li   const int mb_w = io->mb_w;
629*b2055c35SXin Li   const int mb_h = io->mb_h;
630*b2055c35SXin Li   int num_lines_out;
631*b2055c35SXin Li   assert(!(io->mb_y & 1));
632*b2055c35SXin Li 
633*b2055c35SXin Li   if (mb_w <= 0 || mb_h <= 0) {
634*b2055c35SXin Li     return 0;
635*b2055c35SXin Li   }
636*b2055c35SXin Li   num_lines_out = p->emit(io, p);
637*b2055c35SXin Li   if (p->emit_alpha != NULL) {
638*b2055c35SXin Li     p->emit_alpha(io, p, num_lines_out);
639*b2055c35SXin Li   }
640*b2055c35SXin Li   p->last_y += num_lines_out;
641*b2055c35SXin Li   return 1;
642*b2055c35SXin Li }
643*b2055c35SXin Li 
644*b2055c35SXin Li //------------------------------------------------------------------------------
645*b2055c35SXin Li 
CustomTeardown(const VP8Io * io)646*b2055c35SXin Li static void CustomTeardown(const VP8Io* io) {
647*b2055c35SXin Li   WebPDecParams* const p = (WebPDecParams*)io->opaque;
648*b2055c35SXin Li   WebPSafeFree(p->memory);
649*b2055c35SXin Li   p->memory = NULL;
650*b2055c35SXin Li }
651*b2055c35SXin Li 
652*b2055c35SXin Li //------------------------------------------------------------------------------
653*b2055c35SXin Li // Main entry point
654*b2055c35SXin Li 
// Installs this file's setup / put / teardown hooks on 'io' and stores
// 'params' in io->opaque, which is where those hooks read it back from.
void WebPInitCustomIo(WebPDecParams* const params, VP8Io* const io) {
  io->opaque   = params;
  io->setup    = CustomSetup;
  io->put      = CustomPut;
  io->teardown = CustomTeardown;
}
661*b2055c35SXin Li 
662*b2055c35SXin Li //------------------------------------------------------------------------------
663