src/dsp/dsp.h

/*
 * Copyright 2019 The libgav1 Authors
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop#ifndef LIBGAV1_SRC_DSP_DSP_H_
*09537850SAkhilesh Sanikop#define LIBGAV1_SRC_DSP_DSP_H_
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop#include <cstddef>
*09537850SAkhilesh Sanikop#include <cstdint>
*09537850SAkhilesh Sanikop#include <cstdlib>
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop#include "src/dsp/common.h"
*09537850SAkhilesh Sanikop#include "src/dsp/constants.h"
*09537850SAkhilesh Sanikop#include "src/dsp/film_grain_common.h"
*09537850SAkhilesh Sanikop#include "src/utils/cpu.h"
*09537850SAkhilesh Sanikop#include "src/utils/reference_info.h"
*09537850SAkhilesh Sanikop#include "src/utils/types.h"
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopnamespace libgav1 {
*09537850SAkhilesh Sanikopnamespace dsp {
*09537850SAkhilesh Sanikop
// Default LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS to 0 unless it was already defined
// before this point (e.g. on the compiler command line).
#if !defined(LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS)
#define LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS 0
#endif
*09537850SAkhilesh Sanikop
// Intra predictor kinds. The enumerators are used as the last index of
// IntraPredictorFuncs; kNumIntraPredictors is the number of kinds and sizes
// that dimension.
enum IntraPredictor : uint8_t {
  kIntraPredictorDcFill,
  kIntraPredictorDcTop,
  kIntraPredictorDcLeft,
  kIntraPredictorDc,
  kIntraPredictorVertical,
  kIntraPredictorHorizontal,
  kIntraPredictorPaeth,
  kIntraPredictorSmooth,
  kIntraPredictorSmoothVertical,
  kIntraPredictorSmoothHorizontal,
  kNumIntraPredictors
};
*09537850SAkhilesh Sanikop
// List of valid 1D transforms. kNumTransform1ds is the number of transforms
// and sizes the first dimension of InverseTransformAddFuncs.
enum Transform1d : uint8_t {
  kTransform1dDct,   // Discrete Cosine Transform.
  kTransform1dAdst,  // Asymmetric Discrete Sine Transform.
  kTransform1dIdentity,
  kTransform1dWht,  // Walsh Hadamard Transform.
  kNumTransform1ds
};
*09537850SAkhilesh Sanikop
// List of valid 1D transform sizes. Not every transform is necessarily
// available at every size. kNumTransform1dSizes is the number of sizes and
// sizes the second dimension of InverseTransformAddFuncs.
enum Transform1dSize : uint8_t {
  kTransform1dSize4,
  kTransform1dSize8,
  kTransform1dSize16,
  kTransform1dSize32,
  kTransform1dSize64,
  kNumTransform1dSizes
};
*09537850SAkhilesh Sanikop
// The maximum width of the loop filter; fewer pixels may be filtered depending
// on strength thresholds. kNumLoopFilterSizes is the number of sizes and sizes
// the first dimension of LoopFilterFuncs.
enum LoopFilterSize : uint8_t {
  kLoopFilterSize4,
  kLoopFilterSize6,
  kLoopFilterSize8,
  kLoopFilterSize14,
  kNumLoopFilterSizes
};
*09537850SAkhilesh Sanikop
// Indices into the final dimension of InverseTransformAddFuncs, selecting the
// row or the column transform.
enum : uint8_t {
  kRow = 0,
  kColumn = 1,
};
*09537850SAkhilesh Sanikop
//------------------------------------------------------------------------------
// ToString()
//
// These functions are meant to be used only in debug logging and within tests.
// They are defined inline to avoid including the strings in the release
// library when logging is disabled; unreferenced functions will not be added to
// any object file in that case.
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopinline const char* ToString(const IntraPredictor predictor) {
*09537850SAkhilesh Sanikop  switch (predictor) {
*09537850SAkhilesh Sanikop    case kIntraPredictorDcFill:
*09537850SAkhilesh Sanikop      return "kIntraPredictorDcFill";
*09537850SAkhilesh Sanikop    case kIntraPredictorDcTop:
*09537850SAkhilesh Sanikop      return "kIntraPredictorDcTop";
*09537850SAkhilesh Sanikop    case kIntraPredictorDcLeft:
*09537850SAkhilesh Sanikop      return "kIntraPredictorDcLeft";
*09537850SAkhilesh Sanikop    case kIntraPredictorDc:
*09537850SAkhilesh Sanikop      return "kIntraPredictorDc";
*09537850SAkhilesh Sanikop    case kIntraPredictorVertical:
*09537850SAkhilesh Sanikop      return "kIntraPredictorVertical";
*09537850SAkhilesh Sanikop    case kIntraPredictorHorizontal:
*09537850SAkhilesh Sanikop      return "kIntraPredictorHorizontal";
*09537850SAkhilesh Sanikop    case kIntraPredictorPaeth:
*09537850SAkhilesh Sanikop      return "kIntraPredictorPaeth";
*09537850SAkhilesh Sanikop    case kIntraPredictorSmooth:
*09537850SAkhilesh Sanikop      return "kIntraPredictorSmooth";
*09537850SAkhilesh Sanikop    case kIntraPredictorSmoothVertical:
*09537850SAkhilesh Sanikop      return "kIntraPredictorSmoothVertical";
*09537850SAkhilesh Sanikop    case kIntraPredictorSmoothHorizontal:
*09537850SAkhilesh Sanikop      return "kIntraPredictorSmoothHorizontal";
*09537850SAkhilesh Sanikop    case kNumIntraPredictors:
*09537850SAkhilesh Sanikop      return "kNumIntraPredictors";
*09537850SAkhilesh Sanikop  }
*09537850SAkhilesh Sanikop  abort();
*09537850SAkhilesh Sanikop}
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopinline const char* ToString(const Transform1d transform) {
*09537850SAkhilesh Sanikop  switch (transform) {
*09537850SAkhilesh Sanikop    case kTransform1dDct:
*09537850SAkhilesh Sanikop      return "kTransform1dDct";
*09537850SAkhilesh Sanikop    case kTransform1dAdst:
*09537850SAkhilesh Sanikop      return "kTransform1dAdst";
*09537850SAkhilesh Sanikop    case kTransform1dIdentity:
*09537850SAkhilesh Sanikop      return "kTransform1dIdentity";
*09537850SAkhilesh Sanikop    case kTransform1dWht:
*09537850SAkhilesh Sanikop      return "kTransform1dWht";
*09537850SAkhilesh Sanikop    case kNumTransform1ds:
*09537850SAkhilesh Sanikop      return "kNumTransform1ds";
*09537850SAkhilesh Sanikop  }
*09537850SAkhilesh Sanikop  abort();
*09537850SAkhilesh Sanikop}
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopinline const char* ToString(const Transform1dSize transform_size) {
*09537850SAkhilesh Sanikop  switch (transform_size) {
*09537850SAkhilesh Sanikop    case kTransform1dSize4:
*09537850SAkhilesh Sanikop      return "kTransform1dSize4";
*09537850SAkhilesh Sanikop    case kTransform1dSize8:
*09537850SAkhilesh Sanikop      return "kTransform1dSize8";
*09537850SAkhilesh Sanikop    case kTransform1dSize16:
*09537850SAkhilesh Sanikop      return "kTransform1dSize16";
*09537850SAkhilesh Sanikop    case kTransform1dSize32:
*09537850SAkhilesh Sanikop      return "kTransform1dSize32";
*09537850SAkhilesh Sanikop    case kTransform1dSize64:
*09537850SAkhilesh Sanikop      return "kTransform1dSize64";
*09537850SAkhilesh Sanikop    case kNumTransform1dSizes:
*09537850SAkhilesh Sanikop      return "kNumTransform1dSizes";
*09537850SAkhilesh Sanikop  }
*09537850SAkhilesh Sanikop  abort();
*09537850SAkhilesh Sanikop}
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopinline const char* ToString(const LoopFilterSize filter_size) {
*09537850SAkhilesh Sanikop  switch (filter_size) {
*09537850SAkhilesh Sanikop    case kLoopFilterSize4:
*09537850SAkhilesh Sanikop      return "kLoopFilterSize4";
*09537850SAkhilesh Sanikop    case kLoopFilterSize6:
*09537850SAkhilesh Sanikop      return "kLoopFilterSize6";
*09537850SAkhilesh Sanikop    case kLoopFilterSize8:
*09537850SAkhilesh Sanikop      return "kLoopFilterSize8";
*09537850SAkhilesh Sanikop    case kLoopFilterSize14:
*09537850SAkhilesh Sanikop      return "kLoopFilterSize14";
*09537850SAkhilesh Sanikop    case kNumLoopFilterSizes:
*09537850SAkhilesh Sanikop      return "kNumLoopFilterSizes";
*09537850SAkhilesh Sanikop  }
*09537850SAkhilesh Sanikop  abort();
*09537850SAkhilesh Sanikop}
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopinline const char* ToString(const LoopFilterType filter_type) {
*09537850SAkhilesh Sanikop  switch (filter_type) {
*09537850SAkhilesh Sanikop    case kLoopFilterTypeVertical:
*09537850SAkhilesh Sanikop      return "kLoopFilterTypeVertical";
*09537850SAkhilesh Sanikop    case kLoopFilterTypeHorizontal:
*09537850SAkhilesh Sanikop      return "kLoopFilterTypeHorizontal";
*09537850SAkhilesh Sanikop    case kNumLoopFilterTypes:
*09537850SAkhilesh Sanikop      return "kNumLoopFilterTypes";
*09537850SAkhilesh Sanikop  }
*09537850SAkhilesh Sanikop  abort();
*09537850SAkhilesh Sanikop}
*09537850SAkhilesh Sanikop
//------------------------------------------------------------------------------
// Intra predictors. Section 7.11.2.
// These require access to one or both of the top row and left column. Some may
// access the top-left (top[-1]), top-right (top[width+N]), bottom-left
// (left[height+N]) or upper-left (left[-1]).
*09537850SAkhilesh Sanikop
// Intra predictor function signature. Sections 7.11.2.2, 7.11.2.4 (#10,#11),
// 7.11.2.5, 7.11.2.6.
// |dst| is an unaligned pointer to the output block. Pixel size is determined
// by bitdepth.
// |stride| is the stride of |dst|, given in bytes.
// |top| is an unaligned pointer to the row above |dst|.
// |left| is an aligned vector of the column to the left of |dst|.
// top-left and bottom-left may be accessed.
// The pointer arguments do not alias one another.
using IntraPredictorFunc = void (*)(void* dst, ptrdiff_t stride,
                                    const void* top, const void* left);
*09537850SAkhilesh Sanikopusing IntraPredictorFuncs =
*09537850SAkhilesh Sanikop    IntraPredictorFunc[kNumTransformSizes][kNumIntraPredictors];
*09537850SAkhilesh Sanikop
// Directional intra predictor function signature, zone 1 (0 < angle < 90).
// Section 7.11.2.4 (#7).
// |dst| is an unaligned pointer to the output block. Pixel size is determined
// by bitdepth.
// |stride| is the stride of |dst|, given in bytes.
// |top| is an unaligned pointer to the row above |dst|.
// |width| and |height| give the dimensions of the block.
// |xstep| is the scaled starting index to |top| from
// kDirectionalIntraPredictorDerivative.
// |upsampled_top| indicates whether |top| has been upsampled as described in
// '7.11.2.11. Intra edge upsample process'. This can occur in cases with
// |width| + |height| <= 16.
// top-right is accessed.
// The pointer arguments do not alias one another.
using DirectionalIntraPredictorZone1Func = void (*)(void* dst, ptrdiff_t stride,
                                                    const void* top, int width,
                                                    int height, int xstep,
                                                    bool upsampled_top);
*09537850SAkhilesh Sanikop
// Directional intra predictor function signature, zone 2 (90 < angle < 180).
// Section 7.11.2.4 (#8).
// |dst| is an unaligned pointer to the output block. Pixel size is determined
// by bitdepth.
// |stride| is the stride of |dst|, given in bytes.
// |top| is an unaligned pointer to the row above |dst|.
// |left| is an aligned vector of the column to the left of |dst|.
// |width| and |height| give the dimensions of the block.
// |xstep| and |ystep| are the scaled starting index to |top| and |left|,
// respectively, from kDirectionalIntraPredictorDerivative.
// |upsampled_top| and |upsampled_left| indicate whether |top| and |left| have
// been upsampled as described in '7.11.2.11. Intra edge upsample process'.
// This can occur in cases with |width| + |height| <= 16.
// top-left and upper-left are accessed, up to [-2] in each if
// |upsampled_top/left| are set.
// The pointer arguments do not alias one another.
using DirectionalIntraPredictorZone2Func = void (*)(
    void* dst, ptrdiff_t stride, const void* top, const void* left, int width,
    int height, int xstep, int ystep, bool upsampled_top, bool upsampled_left);
*09537850SAkhilesh Sanikop
// Directional intra predictor function signature, zone 3 (180 < angle < 270).
// Section 7.11.2.4 (#9).
// |dst| is an unaligned pointer to the output block. Pixel size is determined
// by bitdepth.
// |stride| is the stride of |dst|, given in bytes.
// |left| is an aligned vector of the column to the left of |dst|.
// |width| and |height| give the dimensions of the block.
// |ystep| is the scaled starting index to |left| from
// kDirectionalIntraPredictorDerivative.
// |upsampled_left| indicates whether |left| has been upsampled as described in
// '7.11.2.11. Intra edge upsample process'. This can occur in cases with
// |width| + |height| <= 16.
// bottom-left is accessed.
// The pointer arguments do not alias one another.
using DirectionalIntraPredictorZone3Func = void (*)(void* dst, ptrdiff_t stride,
                                                    const void* left, int width,
                                                    int height, int ystep,
                                                    bool upsampled_left);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Filter intra predictor function signature. Section 7.11.2.3.
*09537850SAkhilesh Sanikop// |dst| is an unaligned pointer to the output block. Pixel size is determined
*09537850SAkhilesh Sanikop// by bitdepth with |stride| given in bytes. |top| is an unaligned pointer to
*09537850SAkhilesh Sanikop// the row above |dst|. |left| is an aligned vector of the column to the left
*09537850SAkhilesh Sanikop// of |dst|. |width| and |height| are the size of the block in pixels.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing FilterIntraPredictorFunc = void (*)(void* dst, ptrdiff_t stride,
*09537850SAkhilesh Sanikop                                          const void* top, const void* left,
*09537850SAkhilesh Sanikop                                          FilterIntraPredictor pred, int width,
*09537850SAkhilesh Sanikop                                          int height);
*09537850SAkhilesh Sanikop
//------------------------------------------------------------------------------
// Chroma from Luma (Cfl) prediction. Section 7.11.5.
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Chroma from Luma (Cfl) intra prediction function signature. |dst| is an
*09537850SAkhilesh Sanikop// unaligned pointer to the output block. Pixel size is determined by bitdepth
*09537850SAkhilesh Sanikop// with |stride| given in bytes. |luma| contains subsampled luma pixels with 3
*09537850SAkhilesh Sanikop// fractional bits of precision. |alpha| is the signed Cfl alpha value for the
*09537850SAkhilesh Sanikop// appropriate plane.
*09537850SAkhilesh Sanikopusing CflIntraPredictorFunc = void (*)(
*09537850SAkhilesh Sanikop    void* dst, ptrdiff_t stride,
*09537850SAkhilesh Sanikop    const int16_t luma[kCflLumaBufferStride][kCflLumaBufferStride], int alpha);
*09537850SAkhilesh Sanikopusing CflIntraPredictorFuncs = CflIntraPredictorFunc[kNumTransformSizes];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Chroma from Luma (Cfl) subsampler function signature. |luma| is an unaligned
*09537850SAkhilesh Sanikop// pointer to the output block. |src| is an unaligned pointer to the input
*09537850SAkhilesh Sanikop// block. Pixel size is determined by bitdepth with |stride| given in bytes.
*09537850SAkhilesh Sanikopusing CflSubsamplerFunc =
*09537850SAkhilesh Sanikop    void (*)(int16_t luma[kCflLumaBufferStride][kCflLumaBufferStride],
*09537850SAkhilesh Sanikop             int max_luma_width, int max_luma_height, const void* source,
*09537850SAkhilesh Sanikop             ptrdiff_t stride);
*09537850SAkhilesh Sanikopusing CflSubsamplerFuncs =
*09537850SAkhilesh Sanikop    CflSubsamplerFunc[kNumTransformSizes][kNumSubsamplingTypes];
*09537850SAkhilesh Sanikop
//------------------------------------------------------------------------------
// Intra Edge Filtering and Upsampling. Step 4 in section 7.11.2.4.
*09537850SAkhilesh Sanikop
// Intra edge filter function signature. Section 7.11.2.12 in the spec.
// |buffer| is a pointer to the top_row or left_column that needs to be
// filtered. Typically the -1'th index of |top_row| and |left_column| needs to
// be filtered as well, so the caller can merely pass the |buffer| as
// top_row[-1] or left_column[-1]. Pixel size is determined by bitdepth.
// |size| is the number of pixels to be filtered.
// |strength| is the filter strength.
using IntraEdgeFilterFunc = void (*)(void* buffer, int size, int strength);
*09537850SAkhilesh Sanikop
// Intra edge upsampler function signature. Section 7.11.2.11 in the spec.
// |buffer| is a pointer to the top_row or left_column that needs to be
// upsampled. Pixel size is determined by bitdepth. This function needs access
// to negative indices -1 and -2 of the |buffer|.
// |size| is the number of pixels to be upsampled; valid values are: 4, 8, 12,
// 16.
using IntraEdgeUpsamplerFunc = void (*)(void* buffer, int size);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop//------------------------------------------------------------------------------
*09537850SAkhilesh Sanikop// Inverse transform add function signature.
*09537850SAkhilesh Sanikop//
*09537850SAkhilesh Sanikop// Steps 2 and 3 of section 7.12.3 (contains the implementation of section
*09537850SAkhilesh Sanikop// 7.13.3).
*09537850SAkhilesh Sanikop// Apply the inverse transforms and add the residual to the destination frame
*09537850SAkhilesh Sanikop// for the transform type and block size |tx_size| starting at position
*09537850SAkhilesh Sanikop// |start_x| and |start_y|. |dst_frame| is a pointer to an Array2D of Pixel
*09537850SAkhilesh Sanikop// values. |adjusted_tx_height| is the number of rows to process based on the
*09537850SAkhilesh Sanikop// non-zero coefficient count in the block. It will be 1 (non-zero coefficient
*09537850SAkhilesh Sanikop// count == 1), 4 or a multiple of 8 up to 32 or the original transform height,
*09537850SAkhilesh Sanikop// whichever is less. |src_buffer| is a pointer to an Array2D of Residual
*09537850SAkhilesh Sanikop// values. On input |src_buffer| contains the dequantized values, on output it
*09537850SAkhilesh Sanikop// contains the residual.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing InverseTransformAddFunc = void (*)(TransformType tx_type,
*09537850SAkhilesh Sanikop                                         TransformSize tx_size,
*09537850SAkhilesh Sanikop                                         int adjusted_tx_height,
*09537850SAkhilesh Sanikop                                         void* src_buffer, int start_x,
*09537850SAkhilesh Sanikop                                         int start_y, void* dst_frame);
*09537850SAkhilesh Sanikop// The final dimension holds row and column transforms indexed with kRow and
*09537850SAkhilesh Sanikop// kColumn.
*09537850SAkhilesh Sanikopusing InverseTransformAddFuncs =
*09537850SAkhilesh Sanikop    InverseTransformAddFunc[kNumTransform1ds][kNumTransform1dSizes][2];
*09537850SAkhilesh Sanikop
//------------------------------------------------------------------------------
// Post processing.
*09537850SAkhilesh Sanikop
// Loop filter function signature. Section 7.14.
// |dst| is an unaligned pointer to the output block. Pixel size is determined
// by bitdepth.
// |stride| is the stride of |dst|, given in bytes.
// <threshold param> <spec name> <range>
// |outer_thresh|    blimit      [7, 193]
// |inner_thresh|    limit       [1, 63]
// |hev_thresh|      thresh      [0, 63]
// These are scaled by the implementation by 'bitdepth - 8' to produce
// the spec variables blimitBd, limitBd and threshBd.
// Note these functions are not called when the loop filter level is 0.
using LoopFilterFunc = void (*)(void* dst, ptrdiff_t stride, int outer_thresh,
                                int inner_thresh, int hev_thresh);
*09537850SAkhilesh Sanikopusing LoopFilterFuncs =
*09537850SAkhilesh Sanikop    LoopFilterFunc[kNumLoopFilterSizes][kNumLoopFilterTypes];
*09537850SAkhilesh Sanikop
// Cdef direction function signature. Section 7.15.2.
// |src| is a pointer to the source block. Pixel size is determined by
// bitdepth.
// |stride| is the stride of |src|, given in bytes.
// |direction| and |variance| are output parameters and must not be nullptr.
// The pointer arguments do not alias one another.
using CdefDirectionFunc = void (*)(const void* src, ptrdiff_t stride,
                                   uint8_t* direction, int* variance);
*09537850SAkhilesh Sanikop
// Cdef filtering function signature. Section 7.15.3.
// |source| is a pointer to the input block padded with kCdefLargeValue if at a
// frame border.
// |source_stride| is given in units of uint16_t.
// |block_height| is the height of the input block. The block width is not a
// parameter; it is selected by the first index of CdefFilteringFuncs.
// |primary_strength|, |secondary_strength|, and |damping| are Cdef filtering
// parameters.
// |direction| is the filtering direction.
// |dest| is the output buffer.
// |dest_stride| is given in bytes.
// The pointer arguments do not alias one another.
using CdefFilteringFunc = void (*)(const uint16_t* source,
                                   ptrdiff_t source_stride, int block_height,
                                   int primary_strength, int secondary_strength,
                                   int damping, int direction, void* dest,
                                   ptrdiff_t dest_stride);

// The first index is block width: [0]: 4, [1]: 8. The second is based on
// non-zero strengths: [0]: |primary_strength| and |secondary_strength|, [1]:
// |primary_strength| only, [2]: |secondary_strength| only.
using CdefFilteringFuncs = CdefFilteringFunc[2][3];
*09537850SAkhilesh Sanikop
// Upscaling coefficients function signature. Section 7.16.
// This is an auxiliary function for SIMD optimizations and has no corresponding
// C function. Different SIMD versions may have different outputs, so it must
// be paired with the corresponding version of SuperResFunc.
// |upscaled_width| is the width of the output frame.
// |initial_subpixel_x| is a base offset from which |step| increments.
// |step| is the number of subpixels to move the kernel for the next destination
// pixel.
// |coefficients| is the upscale filter used by each pixel in a row.
using SuperResCoefficientsFunc = void (*)(int upscaled_width,
                                          int initial_subpixel_x, int step,
                                          void* coefficients);
*09537850SAkhilesh Sanikop
// Upscaling process function signature. Section 7.16.
// |coefficients| is the upscale filter used by each pixel in a row. It is not
// used by the C function.
// |source| is the input frame buffer. It will be line extended.
// |source_stride| is given in pixels.
// |height| is the height of the block to be processed.
// |downscaled_width| is the width of the input frame.
// |upscaled_width| is the width of the output frame.
// |initial_subpixel_x| is a base offset from which |step| increments.
// |step| is the number of subpixels to move the kernel for the next destination
// pixel.
// |dest| is the output buffer.
// |dest_stride| is given in pixels.
// The pointer arguments do not alias one another.
using SuperResFunc = void (*)(const void* coefficients, void* source,
                              ptrdiff_t source_stride, int height,
                              int downscaled_width, int upscaled_width,
                              int initial_subpixel_x, int step, void* dest,
                              ptrdiff_t dest_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Loop restoration function signature. Sections 7.16, 7.17.
*09537850SAkhilesh Sanikop// |restoration_info| contains loop restoration information, such as filter
*09537850SAkhilesh Sanikop// type, strength.
*09537850SAkhilesh Sanikop// |source| is the input frame buffer, which is deblocked and cdef filtered.
*09537850SAkhilesh Sanikop// |top_border| and |bottom_border| are the top and bottom borders.
*09537850SAkhilesh Sanikop// |dest| is the output.
*09537850SAkhilesh Sanikop// |stride| is given in pixels, and shared by |source| and |dest|.
*09537850SAkhilesh Sanikop// |top_border_stride| and |bottom_border_stride| are given in pixels.
*09537850SAkhilesh Sanikop// |restoration_buffer| contains buffers required for self guided filter and
*09537850SAkhilesh Sanikop// wiener filter. They must be initialized before calling.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing LoopRestorationFunc = void (*)(
*09537850SAkhilesh Sanikop    const RestorationUnitInfo& restoration_info, const void* source,
*09537850SAkhilesh Sanikop    ptrdiff_t stride, const void* top_border, ptrdiff_t top_border_stride,
*09537850SAkhilesh Sanikop    const void* bottom_border, ptrdiff_t bottom_border_stride, int width,
*09537850SAkhilesh Sanikop    int height, RestorationBuffer* restoration_buffer, void* dest);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Index 0 is Wiener Filter.
*09537850SAkhilesh Sanikop// Index 1 is Self Guided Restoration Filter.
*09537850SAkhilesh Sanikop// This can be accessed as LoopRestorationType - 2.
*09537850SAkhilesh Sanikopusing LoopRestorationFuncs = LoopRestorationFunc[2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Convolve function signature. Section 7.11.3.4.
*09537850SAkhilesh Sanikop// This function applies a horizontal filter followed by a vertical filter.
*09537850SAkhilesh Sanikop// |reference| is the input block (reference frame buffer). |reference_stride|
*09537850SAkhilesh Sanikop// is the corresponding frame stride.
*09537850SAkhilesh Sanikop// |horizontal_filter_index|/|vertical_filter_index| is the index used to
*09537850SAkhilesh Sanikop// retrieve the type of filter to be applied for horizontal/vertical direction
*09537850SAkhilesh Sanikop// from the filter lookup table 'kSubPixelFilters'.
*09537850SAkhilesh Sanikop// |horizontal_filter_id| and |vertical_filter_id| are the filter ids.
*09537850SAkhilesh Sanikop// |width| and |height| are width and height of the block to be filtered.
*09537850SAkhilesh Sanikop// |prediction| is the output block (output frame buffer).
*09537850SAkhilesh Sanikop// |pred_stride| is the stride of |prediction|. NOTE(review): the unit (bytes
*09537850SAkhilesh Sanikop// or elements) is not stated in this header -- confirm with the callers.
*09537850SAkhilesh Sanikop// Rounding precision is derived from the function being called. For horizontal
*09537850SAkhilesh Sanikop// filtering kInterRoundBitsHorizontal & kInterRoundBitsHorizontal12bpp will be
*09537850SAkhilesh Sanikop// used. For compound vertical filtering kInterRoundBitsCompoundVertical will be
*09537850SAkhilesh Sanikop// used. Otherwise kInterRoundBitsVertical & kInterRoundBitsVertical12bpp will
*09537850SAkhilesh Sanikop// be used.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing ConvolveFunc = void (*)(const void* reference, ptrdiff_t reference_stride,
*09537850SAkhilesh Sanikop                              int horizontal_filter_index,
*09537850SAkhilesh Sanikop                              int vertical_filter_index,
*09537850SAkhilesh Sanikop                              int horizontal_filter_id, int vertical_filter_id,
*09537850SAkhilesh Sanikop                              int width, int height, void* prediction,
*09537850SAkhilesh Sanikop                              ptrdiff_t pred_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Table of convolve functions. Each entry points to one convolve function
*09537850SAkhilesh Sanikop// with a specific setting:
*09537850SAkhilesh Sanikop// ConvolveFunc[is_intra_block_copy][is_compound][has_vertical_filter]
*09537850SAkhilesh Sanikop// [has_horizontal_filter].
*09537850SAkhilesh Sanikop// If is_compound is false, the prediction is clipped to Pixel.
*09537850SAkhilesh Sanikop// If is_compound is true, the range of prediction is:
*09537850SAkhilesh Sanikop//   8bpp:  [-5132,  9212] (int16_t)
*09537850SAkhilesh Sanikop//   10bpp: [ 3988, 61532] (uint16_t)
*09537850SAkhilesh Sanikop//   12bpp: [ 3974, 61559] (uint16_t)
*09537850SAkhilesh Sanikop// See src/dsp/convolve.cc
*09537850SAkhilesh Sanikopusing ConvolveFuncs = ConvolveFunc[2][2][2][2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Convolve + scale function signature. Section 7.11.3.4.
*09537850SAkhilesh Sanikop// This function applies a horizontal filter followed by a vertical filter.
*09537850SAkhilesh Sanikop// |reference| is the input block (reference frame buffer). |reference_stride|
*09537850SAkhilesh Sanikop// is the corresponding frame stride.
*09537850SAkhilesh Sanikop// |horizontal_filter_index|/|vertical_filter_index| is the index used to
*09537850SAkhilesh Sanikop// retrieve the type of filter to be applied for horizontal/vertical direction
*09537850SAkhilesh Sanikop// from the filter lookup table 'kSubPixelFilters'.
*09537850SAkhilesh Sanikop// |subpixel_x| and |subpixel_y| are starting positions in units of 1/1024.
*09537850SAkhilesh Sanikop// |step_x| and |step_y| are step sizes in units of 1/1024 of a pixel.
*09537850SAkhilesh Sanikop// |width| and |height| are width and height of the block to be filtered.
*09537850SAkhilesh Sanikop// |prediction| is the output block (output frame buffer).
*09537850SAkhilesh Sanikop// |pred_stride| is the stride of |prediction|. NOTE(review): the unit (bytes
*09537850SAkhilesh Sanikop// or elements) is not stated in this header -- confirm with the callers.
*09537850SAkhilesh Sanikop// Rounding precision is derived from the function being called. For horizontal
*09537850SAkhilesh Sanikop// filtering kInterRoundBitsHorizontal & kInterRoundBitsHorizontal12bpp will be
*09537850SAkhilesh Sanikop// used. For compound vertical filtering kInterRoundBitsCompoundVertical will be
*09537850SAkhilesh Sanikop// used. Otherwise kInterRoundBitsVertical & kInterRoundBitsVertical12bpp will
*09537850SAkhilesh Sanikop// be used.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing ConvolveScaleFunc = void (*)(const void* reference,
*09537850SAkhilesh Sanikop                                   ptrdiff_t reference_stride,
*09537850SAkhilesh Sanikop                                   int horizontal_filter_index,
*09537850SAkhilesh Sanikop                                   int vertical_filter_index, int subpixel_x,
*09537850SAkhilesh Sanikop                                   int subpixel_y, int step_x, int step_y,
*09537850SAkhilesh Sanikop                                   int width, int height, void* prediction,
*09537850SAkhilesh Sanikop                                   ptrdiff_t pred_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Table of convolve functions for the scaling version.
*09537850SAkhilesh Sanikop// Index 0: single predictor. Index 1: compound predictor.
*09537850SAkhilesh Sanikopusing ConvolveScaleFuncs = ConvolveScaleFunc[2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Weight mask function signature. Section 7.11.3.12.
*09537850SAkhilesh Sanikop// |prediction_0| is the first input block.
*09537850SAkhilesh Sanikop// |prediction_1| is the second input block. Both blocks are int16_t* when
*09537850SAkhilesh Sanikop// bitdepth == 8 and uint16_t* otherwise.
*09537850SAkhilesh Sanikop// The block width and height are not parameters: the WeightMaskFuncs table
*09537850SAkhilesh Sanikop// is indexed by them. The input buffer stride is equal to the block width.
*09537850SAkhilesh Sanikop// The valid range of block size is [8x8, 128x128] for the luma plane.
*09537850SAkhilesh Sanikop// |mask| is the output buffer. |mask_stride| is the output buffer stride.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing WeightMaskFunc = void (*)(const void* prediction_0,
*09537850SAkhilesh Sanikop                                const void* prediction_1, uint8_t* mask,
*09537850SAkhilesh Sanikop                                ptrdiff_t mask_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Table of weight mask functions. The dimensions (in order) are:
*09537850SAkhilesh Sanikop//   * Width index (4 => 0, 8 => 1, 16 => 2 and so on).
*09537850SAkhilesh Sanikop//   * Height index (4 => 0, 8 => 1, 16 => 2 and so on).
*09537850SAkhilesh Sanikop//   * mask_is_inverse.
*09537850SAkhilesh Sanikopusing WeightMaskFuncs = WeightMaskFunc[6][6][2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Average blending function signature.
*09537850SAkhilesh Sanikop// Two predictors are averaged to generate the output.
*09537850SAkhilesh Sanikop// The output is written to |dest| as Pixel values. NOTE(review): presumably
*09537850SAkhilesh Sanikop// uint8_t for bitdepth == 8 and uint16_t otherwise -- confirm.
*09537850SAkhilesh Sanikop// Average blending is at the bottom of Section 7.11.3.1 (COMPOUND_AVERAGE).
*09537850SAkhilesh Sanikop// |prediction_0| is the first input block.
*09537850SAkhilesh Sanikop// |prediction_1| is the second input block. Both blocks are int16_t* when
*09537850SAkhilesh Sanikop// bitdepth == 8 and uint16_t* otherwise.
*09537850SAkhilesh Sanikop// |width| and |height| are the same for the first and second input blocks.
*09537850SAkhilesh Sanikop// The stride for the input buffers is equal to |width|.
*09537850SAkhilesh Sanikop// The valid range of block size is [8x8, 128x128] for the luma plane.
*09537850SAkhilesh Sanikop// |dest| is the output buffer. |dest_stride| is the output buffer stride.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing AverageBlendFunc = void (*)(const void* prediction_0,
*09537850SAkhilesh Sanikop                                  const void* prediction_1, int width,
*09537850SAkhilesh Sanikop                                  int height, void* dest,
*09537850SAkhilesh Sanikop                                  ptrdiff_t dest_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Distance weighted blending function signature.
*09537850SAkhilesh Sanikop// Weights are generated in Section 7.11.3.15.
*09537850SAkhilesh Sanikop// Weighted blending is at the bottom of Section 7.11.3.1 (COMPOUND_DISTANCE).
*09537850SAkhilesh Sanikop// This function takes two blocks (inter frame prediction) and produces a
*09537850SAkhilesh Sanikop// weighted output.
*09537850SAkhilesh Sanikop// |prediction_0| is the first input block.
*09537850SAkhilesh Sanikop// |prediction_1| is the second input block. Both blocks are int16_t* when
*09537850SAkhilesh Sanikop// bitdepth == 8 and uint16_t* otherwise.
*09537850SAkhilesh Sanikop// |weight_0| is the weight for the first block. It is derived from the relative
*09537850SAkhilesh Sanikop// distance of the first reference frame and the current frame.
*09537850SAkhilesh Sanikop// |weight_1| is the weight for the second block. It is derived from the
*09537850SAkhilesh Sanikop// relative distance of the second reference frame and the current frame.
*09537850SAkhilesh Sanikop// |width| and |height| are the same for the first and second input blocks.
*09537850SAkhilesh Sanikop// The stride for the input buffers is equal to |width|.
*09537850SAkhilesh Sanikop// The valid range of block size is [8x8, 128x128] for the luma plane.
*09537850SAkhilesh Sanikop// |dest| is the output buffer. |dest_stride| is the output buffer stride.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing DistanceWeightedBlendFunc = void (*)(const void* prediction_0,
*09537850SAkhilesh Sanikop                                           const void* prediction_1,
*09537850SAkhilesh Sanikop                                           uint8_t weight_0, uint8_t weight_1,
*09537850SAkhilesh Sanikop                                           int width, int height, void* dest,
*09537850SAkhilesh Sanikop                                           ptrdiff_t dest_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Mask blending function signature. Section 7.11.3.14.
*09537850SAkhilesh Sanikop// This function takes two blocks and produces a blended output stored into the
*09537850SAkhilesh Sanikop// output block |dest|. The blending is a weighted average process, controlled
*09537850SAkhilesh Sanikop// by values of the mask.
*09537850SAkhilesh Sanikop// |prediction_0| is the first input block. When prediction mode is inter_intra
*09537850SAkhilesh Sanikop// (or wedge_inter_intra), this refers to the inter frame prediction. It is
*09537850SAkhilesh Sanikop// int16_t* when bitdepth == 8 and uint16_t* otherwise.
*09537850SAkhilesh Sanikop// The stride for |prediction_0| is equal to |width|.
*09537850SAkhilesh Sanikop// |prediction_1| is the second input block. When prediction mode is inter_intra
*09537850SAkhilesh Sanikop// (or wedge_inter_intra), this refers to the intra frame prediction and uses
*09537850SAkhilesh Sanikop// Pixel values. It is only used for intra frame prediction when bitdepth >= 10.
*09537850SAkhilesh Sanikop// It is int16_t* when bitdepth == 8 and uint16_t* otherwise.
*09537850SAkhilesh Sanikop// |prediction_stride_1| is the stride, given in units of [u]int16_t. When
*09537850SAkhilesh Sanikop// |is_inter_intra| is false (compound prediction) then |prediction_stride_1| is
*09537850SAkhilesh Sanikop// equal to |width|.
*09537850SAkhilesh Sanikop// |mask| is an integer array, whose value indicates the weight of the blending.
*09537850SAkhilesh Sanikop// |mask_stride| is corresponding stride.
*09537850SAkhilesh Sanikop// |width|, |height| are the same for both input blocks.
*09537850SAkhilesh Sanikop// If it's inter_intra (or wedge_inter_intra), the valid range of block size is
*09537850SAkhilesh Sanikop// [8x8, 32x32], no 4:1/1:4 blocks (Section 5.11.28). Otherwise (including
*09537850SAkhilesh Sanikop// difference weighted prediction and compound average prediction), the valid
*09537850SAkhilesh Sanikop// range is [8x8, 128x128].
*09537850SAkhilesh Sanikop// If there's subsampling, the corresponding width and height are halved for
*09537850SAkhilesh Sanikop// chroma planes.
*09537850SAkhilesh Sanikop// |is_inter_intra| and |is_wedge_inter_intra| are not parameters of this
*09537850SAkhilesh Sanikop// signature. |is_inter_intra| selects the MaskBlendFuncs entry: if true, one
*09537850SAkhilesh Sanikop// prediction block is from intra prediction of the current frame; otherwise
*09537850SAkhilesh Sanikop// both are inter frame predictions. The wedge flag describes the mask kind.
*09537850SAkhilesh Sanikop// |dest| is the output block.
*09537850SAkhilesh Sanikop// |dest_stride| is the corresponding stride for dest.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing MaskBlendFunc = void (*)(const void* prediction_0,
*09537850SAkhilesh Sanikop                               const void* prediction_1,
*09537850SAkhilesh Sanikop                               ptrdiff_t prediction_stride_1,
*09537850SAkhilesh Sanikop                               const uint8_t* mask, ptrdiff_t mask_stride,
*09537850SAkhilesh Sanikop                               int width, int height, void* dest,
*09537850SAkhilesh Sanikop                               ptrdiff_t dest_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Table of mask blending functions. Each entry points to one function with
*09537850SAkhilesh Sanikop// a specific setting:
*09537850SAkhilesh Sanikop// MaskBlendFunc[subsampling_x + subsampling_y][is_inter_intra].
*09537850SAkhilesh Sanikopusing MaskBlendFuncs = MaskBlendFunc[3][2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// This function is similar to MaskBlendFunc. It is only used when
*09537850SAkhilesh Sanikop// |is_inter_intra| is true and |bitdepth| == 8.
*09537850SAkhilesh Sanikop// |prediction_[01]| are Pixel values (uint8_t).
*09537850SAkhilesh Sanikop// |prediction_1| is both the second input and the output buffer.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing InterIntraMaskBlendFunc8bpp = void (*)(const uint8_t* prediction_0,
*09537850SAkhilesh Sanikop                                             uint8_t* prediction_1,
*09537850SAkhilesh Sanikop                                             ptrdiff_t prediction_stride_1,
*09537850SAkhilesh Sanikop                                             const uint8_t* mask,
*09537850SAkhilesh Sanikop                                             ptrdiff_t mask_stride, int width,
*09537850SAkhilesh Sanikop                                             int height);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Table of InterIntra8bpp mask blending functions. When is_wedge_inter_intra
*09537850SAkhilesh Sanikop// is false, the function at index 0 must be used. Otherwise, the function at
*09537850SAkhilesh Sanikop// index subsampling_x + subsampling_y must be used.
*09537850SAkhilesh Sanikopusing InterIntraMaskBlendFuncs8bpp = InterIntraMaskBlendFunc8bpp[3];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Obmc (overlapped block motion compensation) blending function signature.
*09537850SAkhilesh Sanikop// Section 7.11.3.10.
*09537850SAkhilesh Sanikop// This function takes two blocks and produces a blended output stored into the
*09537850SAkhilesh Sanikop// first input block. The blending is a weighted average process, controlled by
*09537850SAkhilesh Sanikop// values of the mask.
*09537850SAkhilesh Sanikop// Obmc is not a compound mode. It is different from other compound blending,
*09537850SAkhilesh Sanikop// in terms of precision. The current block is computed using convolution with
*09537850SAkhilesh Sanikop// clipping to the range of pixel values. Its above and left blocks are also
*09537850SAkhilesh Sanikop// clipped. Therefore obmc blending process doesn't need to clip the output.
*09537850SAkhilesh Sanikop// |prediction| is the first input block, which will be overwritten.
*09537850SAkhilesh Sanikop// |prediction_stride| is the stride, given in bytes.
*09537850SAkhilesh Sanikop// |width|, |height| are the same for both input blocks. The range is [4x2,
*09537850SAkhilesh Sanikop// 32x32] for kObmcDirectionVertical and [2x4, 32x32] for
*09537850SAkhilesh Sanikop// kObmcDirectionHorizontal, see Section 7.11.3.9.
*09537850SAkhilesh Sanikop// |obmc_prediction| is the second input block; |obmc_prediction_stride| is its
*09537850SAkhilesh Sanikop// stride, given in bytes. The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikop// ObmcBlendFuncs has kNumObmcDirections entries, presumably one per direction.
*09537850SAkhilesh Sanikopusing ObmcBlendFunc = void (*)(void* prediction, ptrdiff_t prediction_stride,
*09537850SAkhilesh Sanikop                               int width, int height,
*09537850SAkhilesh Sanikop                               const void* obmc_prediction,
*09537850SAkhilesh Sanikop                               ptrdiff_t obmc_prediction_stride);
*09537850SAkhilesh Sanikopusing ObmcBlendFuncs = ObmcBlendFunc[kNumObmcDirections];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Warp function signature. Section 7.11.3.5.
*09537850SAkhilesh Sanikop// This function applies warp filtering for each 8x8 block inside the current
*09537850SAkhilesh Sanikop// coding block. The filtering process is similar to 2d convolve filtering.
*09537850SAkhilesh Sanikop// The horizontal filter is applied followed by the vertical filter.
*09537850SAkhilesh Sanikop// The function has to calculate corresponding pixel positions before and
*09537850SAkhilesh Sanikop// after warping.
*09537850SAkhilesh Sanikop// |source| is the input reference frame buffer.
*09537850SAkhilesh Sanikop// |source_stride|, |source_width|, |source_height| are corresponding frame
*09537850SAkhilesh Sanikop// stride, width, and height. |source_stride| is given in bytes.
*09537850SAkhilesh Sanikop// |warp_params| is the matrix of warp motion: warp_params[i] = mN.
*09537850SAkhilesh Sanikop//         [x'     (m2 m3 m0   [x
*09537850SAkhilesh Sanikop//     z .  y'  =   m4 m5 m1 *  y
*09537850SAkhilesh Sanikop//          1]      m6 m7 1)    1]
*09537850SAkhilesh Sanikop// |subsampling_x/y| is the current frame's plane subsampling factor.
*09537850SAkhilesh Sanikop// |block_start_x| and |block_start_y| are the starting position of the current
*09537850SAkhilesh Sanikop// coding block.
*09537850SAkhilesh Sanikop// |block_width| and |block_height| are width and height of the current coding
*09537850SAkhilesh Sanikop// block. |block_width| and |block_height| are at least 8.
*09537850SAkhilesh Sanikop// |alpha|, |beta|, |gamma|, |delta| are valid warp parameters. See the
*09537850SAkhilesh Sanikop// comments in the definition of struct GlobalMotion for the range of their
*09537850SAkhilesh Sanikop// values.
*09537850SAkhilesh Sanikop// |dest| is the output buffer of type Pixel. The output values are clipped to
*09537850SAkhilesh Sanikop// Pixel values.
*09537850SAkhilesh Sanikop// |dest_stride| is the stride, in units of bytes.
*09537850SAkhilesh Sanikop// Rounding precision is derived from the function being called. For horizontal
*09537850SAkhilesh Sanikop// filtering kInterRoundBitsHorizontal & kInterRoundBitsHorizontal12bpp will be
*09537850SAkhilesh Sanikop// used. For vertical filtering kInterRoundBitsVertical &
*09537850SAkhilesh Sanikop// kInterRoundBitsVertical12bpp will be used.
*09537850SAkhilesh Sanikop//
*09537850SAkhilesh Sanikop// NOTE: WarpFunc assumes the source frame has left, right, top, and bottom
*09537850SAkhilesh Sanikop// borders that extend the frame boundary pixels.
*09537850SAkhilesh Sanikop// * The left and right borders must be at least 13 pixels wide. In addition,
*09537850SAkhilesh Sanikop//   Warp_NEON() may read up to 14 bytes after a row in the |source| buffer.
*09537850SAkhilesh Sanikop//   Therefore, there must be at least one extra padding byte after the right
*09537850SAkhilesh Sanikop//   border of the last row in the source buffer.
*09537850SAkhilesh Sanikop// * The top and bottom borders must be at least 13 pixels high.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing WarpFunc = void (*)(const void* source, ptrdiff_t source_stride,
*09537850SAkhilesh Sanikop                          int source_width, int source_height,
*09537850SAkhilesh Sanikop                          const int* warp_params, int subsampling_x,
*09537850SAkhilesh Sanikop                          int subsampling_y, int block_start_x,
*09537850SAkhilesh Sanikop                          int block_start_y, int block_width, int block_height,
*09537850SAkhilesh Sanikop                          int16_t alpha, int16_t beta, int16_t gamma,
*09537850SAkhilesh Sanikop                          int16_t delta, void* dest, ptrdiff_t dest_stride);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Warp for compound predictions. Section 7.11.3.5.
*09537850SAkhilesh Sanikop// Similar to WarpFunc, but |dest| is a uint16_t predictor buffer,
*09537850SAkhilesh Sanikop// |dest_stride| is given in units of uint16_t and the vertical rounding is
*09537850SAkhilesh Sanikop// always 7 bits (there is no |inter_round_bits_vertical| parameter).
*09537850SAkhilesh Sanikop// Rounding precision is derived from the function being called. For horizontal
*09537850SAkhilesh Sanikop// filtering kInterRoundBitsHorizontal & kInterRoundBitsHorizontal12bpp will be
*09537850SAkhilesh Sanikop// used. For vertical filtering kInterRoundBitsCompoundVertical will be used.
*09537850SAkhilesh Sanikopusing WarpCompoundFunc = WarpFunc;
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopconstexpr int kNumAutoRegressionLags = 4;
*09537850SAkhilesh Sanikop// Applies an auto-regressive filter to the white noise in |luma_grain_buffer|.
*09537850SAkhilesh Sanikop// Section 7.18.3.3, second code block.
*09537850SAkhilesh Sanikop// |params| are parameters read from the frame header, mainly providing
*09537850SAkhilesh Sanikop// auto_regression_coeff_y for the filter and auto_regression_shift to right
*09537850SAkhilesh Sanikop// shift the filter sum by. Note: This method assumes
*09537850SAkhilesh Sanikop// params.auto_regression_coeff_lag is not 0. Do not call this method if
*09537850SAkhilesh Sanikop// params.auto_regression_coeff_lag is 0.
*09537850SAkhilesh Sanikopusing LumaAutoRegressionFunc = void (*)(const FilmGrainParams& params,
*09537850SAkhilesh Sanikop                                        void* luma_grain_buffer);
*09537850SAkhilesh Sanikop// Function index is params.auto_regression_coeff_lag - 1 (lag 0 has no entry).
*09537850SAkhilesh Sanikopusing LumaAutoRegressionFuncs =
*09537850SAkhilesh Sanikop    LumaAutoRegressionFunc[kNumAutoRegressionLags - 1];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Applies an auto-regressive filter to the white noise in u_grain and v_grain.
*09537850SAkhilesh Sanikop// Section 7.18.3.3, third code block.
*09537850SAkhilesh Sanikop// The |luma_grain_buffer| provides samples that are added to the autoregressive
*09537850SAkhilesh Sanikop// sum when num_y_points > 0.
*09537850SAkhilesh Sanikop// |u_grain_buffer| and |v_grain_buffer| point to the buffers of chroma noise
*09537850SAkhilesh Sanikop// that were generated from the stored Gaussian sequence, and are overwritten
*09537850SAkhilesh Sanikop// with the results of the autoregressive filter. |params| are parameters read
*09537850SAkhilesh Sanikop// from the frame header, mainly providing auto_regression_coeff_u and
*09537850SAkhilesh Sanikop// auto_regression_coeff_v for each chroma plane's filter, and
*09537850SAkhilesh Sanikop// auto_regression_shift to right shift the filter sums by.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing ChromaAutoRegressionFunc = void (*)(const FilmGrainParams& params,
*09537850SAkhilesh Sanikop                                          const void* luma_grain_buffer,
*09537850SAkhilesh Sanikop                                          int subsampling_x, int subsampling_y,
*09537850SAkhilesh Sanikop                                          void* u_grain_buffer,
*09537850SAkhilesh Sanikop                                          void* v_grain_buffer);
*09537850SAkhilesh Sanikopusing ChromaAutoRegressionFuncs =
*09537850SAkhilesh Sanikop    ChromaAutoRegressionFunc[/*use_luma*/ 2][kNumAutoRegressionLags];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Builds an image-wide "stripe" of grain noise for every 32 rows in the image.
*09537850SAkhilesh Sanikop// Section 7.18.3.5, first code block.
*09537850SAkhilesh Sanikop// Each 32x32 luma block is copied at a random offset specified via
*09537850SAkhilesh Sanikop// |grain_seed| from the grain template produced by autoregression, and the same
*09537850SAkhilesh Sanikop// is done for chroma grains, subject to subsampling.
*09537850SAkhilesh Sanikop// |width| and |height| are the dimensions of the overall image.
*09537850SAkhilesh Sanikop// |noise_stripes_buffer| points to an Array2DView with one row for each stripe.
*09537850SAkhilesh Sanikop// Because this function treats all planes identically and independently, it is
*09537850SAkhilesh Sanikop// simplified to take one grain buffer at a time. This means duplicating some
*09537850SAkhilesh Sanikop// random number generations, but that work can be reduced in other ways.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing ConstructNoiseStripesFunc = void (*)(const void* grain_buffer,
*09537850SAkhilesh Sanikop                                           int grain_seed, int width,
*09537850SAkhilesh Sanikop                                           int height, int subsampling_x,
*09537850SAkhilesh Sanikop                                           int subsampling_y,
*09537850SAkhilesh Sanikop                                           void* noise_stripes_buffer);
*09537850SAkhilesh Sanikopusing ConstructNoiseStripesFuncs =
*09537850SAkhilesh Sanikop    ConstructNoiseStripesFunc[/*overlap_flag*/ 2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Computes the one or two overlap rows for each stripe copied to the noise
*09537850SAkhilesh Sanikop// image.
*09537850SAkhilesh Sanikop// Section 7.18.3.5, second code block. |width| and |height| are the
*09537850SAkhilesh Sanikop// dimensions of the overall image. |noise_stripes_buffer| points to an
*09537850SAkhilesh Sanikop// Array2DView with one row for each stripe. |noise_image_buffer| points to an
*09537850SAkhilesh Sanikop// Array2D containing the allocated plane for this frame. Because this function
*09537850SAkhilesh Sanikop// treats all planes identically and independently, it is simplified to take one
*09537850SAkhilesh Sanikop// grain buffer at a time.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing ConstructNoiseImageOverlapFunc =
*09537850SAkhilesh Sanikop    void (*)(const void* noise_stripes_buffer, int width, int height,
*09537850SAkhilesh Sanikop             int subsampling_x, int subsampling_y, void* noise_image_buffer);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Populate a scaling lookup table with interpolated values of a piecewise
*09537850SAkhilesh Sanikop// linear function where values in |point_value| are mapped to the values in
*09537850SAkhilesh Sanikop// |point_scaling|. |scaling_lut| is the output table; NOTE(review):
*09537850SAkhilesh Sanikop// |scaling_lut_length| is presumably its number of entries -- confirm.
*09537850SAkhilesh Sanikop// |num_points| can be between 0 and 15. When 0, the lookup table is set to
*09537850SAkhilesh Sanikop// zero. |point_value| and |point_scaling| have |num_points| valid elements.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikopusing InitializeScalingLutFunc = void (*)(int num_points,
*09537850SAkhilesh Sanikop                                          const uint8_t point_value[],
*09537850SAkhilesh Sanikop                                          const uint8_t point_scaling[],
*09537850SAkhilesh Sanikop                                          int16_t* scaling_lut,
*09537850SAkhilesh Sanikop                                          const int scaling_lut_length);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Blend noise with image. Section 7.18.3.5, third code block.
*09537850SAkhilesh Sanikop// |width| is the width of each row, while |height| is how many rows to compute.
*09537850SAkhilesh Sanikop// |start_height| is an offset for the noise image, to support multithreading.
*09537850SAkhilesh Sanikop// |min_value| and |max_value| (presumably max_luma or max_chroma) are computed
*09537850SAkhilesh Sanikop// by the caller of these functions, according to the code in the spec.
*09537850SAkhilesh Sanikop// |source_plane_y| and |source_plane_uv| are the plane buffers of the decoded
*09537850SAkhilesh Sanikop// frame. They are blended with the film grain noise and written to
*09537850SAkhilesh Sanikop// |dest_plane_y| and |dest_plane_uv| as final output for display.
*09537850SAkhilesh Sanikop// source_plane_* and dest_plane_* may point to the same buffer, in which case
*09537850SAkhilesh Sanikop// the film grain noise is added in place.
*09537850SAkhilesh Sanikop// |scaling_lut_y| and |scaling_lut| represent a piecewise linear mapping from
*09537850SAkhilesh Sanikop// the frame's raw pixel value, to a scaling factor for the noise sample.
*09537850SAkhilesh Sanikop// |scaling_shift| is applied as a right shift after scaling, so that scaling
*09537850SAkhilesh Sanikop// down is possible. It is found in FilmGrainParams, but supplied directly to
*09537850SAkhilesh Sanikop// BlendNoiseWithImageLumaFunc because it's the only member used.
*09537850SAkhilesh Sanikop// The dest plane may point to the source plane, depending on the value of
*09537850SAkhilesh Sanikop// frame_header.show_existing_frame. |noise_image_ptr| and scaling_lut.* do not
*09537850SAkhilesh Sanikop// alias other arguments.
*09537850SAkhilesh Sanikopusing BlendNoiseWithImageLumaFunc = void (*)(
*09537850SAkhilesh Sanikop    const void* noise_image_ptr, int min_value, int max_value,
*09537850SAkhilesh Sanikop    int scaling_shift, int width, int height, int start_height,
*09537850SAkhilesh Sanikop    const int16_t* scaling_lut_y, const void* source_plane_y,
*09537850SAkhilesh Sanikop    ptrdiff_t source_stride_y, void* dest_plane_y, ptrdiff_t dest_stride_y);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopusing BlendNoiseWithImageChromaFunc = void (*)(
*09537850SAkhilesh Sanikop    Plane plane, const FilmGrainParams& params, const void* noise_image_ptr,
*09537850SAkhilesh Sanikop    int min_value, int max_value, int width, int height, int start_height,
*09537850SAkhilesh Sanikop    int subsampling_x, int subsampling_y, const int16_t* scaling_lut,
*09537850SAkhilesh Sanikop    const void* source_plane_y, ptrdiff_t source_stride_y,
*09537850SAkhilesh Sanikop    const void* source_plane_uv, ptrdiff_t source_stride_uv,
*09537850SAkhilesh Sanikop    void* dest_plane_uv, ptrdiff_t dest_stride_uv);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopusing BlendNoiseWithImageChromaFuncs =
*09537850SAkhilesh Sanikop    BlendNoiseWithImageChromaFunc[/*chroma_scaling_from_luma*/ 2];
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop//------------------------------------------------------------------------------
*09537850SAkhilesh Sanikop// Groups the film grain function pointers and function tables declared above.
*09537850SAkhilesh Sanikopstruct FilmGrainFuncs {
*09537850SAkhilesh Sanikop  LumaAutoRegressionFuncs luma_auto_regression;
*09537850SAkhilesh Sanikop  ChromaAutoRegressionFuncs chroma_auto_regression;
*09537850SAkhilesh Sanikop  ConstructNoiseStripesFuncs construct_noise_stripes;
*09537850SAkhilesh Sanikop  ConstructNoiseImageOverlapFunc construct_noise_image_overlap;
*09537850SAkhilesh Sanikop  InitializeScalingLutFunc initialize_scaling_lut;
*09537850SAkhilesh Sanikop  BlendNoiseWithImageLumaFunc blend_noise_luma;
*09537850SAkhilesh Sanikop  BlendNoiseWithImageChromaFuncs blend_noise_chroma;
*09537850SAkhilesh Sanikop};
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Motion field projection function signature. Section 7.9.
*09537850SAkhilesh Sanikop// |reference_info| provides reference information for motion field projection.
*09537850SAkhilesh Sanikop// |reference_to_current_with_sign| is the precalculated reference frame id
*09537850SAkhilesh Sanikop// distance from the current frame.
*09537850SAkhilesh Sanikop// |dst_sign| is -1 for LAST_FRAME and LAST2_FRAME, or 0 (1 in spec) for others.
*09537850SAkhilesh Sanikop// |y8_start| and |y8_end| are the start and end 8x8 rows of the current tile.
*09537850SAkhilesh Sanikop// |x8_start| and |x8_end| are the start and end 8x8 columns of the current
*09537850SAkhilesh Sanikop// tile.
*09537850SAkhilesh Sanikop// |motion_field| is the output which saves the projected motion field
*09537850SAkhilesh Sanikop// information.
*09537850SAkhilesh Sanikop// Note: Only the entry from the 8-bit Dsp table is used as this function is
*09537850SAkhilesh Sanikop// bitdepth agnostic.
*09537850SAkhilesh Sanikopusing MotionFieldProjectionKernelFunc = void (*)(
*09537850SAkhilesh Sanikop    const ReferenceInfo& reference_info, int reference_to_current_with_sign,
*09537850SAkhilesh Sanikop    int dst_sign, int y8_start, int y8_end, int x8_start, int x8_end,
*09537850SAkhilesh Sanikop    TemporalMotionField* motion_field);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Compound temporal motion vector projection function signature.
*09537850SAkhilesh Sanikop// Section 7.9.3 and 7.10.2.10.
*09537850SAkhilesh Sanikop// |temporal_mvs| is the aligned set of temporal reference motion vectors.
*09537850SAkhilesh Sanikop// |temporal_reference_offsets| specifies the number of frames covered by the
*09537850SAkhilesh Sanikop// original motion vector.
*09537850SAkhilesh Sanikop// |reference_offsets| specifies the number of frames to be covered by the
*09537850SAkhilesh Sanikop// projected motion vector.
// It is declared as an array of two ints; as a function parameter it is
// passed as a pointer, so the bound of 2 is documentation only and is not
// enforced by the compiler.
*09537850SAkhilesh Sanikop// |count| is the number of the temporal motion vectors.
*09537850SAkhilesh Sanikop// |candidate_mvs| is the aligned set of projected motion vectors.
// It is the only non-const pointer argument, i.e. the output; the function
// itself returns nothing. Stored in Dsp::mv_projection_compound.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikop// Note: Only the entry from the 8-bit Dsp table is used as this function is
*09537850SAkhilesh Sanikop// bitdepth agnostic.
*09537850SAkhilesh Sanikopusing MvProjectionCompoundFunc = void (*)(
*09537850SAkhilesh Sanikop    const MotionVector* temporal_mvs, const int8_t* temporal_reference_offsets,
*09537850SAkhilesh Sanikop    const int reference_offsets[2], int count,
*09537850SAkhilesh Sanikop    CompoundMotionVector* candidate_mvs);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Single temporal motion vector projection function signature.
*09537850SAkhilesh Sanikop// Section 7.9.3 and 7.10.2.10.
*09537850SAkhilesh Sanikop// |temporal_mvs| is the aligned set of temporal reference motion vectors.
*09537850SAkhilesh Sanikop// |temporal_reference_offsets| specifies the number of frames covered by the
*09537850SAkhilesh Sanikop// original motion vector.
*09537850SAkhilesh Sanikop// |reference_offset| specifies the number of frames to be covered by the
*09537850SAkhilesh Sanikop// projected motion vector.
*09537850SAkhilesh Sanikop// |count| is the number of the temporal motion vectors.
*09537850SAkhilesh Sanikop// |candidate_mvs| is the aligned set of projected motion vectors.
// It is the only non-const pointer argument, i.e. the output; the function
// itself returns nothing. Stored in Dsp::mv_projection_single.
// Compared with MvProjectionCompoundFunc this takes a single
// |reference_offset| and writes MotionVector rather than CompoundMotionVector
// entries.
*09537850SAkhilesh Sanikop// The pointer arguments do not alias one another.
*09537850SAkhilesh Sanikop// Note: Only the entry from the 8-bit Dsp table is used as this function is
*09537850SAkhilesh Sanikop// bitdepth agnostic.
*09537850SAkhilesh Sanikopusing MvProjectionSingleFunc = void (*)(
*09537850SAkhilesh Sanikop    const MotionVector* temporal_mvs, const int8_t* temporal_reference_offsets,
*09537850SAkhilesh Sanikop    int reference_offset, int count, MotionVector* candidate_mvs);
*09537850SAkhilesh Sanikop
// Table of DSP function pointers and function pointer sub-tables. A table is
// looked up per bitdepth with GetDspTable() (or
// dsp_internal::GetWritableDspTable() for a mutable pointer); the function
// pointers are initialized by DspInit().
// Members are listed alphabetically by name.
*09537850SAkhilesh Sanikopstruct Dsp {
*09537850SAkhilesh Sanikop  AverageBlendFunc average_blend;
*09537850SAkhilesh Sanikop  CdefDirectionFunc cdef_direction;
*09537850SAkhilesh Sanikop  CdefFilteringFuncs cdef_filters;
*09537850SAkhilesh Sanikop  CflIntraPredictorFuncs cfl_intra_predictors;
*09537850SAkhilesh Sanikop  CflSubsamplerFuncs cfl_subsamplers;
*09537850SAkhilesh Sanikop  ConvolveFuncs convolve;
*09537850SAkhilesh Sanikop  ConvolveScaleFuncs convolve_scale;
*09537850SAkhilesh Sanikop  DirectionalIntraPredictorZone1Func directional_intra_predictor_zone1;
*09537850SAkhilesh Sanikop  DirectionalIntraPredictorZone2Func directional_intra_predictor_zone2;
*09537850SAkhilesh Sanikop  DirectionalIntraPredictorZone3Func directional_intra_predictor_zone3;
*09537850SAkhilesh Sanikop  DistanceWeightedBlendFunc distance_weighted_blend;
*09537850SAkhilesh Sanikop  FilmGrainFuncs film_grain;
*09537850SAkhilesh Sanikop  FilterIntraPredictorFunc filter_intra_predictor;
*09537850SAkhilesh Sanikop  InterIntraMaskBlendFuncs8bpp inter_intra_mask_blend_8bpp;
*09537850SAkhilesh Sanikop  IntraEdgeFilterFunc intra_edge_filter;
*09537850SAkhilesh Sanikop  IntraEdgeUpsamplerFunc intra_edge_upsampler;
*09537850SAkhilesh Sanikop  IntraPredictorFuncs intra_predictors;
*09537850SAkhilesh Sanikop  InverseTransformAddFuncs inverse_transforms;
*09537850SAkhilesh Sanikop  LoopFilterFuncs loop_filters;
*09537850SAkhilesh Sanikop  LoopRestorationFuncs loop_restorations;
*09537850SAkhilesh Sanikop  MaskBlendFuncs mask_blend;
  // The next three entries are bitdepth agnostic: only the ones in the 8-bit
  // Dsp table are used (see the notes on their function signatures).
  // NOTE(review): the meaning of the 3 indices of the mv_projection_* arrays
  // is not documented in this header — confirm against the implementations.
*09537850SAkhilesh Sanikop  MotionFieldProjectionKernelFunc motion_field_projection_kernel;
*09537850SAkhilesh Sanikop  MvProjectionCompoundFunc mv_projection_compound[3];
*09537850SAkhilesh Sanikop  MvProjectionSingleFunc mv_projection_single[3];
*09537850SAkhilesh Sanikop  ObmcBlendFuncs obmc_blend;
*09537850SAkhilesh Sanikop  SuperResCoefficientsFunc super_res_coefficients;
*09537850SAkhilesh Sanikop  SuperResFunc super_res;
*09537850SAkhilesh Sanikop  WarpCompoundFunc warp_compound;
*09537850SAkhilesh Sanikop  WarpFunc warp;
*09537850SAkhilesh Sanikop  WeightMaskFuncs weight_mask;
*09537850SAkhilesh Sanikop};
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Initializes function pointers based on build config and runtime
*09537850SAkhilesh Sanikop// environment. Must be called once before first use. This function is
*09537850SAkhilesh Sanikop// thread-safe.
// See dsp_internal::DspInit_C() for the C-only variant intended for tests,
// which is not thread-safe.
*09537850SAkhilesh Sanikopvoid DspInit();
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Returns the appropriate Dsp table for |bitdepth| or nullptr if one doesn't
*09537850SAkhilesh Sanikop// exist.
// The table is returned as a pointer to const, and the result can be nullptr,
// so callers should check it before use.
// dsp_internal::GetWritableDspTable() is the non-const counterpart.
*09537850SAkhilesh Sanikopconst Dsp* GetDspTable(int bitdepth);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop}  // namespace dsp
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikopnamespace dsp_internal {
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Visual Studio builds don't have a way to detect SSE4_1. Only exclude the C
*09537850SAkhilesh Sanikop// functions if /arch:AVX2 is used across all sources.
// When LIBGAV1_TARGETING_AVX2 is 0 (or undefined) and either _MSC_VER,
// _M_IX86 or _M_X64 is defined, LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS is forced to
// 1. This overrides any earlier value, including the default of 0 set near the
// top of this header.
// NOTE(review): LIBGAV1_TARGETING_AVX2 is defined outside this header
// (presumably in src/utils/cpu.h) — confirm.
*09537850SAkhilesh Sanikop#if !LIBGAV1_TARGETING_AVX2 && \
*09537850SAkhilesh Sanikop    (defined(_MSC_VER) || (defined(_M_IX86) || defined(_M_X64)))
*09537850SAkhilesh Sanikop#undef LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS
*09537850SAkhilesh Sanikop#define LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS 1
*09537850SAkhilesh Sanikop#endif
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Returns true if a more highly optimized version of |func| is not defined for
*09537850SAkhilesh Sanikop// the associated bitdepth or if it is forcibly enabled with
*09537850SAkhilesh Sanikop// LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS. The define checked for |func| corresponds
*09537850SAkhilesh Sanikop// to the LIBGAV1_Dsp<bitdepth>bpp_|func| define in the header file associated
*09537850SAkhilesh Sanikop// with the module.
*09537850SAkhilesh Sanikop// |func| is one of:
*09537850SAkhilesh Sanikop//   - FunctionName, e.g., SelfGuidedFilter.
*09537850SAkhilesh Sanikop//   - [sub-table-index1][...-indexN] e.g.,
*09537850SAkhilesh Sanikop//     TransformSize4x4_IntraPredictorDc. The indices correspond to enum values
*09537850SAkhilesh Sanikop//     used as lookups with leading 'k' removed.
*09537850SAkhilesh Sanikop//
*09537850SAkhilesh Sanikop// NEON support is the only extension available for ARM and it is always
*09537850SAkhilesh Sanikop// required. Because of this restriction DSP_ENABLED_8BPP_NEON(func) is always
*09537850SAkhilesh Sanikop// true and can be omitted.
//
// Each macro pastes |func| onto the LIBGAV1_Dsp<bitdepth>bpp_ prefix with ##
// and compares the resulting identifier against the matching LIBGAV1_CPU_*
// value. For example, DSP_ENABLED_8BPP_SSE4_1(Foo) expands to
//   (LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS ||
//    LIBGAV1_Dsp8bpp_Foo == LIBGAV1_CPU_SSE4_1)
// NOTE(review): these are presumably evaluated in #if directives, where an
// undefined LIBGAV1_Dsp<bitdepth>bpp_|func| evaluates to 0 — confirm at the
// use sites.
*09537850SAkhilesh Sanikop#define DSP_ENABLED_8BPP_AVX2(func)    \
*09537850SAkhilesh Sanikop  (LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS || \
*09537850SAkhilesh Sanikop   LIBGAV1_Dsp8bpp_##func == LIBGAV1_CPU_AVX2)
*09537850SAkhilesh Sanikop#define DSP_ENABLED_10BPP_AVX2(func)   \
*09537850SAkhilesh Sanikop  (LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS || \
*09537850SAkhilesh Sanikop   LIBGAV1_Dsp10bpp_##func == LIBGAV1_CPU_AVX2)
*09537850SAkhilesh Sanikop#define DSP_ENABLED_8BPP_SSE4_1(func)  \
*09537850SAkhilesh Sanikop  (LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS || \
*09537850SAkhilesh Sanikop   LIBGAV1_Dsp8bpp_##func == LIBGAV1_CPU_SSE4_1)
*09537850SAkhilesh Sanikop#define DSP_ENABLED_10BPP_SSE4_1(func) \
*09537850SAkhilesh Sanikop  (LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS || \
*09537850SAkhilesh Sanikop   LIBGAV1_Dsp10bpp_##func == LIBGAV1_CPU_SSE4_1)
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Initializes C-only function pointers. Note some entries may be set to
*09537850SAkhilesh Sanikop// nullptr if LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS is 0. This is meant for use in
*09537850SAkhilesh Sanikop// tests only, it is not thread-safe.
// LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS is always defined by this point: this
// header defaults it to 0 when the build does not set it.
*09537850SAkhilesh Sanikopvoid DspInit_C();
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop// Returns the appropriate Dsp table for |bitdepth| or nullptr if one doesn't
*09537850SAkhilesh Sanikop// exist. This version is meant for use by test or dsp/*Init() functions only.
// Unlike dsp::GetDspTable(), the returned pointer is non-const, so the table's
// entries can be modified through it.
*09537850SAkhilesh Sanikopdsp::Dsp* GetWritableDspTable(int bitdepth);
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop}  // namespace dsp_internal
*09537850SAkhilesh Sanikop}  // namespace libgav1
*09537850SAkhilesh Sanikop
*09537850SAkhilesh Sanikop#endif  // LIBGAV1_SRC_DSP_DSP_H_