libopus/dnn/dred_decoder.c

*a58d3d2aSXin Li/* Copyright (c) 2022 Amazon
*a58d3d2aSXin Li   Written by Jan Buethe */
*a58d3d2aSXin Li/*
*a58d3d2aSXin Li   Redistribution and use in source and binary forms, with or without
*a58d3d2aSXin Li   modification, are permitted provided that the following conditions
*a58d3d2aSXin Li   are met:
*a58d3d2aSXin Li
*a58d3d2aSXin Li   - Redistributions of source code must retain the above copyright
*a58d3d2aSXin Li   notice, this list of conditions and the following disclaimer.
*a58d3d2aSXin Li
*a58d3d2aSXin Li   - Redistributions in binary form must reproduce the above copyright
*a58d3d2aSXin Li   notice, this list of conditions and the following disclaimer in the
*a58d3d2aSXin Li   documentation and/or other materials provided with the distribution.
*a58d3d2aSXin Li
*a58d3d2aSXin Li   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
*a58d3d2aSXin Li   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
*a58d3d2aSXin Li   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
*a58d3d2aSXin Li   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
*a58d3d2aSXin Li   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
*a58d3d2aSXin Li   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
*a58d3d2aSXin Li   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
*a58d3d2aSXin Li   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
*a58d3d2aSXin Li   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
*a58d3d2aSXin Li   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
*a58d3d2aSXin Li   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*a58d3d2aSXin Li*/
*a58d3d2aSXin Li
*a58d3d2aSXin Li#include <string.h>
*a58d3d2aSXin Li
*a58d3d2aSXin Li#ifdef HAVE_CONFIG_H
*a58d3d2aSXin Li#include "config.h"
*a58d3d2aSXin Li#endif
*a58d3d2aSXin Li
*a58d3d2aSXin Li#include "os_support.h"
*a58d3d2aSXin Li#include "dred_decoder.h"
*a58d3d2aSXin Li#include "dred_coding.h"
*a58d3d2aSXin Li#include "celt/entdec.h"
*a58d3d2aSXin Li#include "celt/laplace.h"
*a58d3d2aSXin Li#include "dred_rdovae_stats_data.h"
*a58d3d2aSXin Li#include "dred_rdovae_constants.h"
*a58d3d2aSXin Li
*a58d3d2aSXin Listatic void dred_decode_latents(ec_dec *dec, float *x, const opus_uint8 *scale, const opus_uint8 *r, const opus_uint8 *p0, int dim) {
*a58d3d2aSXin Li    int i;
*a58d3d2aSXin Li    for (i=0;i<dim;i++) {
*a58d3d2aSXin Li        int q;
*a58d3d2aSXin Li        if (r[i] == 0 || p0[i] == 255) q = 0;
*a58d3d2aSXin Li        else q = ec_laplace_decode_p0(dec, p0[i]<<7, r[i]<<7);
*a58d3d2aSXin Li        x[i] = q*256.f/(scale[i] == 0 ? 1 : scale[i]);
*a58d3d2aSXin Li    }
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liint dred_ec_decode(OpusDRED *dec, const opus_uint8 *bytes, int num_bytes, int min_feature_frames, int dred_frame_offset)
*a58d3d2aSXin Li{
*a58d3d2aSXin Li  ec_dec ec;
*a58d3d2aSXin Li  int q_level;
*a58d3d2aSXin Li  int i;
*a58d3d2aSXin Li  int offset;
*a58d3d2aSXin Li  int q0;
*a58d3d2aSXin Li  int dQ;
*a58d3d2aSXin Li  int qmax;
*a58d3d2aSXin Li  int state_qoffset;
*a58d3d2aSXin Li  int extra_offset;
*a58d3d2aSXin Li
*a58d3d2aSXin Li  /* since features are decoded in quadruples, it makes no sense to go with an uneven number of redundancy frames */
*a58d3d2aSXin Li  celt_assert(DRED_NUM_REDUNDANCY_FRAMES % 2 == 0);
*a58d3d2aSXin Li
*a58d3d2aSXin Li  /* decode initial state and initialize RDOVAE decoder */
*a58d3d2aSXin Li  ec_dec_init(&ec, (unsigned char*)bytes, num_bytes);
*a58d3d2aSXin Li  q0 = ec_dec_uint(&ec, 16);
*a58d3d2aSXin Li  dQ = ec_dec_uint(&ec, 8);
*a58d3d2aSXin Li  if (ec_dec_uint(&ec, 2)) extra_offset = 32*ec_dec_uint(&ec, 256);
*a58d3d2aSXin Li  else extra_offset = 0;
*a58d3d2aSXin Li  /* Compute total offset, including DRED position in a multiframe packet. */
*a58d3d2aSXin Li  dec->dred_offset = 16 - ec_dec_uint(&ec, 32) - extra_offset + dred_frame_offset;
*a58d3d2aSXin Li  /*printf("%d %d %d\n", dred_offset, q0, dQ);*/
*a58d3d2aSXin Li  qmax = 15;
*a58d3d2aSXin Li  if (q0 < 14 && dQ > 0) {
*a58d3d2aSXin Li    int nvals;
*a58d3d2aSXin Li    int ft;
*a58d3d2aSXin Li    int s;
*a58d3d2aSXin Li    /* The distribution for the dQmax symbol is split evenly between zero
*a58d3d2aSXin Li        (which implies qmax == 15) and larger values, with the probability of
*a58d3d2aSXin Li        all larger values being uniform.
*a58d3d2aSXin Li       This is equivalent to coding 1 bit to decide if the maximum is less than
*a58d3d2aSXin Li        15 followed by a uint to decide the actual value if it is less than
*a58d3d2aSXin Li        15, but combined into a single symbol. */
*a58d3d2aSXin Li    nvals = 15 - (q0 + 1);
*a58d3d2aSXin Li    ft = 2*nvals;
*a58d3d2aSXin Li    s = ec_decode(&ec, ft);
*a58d3d2aSXin Li    if (s >= nvals) {
*a58d3d2aSXin Li      qmax = q0 + (s - nvals) + 1;
*a58d3d2aSXin Li      ec_dec_update(&ec, s, s + 1, ft);
*a58d3d2aSXin Li    }
*a58d3d2aSXin Li    else {
*a58d3d2aSXin Li      ec_dec_update(&ec, 0, nvals, ft);
*a58d3d2aSXin Li    }
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  state_qoffset = q0*DRED_STATE_DIM;
*a58d3d2aSXin Li  dred_decode_latents(
*a58d3d2aSXin Li      &ec,
*a58d3d2aSXin Li      dec->state,
*a58d3d2aSXin Li      dred_state_quant_scales_q8 + state_qoffset,
*a58d3d2aSXin Li      dred_state_r_q8 + state_qoffset,
*a58d3d2aSXin Li      dred_state_p0_q8 + state_qoffset,
*a58d3d2aSXin Li      DRED_STATE_DIM);
*a58d3d2aSXin Li
*a58d3d2aSXin Li  /* decode newest to oldest and store oldest to newest */
*a58d3d2aSXin Li  for (i = 0; i < IMIN(DRED_NUM_REDUNDANCY_FRAMES, (min_feature_frames+1)/2); i += 2)
*a58d3d2aSXin Li  {
*a58d3d2aSXin Li      /* FIXME: Figure out how to avoid missing a last frame that would take up < 8 bits. */
*a58d3d2aSXin Li      if (8*num_bytes - ec_tell(&ec) <= 7)
*a58d3d2aSXin Li         break;
*a58d3d2aSXin Li      q_level = compute_quantizer(q0, dQ, qmax, i/2);
*a58d3d2aSXin Li      offset = q_level*DRED_LATENT_DIM;
*a58d3d2aSXin Li      dred_decode_latents(
*a58d3d2aSXin Li          &ec,
*a58d3d2aSXin Li          &dec->latents[(i/2)*DRED_LATENT_DIM],
*a58d3d2aSXin Li          dred_latent_quant_scales_q8 + offset,
*a58d3d2aSXin Li          dred_latent_r_q8 + offset,
*a58d3d2aSXin Li          dred_latent_p0_q8 + offset,
*a58d3d2aSXin Li          DRED_LATENT_DIM
*a58d3d2aSXin Li          );
*a58d3d2aSXin Li
*a58d3d2aSXin Li      offset = 2 * i * DRED_NUM_FEATURES;
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  dec->process_stage = 1;
*a58d3d2aSXin Li  dec->nb_latents = i/2;
*a58d3d2aSXin Li  return i/2;
*a58d3d2aSXin Li}