libopus/celt/entdec.c

*a58d3d2aSXin Li/* Copyright (c) 2001-2011 Timothy B. Terriberry
*a58d3d2aSXin Li   Copyright (c) 2008-2009 Xiph.Org Foundation */
*a58d3d2aSXin Li/*
*a58d3d2aSXin Li   Redistribution and use in source and binary forms, with or without
*a58d3d2aSXin Li   modification, are permitted provided that the following conditions
*a58d3d2aSXin Li   are met:
*a58d3d2aSXin Li
*a58d3d2aSXin Li   - Redistributions of source code must retain the above copyright
*a58d3d2aSXin Li   notice, this list of conditions and the following disclaimer.
*a58d3d2aSXin Li
*a58d3d2aSXin Li   - Redistributions in binary form must reproduce the above copyright
*a58d3d2aSXin Li   notice, this list of conditions and the following disclaimer in the
*a58d3d2aSXin Li   documentation and/or other materials provided with the distribution.
*a58d3d2aSXin Li
*a58d3d2aSXin Li   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
*a58d3d2aSXin Li   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
*a58d3d2aSXin Li   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
*a58d3d2aSXin Li   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
*a58d3d2aSXin Li   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
*a58d3d2aSXin Li   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
*a58d3d2aSXin Li   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
*a58d3d2aSXin Li   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
*a58d3d2aSXin Li   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
*a58d3d2aSXin Li   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
*a58d3d2aSXin Li   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*a58d3d2aSXin Li*/
*a58d3d2aSXin Li
*a58d3d2aSXin Li#ifdef HAVE_CONFIG_H
*a58d3d2aSXin Li#include "config.h"
*a58d3d2aSXin Li#endif
*a58d3d2aSXin Li
*a58d3d2aSXin Li#include <stddef.h>
*a58d3d2aSXin Li#include "os_support.h"
*a58d3d2aSXin Li#include "arch.h"
*a58d3d2aSXin Li#include "entdec.h"
*a58d3d2aSXin Li#include "mfrngcod.h"
*a58d3d2aSXin Li
*a58d3d2aSXin Li/*A range decoder.
*a58d3d2aSXin Li  This is an entropy decoder based upon \cite{Mar79}, which is itself a
*a58d3d2aSXin Li   rediscovery of the FIFO arithmetic code introduced by \cite{Pas76}.
*a58d3d2aSXin Li  It is very similar to arithmetic encoding, except that encoding is done with
*a58d3d2aSXin Li   digits in any base, instead of with bits, and so it is faster when using
*a58d3d2aSXin Li   larger bases (i.e.: a byte).
*a58d3d2aSXin Li  The author claims an average waste of $\frac{1}{2}\log_b(2b)$ bits, where $b$
*a58d3d2aSXin Li   is the base, longer than the theoretical optimum, but to my knowledge there
*a58d3d2aSXin Li   is no published justification for this claim.
*a58d3d2aSXin Li  This only seems true when using near-infinite precision arithmetic so that
*a58d3d2aSXin Li   the process is carried out with no rounding errors.
*a58d3d2aSXin Li
*a58d3d2aSXin Li  An excellent description of implementation details is available at
*a58d3d2aSXin Li   http://www.arturocampos.com/ac_range.html
*a58d3d2aSXin Li  A recent work \cite{MNW98} which proposes several changes to arithmetic
*a58d3d2aSXin Li   encoding for efficiency actually re-discovers many of the principles
*a58d3d2aSXin Li   behind range encoding, and presents a good theoretical analysis of them.
*a58d3d2aSXin Li
*a58d3d2aSXin Li  End of stream is handled by writing out the smallest number of bits that
*a58d3d2aSXin Li   ensures that the stream will be correctly decoded regardless of the value of
*a58d3d2aSXin Li   any subsequent bits.
*a58d3d2aSXin Li  ec_tell() can be used to determine how many bits were needed to decode
*a58d3d2aSXin Li   all the symbols thus far; other data can be packed in the remaining bits of
*a58d3d2aSXin Li   the input buffer.
*a58d3d2aSXin Li  @PHDTHESIS{Pas76,
*a58d3d2aSXin Li    author="Richard Clark Pasco",
*a58d3d2aSXin Li    title="Source coding algorithms for fast data compression",
*a58d3d2aSXin Li    school="Dept. of Electrical Engineering, Stanford University",
*a58d3d2aSXin Li    address="Stanford, CA",
*a58d3d2aSXin Li    month=May,
*a58d3d2aSXin Li    year=1976
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  @INPROCEEDINGS{Mar79,
*a58d3d2aSXin Li   author="Martin, G.N.N.",
*a58d3d2aSXin Li   title="Range encoding: an algorithm for removing redundancy from a digitised
*a58d3d2aSXin Li    message",
*a58d3d2aSXin Li   booktitle="Video & Data Recording Conference",
*a58d3d2aSXin Li   year=1979,
*a58d3d2aSXin Li   address="Southampton",
*a58d3d2aSXin Li   month=Jul
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  @ARTICLE{MNW98,
*a58d3d2aSXin Li   author="Alistair Moffat and Radford Neal and Ian H. Witten",
*a58d3d2aSXin Li   title="Arithmetic Coding Revisited",
*a58d3d2aSXin Li   journal="{ACM} Transactions on Information Systems",
*a58d3d2aSXin Li   year=1998,
*a58d3d2aSXin Li   volume=16,
*a58d3d2aSXin Li   number=3,
*a58d3d2aSXin Li   pages="256--294",
*a58d3d2aSXin Li   month=Jul,
*a58d3d2aSXin Li   URL="http://www.stanford.edu/class/ee398a/handouts/papers/Moffat98ArithmCoding.pdf"
*a58d3d2aSXin Li  }*/
*a58d3d2aSXin Li
*a58d3d2aSXin Listatic int ec_read_byte(ec_dec *_this){
*a58d3d2aSXin Li  return _this->offs<_this->storage?_this->buf[_this->offs++]:0;
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Listatic int ec_read_byte_from_end(ec_dec *_this){
*a58d3d2aSXin Li  return _this->end_offs<_this->storage?
*a58d3d2aSXin Li   _this->buf[_this->storage-++(_this->end_offs)]:0;
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Li/*Normalizes the contents of val and rng so that rng lies entirely in the
*a58d3d2aSXin Li   high-order symbol.*/
*a58d3d2aSXin Listatic void ec_dec_normalize(ec_dec *_this){
*a58d3d2aSXin Li  /*If the range is too small, rescale it and input some bits.*/
*a58d3d2aSXin Li  while(_this->rng<=EC_CODE_BOT){
*a58d3d2aSXin Li    int sym;
*a58d3d2aSXin Li    _this->nbits_total+=EC_SYM_BITS;
*a58d3d2aSXin Li    _this->rng<<=EC_SYM_BITS;
*a58d3d2aSXin Li    /*Use up the remaining bits from our last symbol.*/
*a58d3d2aSXin Li    sym=_this->rem;
*a58d3d2aSXin Li    /*Read the next value from the input.*/
*a58d3d2aSXin Li    _this->rem=ec_read_byte(_this);
*a58d3d2aSXin Li    /*Take the rest of the bits we need from this new symbol.*/
*a58d3d2aSXin Li    sym=(sym<<EC_SYM_BITS|_this->rem)>>(EC_SYM_BITS-EC_CODE_EXTRA);
*a58d3d2aSXin Li    /*And subtract them from val, capped to be less than EC_CODE_TOP.*/
*a58d3d2aSXin Li    _this->val=((_this->val<<EC_SYM_BITS)+(EC_SYM_MAX&~sym))&(EC_CODE_TOP-1);
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Livoid ec_dec_init(ec_dec *_this,unsigned char *_buf,opus_uint32 _storage){
*a58d3d2aSXin Li  _this->buf=_buf;
*a58d3d2aSXin Li  _this->storage=_storage;
*a58d3d2aSXin Li  _this->end_offs=0;
*a58d3d2aSXin Li  _this->end_window=0;
*a58d3d2aSXin Li  _this->nend_bits=0;
*a58d3d2aSXin Li  /*This is the offset from which ec_tell() will subtract partial bits.
*a58d3d2aSXin Li    The final value after the ec_dec_normalize() call will be the same as in
*a58d3d2aSXin Li     the encoder, but we have to compensate for the bits that are added there.*/
*a58d3d2aSXin Li  _this->nbits_total=EC_CODE_BITS+1
*a58d3d2aSXin Li   -((EC_CODE_BITS-EC_CODE_EXTRA)/EC_SYM_BITS)*EC_SYM_BITS;
*a58d3d2aSXin Li  _this->offs=0;
*a58d3d2aSXin Li  _this->rng=1U<<EC_CODE_EXTRA;
*a58d3d2aSXin Li  _this->rem=ec_read_byte(_this);
*a58d3d2aSXin Li  _this->val=_this->rng-1-(_this->rem>>(EC_SYM_BITS-EC_CODE_EXTRA));
*a58d3d2aSXin Li  _this->error=0;
*a58d3d2aSXin Li  /*Normalize the interval.*/
*a58d3d2aSXin Li  ec_dec_normalize(_this);
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liunsigned ec_decode(ec_dec *_this,unsigned _ft){
*a58d3d2aSXin Li  unsigned s;
*a58d3d2aSXin Li  _this->ext=celt_udiv(_this->rng,_ft);
*a58d3d2aSXin Li  s=(unsigned)(_this->val/_this->ext);
*a58d3d2aSXin Li  return _ft-EC_MINI(s+1,_ft);
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liunsigned ec_decode_bin(ec_dec *_this,unsigned _bits){
*a58d3d2aSXin Li   unsigned s;
*a58d3d2aSXin Li   _this->ext=_this->rng>>_bits;
*a58d3d2aSXin Li   s=(unsigned)(_this->val/_this->ext);
*a58d3d2aSXin Li   return (1U<<_bits)-EC_MINI(s+1U,1U<<_bits);
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Livoid ec_dec_update(ec_dec *_this,unsigned _fl,unsigned _fh,unsigned _ft){
*a58d3d2aSXin Li  opus_uint32 s;
*a58d3d2aSXin Li  s=IMUL32(_this->ext,_ft-_fh);
*a58d3d2aSXin Li  _this->val-=s;
*a58d3d2aSXin Li  _this->rng=_fl>0?IMUL32(_this->ext,_fh-_fl):_this->rng-s;
*a58d3d2aSXin Li  ec_dec_normalize(_this);
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Li/*The probability of having a "one" is 1/(1<<_logp).*/
*a58d3d2aSXin Liint ec_dec_bit_logp(ec_dec *_this,unsigned _logp){
*a58d3d2aSXin Li  opus_uint32 r;
*a58d3d2aSXin Li  opus_uint32 d;
*a58d3d2aSXin Li  opus_uint32 s;
*a58d3d2aSXin Li  int         ret;
*a58d3d2aSXin Li  r=_this->rng;
*a58d3d2aSXin Li  d=_this->val;
*a58d3d2aSXin Li  s=r>>_logp;
*a58d3d2aSXin Li  ret=d<s;
*a58d3d2aSXin Li  if(!ret)_this->val=d-s;
*a58d3d2aSXin Li  _this->rng=ret?s:r-s;
*a58d3d2aSXin Li  ec_dec_normalize(_this);
*a58d3d2aSXin Li  return ret;
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liint ec_dec_icdf(ec_dec *_this,const unsigned char *_icdf,unsigned _ftb){
*a58d3d2aSXin Li  opus_uint32 r;
*a58d3d2aSXin Li  opus_uint32 d;
*a58d3d2aSXin Li  opus_uint32 s;
*a58d3d2aSXin Li  opus_uint32 t;
*a58d3d2aSXin Li  int         ret;
*a58d3d2aSXin Li  s=_this->rng;
*a58d3d2aSXin Li  d=_this->val;
*a58d3d2aSXin Li  r=s>>_ftb;
*a58d3d2aSXin Li  ret=-1;
*a58d3d2aSXin Li  do{
*a58d3d2aSXin Li    t=s;
*a58d3d2aSXin Li    s=IMUL32(r,_icdf[++ret]);
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  while(d<s);
*a58d3d2aSXin Li  _this->val=d-s;
*a58d3d2aSXin Li  _this->rng=t-s;
*a58d3d2aSXin Li  ec_dec_normalize(_this);
*a58d3d2aSXin Li  return ret;
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liint ec_dec_icdf16(ec_dec *_this,const opus_uint16 *_icdf,unsigned _ftb){
*a58d3d2aSXin Li  opus_uint32 r;
*a58d3d2aSXin Li  opus_uint32 d;
*a58d3d2aSXin Li  opus_uint32 s;
*a58d3d2aSXin Li  opus_uint32 t;
*a58d3d2aSXin Li  int         ret;
*a58d3d2aSXin Li  s=_this->rng;
*a58d3d2aSXin Li  d=_this->val;
*a58d3d2aSXin Li  r=s>>_ftb;
*a58d3d2aSXin Li  ret=-1;
*a58d3d2aSXin Li  do{
*a58d3d2aSXin Li    t=s;
*a58d3d2aSXin Li    s=IMUL32(r,_icdf[++ret]);
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  while(d<s);
*a58d3d2aSXin Li  _this->val=d-s;
*a58d3d2aSXin Li  _this->rng=t-s;
*a58d3d2aSXin Li  ec_dec_normalize(_this);
*a58d3d2aSXin Li  return ret;
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liopus_uint32 ec_dec_uint(ec_dec *_this,opus_uint32 _ft){
*a58d3d2aSXin Li  unsigned ft;
*a58d3d2aSXin Li  unsigned s;
*a58d3d2aSXin Li  int      ftb;
*a58d3d2aSXin Li  /*In order to optimize EC_ILOG(), it is undefined for the value 0.*/
*a58d3d2aSXin Li  celt_assert(_ft>1);
*a58d3d2aSXin Li  _ft--;
*a58d3d2aSXin Li  ftb=EC_ILOG(_ft);
*a58d3d2aSXin Li  if(ftb>EC_UINT_BITS){
*a58d3d2aSXin Li    opus_uint32 t;
*a58d3d2aSXin Li    ftb-=EC_UINT_BITS;
*a58d3d2aSXin Li    ft=(unsigned)(_ft>>ftb)+1;
*a58d3d2aSXin Li    s=ec_decode(_this,ft);
*a58d3d2aSXin Li    ec_dec_update(_this,s,s+1,ft);
*a58d3d2aSXin Li    t=(opus_uint32)s<<ftb|ec_dec_bits(_this,ftb);
*a58d3d2aSXin Li    if(t<=_ft)return t;
*a58d3d2aSXin Li    _this->error=1;
*a58d3d2aSXin Li    return _ft;
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  else{
*a58d3d2aSXin Li    _ft++;
*a58d3d2aSXin Li    s=ec_decode(_this,(unsigned)_ft);
*a58d3d2aSXin Li    ec_dec_update(_this,s,s+1,(unsigned)_ft);
*a58d3d2aSXin Li    return s;
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li}
*a58d3d2aSXin Li
*a58d3d2aSXin Liopus_uint32 ec_dec_bits(ec_dec *_this,unsigned _bits){
*a58d3d2aSXin Li  ec_window   window;
*a58d3d2aSXin Li  int         available;
*a58d3d2aSXin Li  opus_uint32 ret;
*a58d3d2aSXin Li  window=_this->end_window;
*a58d3d2aSXin Li  available=_this->nend_bits;
*a58d3d2aSXin Li  if((unsigned)available<_bits){
*a58d3d2aSXin Li    do{
*a58d3d2aSXin Li      window|=(ec_window)ec_read_byte_from_end(_this)<<available;
*a58d3d2aSXin Li      available+=EC_SYM_BITS;
*a58d3d2aSXin Li    }
*a58d3d2aSXin Li    while(available<=EC_WINDOW_SIZE-EC_SYM_BITS);
*a58d3d2aSXin Li  }
*a58d3d2aSXin Li  ret=(opus_uint32)window&(((opus_uint32)1<<_bits)-1U);
*a58d3d2aSXin Li  window>>=_bits;
*a58d3d2aSXin Li  available-=_bits;
*a58d3d2aSXin Li  _this->end_window=window;
*a58d3d2aSXin Li  _this->nend_bits=available;
*a58d3d2aSXin Li  _this->nbits_total+=_bits;
*a58d3d2aSXin Li  return ret;
*a58d3d2aSXin Li}