src/enc/vp8i_enc.h

*b2055c35SXin Li// Copyright 2011 Google Inc. All Rights Reserved.
*b2055c35SXin Li//
*b2055c35SXin Li// Use of this source code is governed by a BSD-style license
*b2055c35SXin Li// that can be found in the COPYING file in the root of the source
*b2055c35SXin Li// tree. An additional intellectual property rights grant can be found
*b2055c35SXin Li// in the file PATENTS. All contributing project authors may
*b2055c35SXin Li// be found in the AUTHORS file in the root of the source tree.
*b2055c35SXin Li// -----------------------------------------------------------------------------
*b2055c35SXin Li//
*b2055c35SXin Li//   WebP encoder: internal header.
*b2055c35SXin Li//
*b2055c35SXin Li// Author: Skal ([email protected])
*b2055c35SXin Li
*b2055c35SXin Li#ifndef WEBP_ENC_VP8I_ENC_H_
*b2055c35SXin Li#define WEBP_ENC_VP8I_ENC_H_
*b2055c35SXin Li
*b2055c35SXin Li#include <string.h>     // for memcpy()
*b2055c35SXin Li#include "src/dec/common_dec.h"
*b2055c35SXin Li#include "src/dsp/dsp.h"
*b2055c35SXin Li#include "src/utils/bit_writer_utils.h"
*b2055c35SXin Li#include "src/utils/thread_utils.h"
*b2055c35SXin Li#include "src/utils/utils.h"
*b2055c35SXin Li#include "src/webp/encode.h"
*b2055c35SXin Li
*b2055c35SXin Li#ifdef __cplusplus
*b2055c35SXin Liextern "C" {
*b2055c35SXin Li#endif
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// Various defines and enums
*b2055c35SXin Li
*b2055c35SXin Li// Encoder version numbers, as major.minor.revision (here: 1.4.0)
*b2055c35SXin Li#define ENC_MAJ_VERSION 1
*b2055c35SXin Li#define ENC_MIN_VERSION 4
*b2055c35SXin Li#define ENC_REV_VERSION 0
*b2055c35SXin Li
*b2055c35SXin Lienum { MAX_LF_LEVELS = 64,       // Number of loop filter levels (sizes LFStats)
*b2055c35SXin Li       MAX_VARIABLE_LEVEL = 67,  // last (inclusive) level with variable cost
*b2055c35SXin Li       MAX_LEVEL = 2047          // max level (note: max codable is 2047 + 67)
*b2055c35SXin Li     };
*b2055c35SXin Li
*b2055c35SXin Litypedef enum {   // Rate-distortion optimization levels (cf. VP8Decimate())
*b2055c35SXin Li  RD_OPT_NONE        = 0,  // no rd-opt
*b2055c35SXin Li  RD_OPT_BASIC       = 1,  // basic scoring (no trellis)
*b2055c35SXin Li  RD_OPT_TRELLIS     = 2,  // perform trellis-quant on the final decision only
*b2055c35SXin Li  RD_OPT_TRELLIS_ALL = 3   // trellis-quant for every scoring (much slower)
*b2055c35SXin Li} VP8RDLevel;
*b2055c35SXin Li
*b2055c35SXin Li// YUV-cache parameters. Cache is 32-bytes wide (= one cacheline).
*b2055c35SXin Li// The original or reconstructed samples can be accessed using VP8Scan[].
*b2055c35SXin Li// The predicted blocks can be accessed using offsets to yuv_p_ and
*b2055c35SXin Li// the arrays VP8*ModeOffsets[].
*b2055c35SXin Li// * YUV Samples area (yuv_in_/yuv_out_/yuv_out2_)
*b2055c35SXin Li//   (see VP8Scan[] for accessing the blocks, along with
*b2055c35SXin Li//   Y_OFF_ENC/U_OFF_ENC/V_OFF_ENC):
*b2055c35SXin Li//             +----+----+
*b2055c35SXin Li//  Y_OFF_ENC  |YYYY|UUVV|
*b2055c35SXin Li//  U_OFF_ENC  |YYYY|UUVV|
*b2055c35SXin Li//  V_OFF_ENC  |YYYY|....| <- 25% wasted U/V area
*b2055c35SXin Li//             |YYYY|....|
*b2055c35SXin Li//             +----+----+
*b2055c35SXin Li// * Prediction area ('yuv_p_', size = PRED_SIZE_ENC)
*b2055c35SXin Li//   Intra16 predictions (16x16 block each, two per row):
*b2055c35SXin Li//         |I16DC16|I16TM16|
*b2055c35SXin Li//         |I16VE16|I16HE16|
*b2055c35SXin Li//   Chroma U/V predictions (16x8 block each, two per row):
*b2055c35SXin Li//         |C8DC8|C8TM8|
*b2055c35SXin Li//         |C8VE8|C8HE8|
*b2055c35SXin Li//   Intra 4x4 predictions (4x4 block each)
*b2055c35SXin Li//         |I4DC4 I4TM4 I4VE4 I4HE4|I4RD4 I4VR4 I4LD4 I4VL4|
*b2055c35SXin Li//         |I4HD4 I4HU4 I4TMP .....|.......................| <- ~31% wasted
*b2055c35SXin Li#define YUV_SIZE_ENC (BPS * 16)   // size of one samples area: 16 rows of BPS
*b2055c35SXin Li#define PRED_SIZE_ENC (32 * BPS + 16 * BPS + 8 * BPS)   // I16+Chroma+I4 preds
*b2055c35SXin Li#define Y_OFF_ENC    (0)          // luma block starts at the row origin
*b2055c35SXin Li#define U_OFF_ENC    (16)         // U block sits right after the 16 luma columns
*b2055c35SXin Li#define V_OFF_ENC    (16 + 8)     // V block sits right after the 8 U columns
*b2055c35SXin Li
*b2055c35SXin Liextern const uint16_t VP8Scan[16];   // offsets to the blocks of a samples area
*b2055c35SXin Liextern const uint16_t VP8UVModeOffsets[4];   // chroma pred. offsets in yuv_p_
*b2055c35SXin Liextern const uint16_t VP8I16ModeOffsets[4];  // intra16 pred. offsets in yuv_p_
*b2055c35SXin Liextern const uint16_t VP8I4ModeOffsets[NUM_BMODES];  // intra4 pred. offsets
*b2055c35SXin Li
*b2055c35SXin Li// Layout of prediction blocks (offsets, using a stride of BPS per row)
*b2055c35SXin Li// intra 16x16: two rows of two 16x16 blocks each
*b2055c35SXin Li#define I16DC16 (0 * 16 * BPS)
*b2055c35SXin Li#define I16TM16 (I16DC16 + 16)
*b2055c35SXin Li#define I16VE16 (1 * 16 * BPS)
*b2055c35SXin Li#define I16HE16 (I16VE16 + 16)
*b2055c35SXin Li// chroma 8x8, two U/V blocks side by side (hence: 16x8 each)
*b2055c35SXin Li#define C8DC8 (2 * 16 * BPS)
*b2055c35SXin Li#define C8TM8 (C8DC8 + 1 * 16)
*b2055c35SXin Li#define C8VE8 (2 * 16 * BPS + 8 * BPS)
*b2055c35SXin Li#define C8HE8 (C8VE8 + 1 * 16)
*b2055c35SXin Li// intra 4x4: eight blocks on the first row, the rest starts 4 rows below
*b2055c35SXin Li#define I4DC4 (3 * 16 * BPS +  0)
*b2055c35SXin Li#define I4TM4 (I4DC4 +  4)
*b2055c35SXin Li#define I4VE4 (I4DC4 +  8)
*b2055c35SXin Li#define I4HE4 (I4DC4 + 12)
*b2055c35SXin Li#define I4RD4 (I4DC4 + 16)
*b2055c35SXin Li#define I4VR4 (I4DC4 + 20)
*b2055c35SXin Li#define I4LD4 (I4DC4 + 24)
*b2055c35SXin Li#define I4VL4 (I4DC4 + 28)
*b2055c35SXin Li#define I4HD4 (3 * 16 * BPS + 4 * BPS)
*b2055c35SXin Li#define I4HU4 (I4HD4 + 4)
*b2055c35SXin Li#define I4TMP (I4HD4 + 8)
*b2055c35SXin Li
*b2055c35SXin Litypedef int64_t score_t;     // type used for scores, rate, distortion
*b2055c35SXin Li// Note that MAX_COST is deliberately smaller than the largest value a score_t
*b2055c35SXin Li// can hold: this leaves headroom for computations that would otherwise overflow.
*b2055c35SXin Li#define MAX_COST ((score_t)0x7fffffffffffffLL)
*b2055c35SXin Li
*b2055c35SXin Li#define QFIX 17   // number of bits shifted out by QUANTDIV()
*b2055c35SXin Li#define BIAS(b)  ((b) << (QFIX - 8))   // 'b' shifted left by (QFIX - 8) bits
*b2055c35SXin Li// Returns (n * iQ + B) >> QFIX, evaluated in uint32_t arithmetic. Fun fact: the
*b2055c35SXin Li// shift is the _only_ place where we're actually being lossy and discarding bits.
*b2055c35SXin Listatic WEBP_INLINE int QUANTDIV(uint32_t n, uint32_t iQ, uint32_t B) {
*b2055c35SXin Li  return (int)((n * iQ + B) >> QFIX);
*b2055c35SXin Li}
*b2055c35SXin Li
*b2055c35SXin Li// Uncomment the following to remove token-buffer code:
*b2055c35SXin Li// #define DISABLE_TOKEN_BUFFER
*b2055c35SXin Li
*b2055c35SXin Li// Quality threshold: error-diffusion is enabled for qualities below this value.
*b2055c35SXin Li#define ERROR_DIFFUSION_QUALITY 98
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// Headers
*b2055c35SXin Li
*b2055c35SXin Litypedef uint32_t proba_t;   // two 16-bit halves in one 32-bit word (16b + 16b)
*b2055c35SXin Litypedef uint8_t ProbaArray[NUM_CTX][NUM_PROBAS];   // one byte per [ctx][proba]
*b2055c35SXin Litypedef proba_t StatsArray[NUM_CTX][NUM_PROBAS];   // one proba_t per [ctx][proba]
*b2055c35SXin Litypedef uint16_t CostArray[NUM_CTX][MAX_VARIABLE_LEVEL + 1];   // per-level costs
*b2055c35SXin Litypedef const uint16_t* (*CostArrayPtr)[NUM_CTX];   // for easy casting
*b2055c35SXin Litypedef const uint16_t* CostArrayMap[16][NUM_CTX];  // 16 x NUM_CTX cost pointers
*b2055c35SXin Litypedef double LFStats[NUM_MB_SEGMENTS][MAX_LF_LEVELS];  // filter stats
*b2055c35SXin Li
*b2055c35SXin Litypedef struct VP8Encoder VP8Encoder;   // struct is defined further below
*b2055c35SXin Li
*b2055c35SXin Li// Segment features (stored in VP8Encoder as 'segment_hdr_').
*b2055c35SXin Litypedef struct {
*b2055c35SXin Li  int num_segments_;      // Actual number of segments. 1 segment only = unused.
*b2055c35SXin Li  int update_map_;        // whether to update the segment map or not.
*b2055c35SXin Li                          // must be 0 if there's only 1 segment.
*b2055c35SXin Li  int size_;              // bit-cost for transmitting the segment map
*b2055c35SXin Li} VP8EncSegmentHeader;
*b2055c35SXin Li
*b2055c35SXin Li// Frame-persistent probabilities, along with their statistics and cost tables.
*b2055c35SXin Litypedef struct {
*b2055c35SXin Li  uint8_t segments_[3];     // probabilities for segment tree
*b2055c35SXin Li  uint8_t skip_proba_;      // final probability of being skipped.
*b2055c35SXin Li  ProbaArray coeffs_[NUM_TYPES][NUM_BANDS];      // probabilities, 1056 bytes
*b2055c35SXin Li  StatsArray stats_[NUM_TYPES][NUM_BANDS];       // statistics, 4224 bytes
*b2055c35SXin Li  CostArray level_cost_[NUM_TYPES][NUM_BANDS];   // level costs, 13056 bytes
*b2055c35SXin Li  CostArrayMap remapped_costs_[NUM_TYPES];       // cost pointers, 1536 bytes
*b2055c35SXin Li  int dirty_;               // if true, need to call VP8CalculateLevelCosts()
*b2055c35SXin Li  int use_skip_proba_;      // Note: we always use skip_proba for now.
*b2055c35SXin Li  int nb_skip_;             // number of skipped blocks
*b2055c35SXin Li} VP8EncProba;
*b2055c35SXin Li
*b2055c35SXin Li// Filter parameters. Not actually used by the encoding code itself (we don't
*b2055c35SXin Li// perform the in-loop filtering), but filled from the user's config.
*b2055c35SXin Litypedef struct {
*b2055c35SXin Li  int simple_;             // filtering type: 0=complex, 1=simple
*b2055c35SXin Li  int level_;              // base filter level [0..63]
*b2055c35SXin Li  int sharpness_;          // [0..7]
*b2055c35SXin Li  int i4x4_lf_delta_;      // delta filter level for i4x4 relative to i16x16
*b2055c35SXin Li} VP8EncFilterHeader;
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// Information about the macroblocks.
*b2055c35SXin Li
*b2055c35SXin Litypedef struct {   // per-macroblock info, packed in bit-fields
*b2055c35SXin Li  // block type
*b2055c35SXin Li  unsigned int type_:2;     // 0=i4x4, 1=i16x16
*b2055c35SXin Li  unsigned int uv_mode_:2;  // chroma mode (2 bits)
*b2055c35SXin Li  unsigned int skip_:1;     // skip flag (1 bit)
*b2055c35SXin Li  unsigned int segment_:2;  // segment index (2 bits)
*b2055c35SXin Li  uint8_t alpha_;      // quantization-susceptibility
*b2055c35SXin Li} VP8MBInfo;
*b2055c35SXin Li
*b2055c35SXin Litypedef struct VP8Matrix {   // quantization parameters, 16 entries per array
*b2055c35SXin Li  uint16_t q_[16];        // quantizer steps
*b2055c35SXin Li  uint16_t iq_[16];       // reciprocals, fixed point.
*b2055c35SXin Li  uint32_t bias_[16];     // rounding bias
*b2055c35SXin Li  uint32_t zthresh_[16];  // value below which a coefficient is zeroed
*b2055c35SXin Li  uint16_t sharpen_[16];  // frequency boosters for slight sharpening
*b2055c35SXin Li} VP8Matrix;
*b2055c35SXin Li
*b2055c35SXin Litypedef struct {   // per-segment parameters (VP8Encoder holds one per segment)
*b2055c35SXin Li  VP8Matrix y1_, y2_, uv_;  // quantization matrices
*b2055c35SXin Li  int alpha_;      // quant-susceptibility, range [-127,127]. Zero is neutral.
*b2055c35SXin Li                   // Lower values indicate a lower risk of blurriness.
*b2055c35SXin Li  int beta_;       // filter-susceptibility, range [0,255].
*b2055c35SXin Li  int quant_;      // final segment quantizer.
*b2055c35SXin Li  int fstrength_;  // final in-loop filtering strength
*b2055c35SXin Li  int max_edge_;   // max edge delta (for filtering strength)
*b2055c35SXin Li  int min_disto_;  // minimum distortion required to trigger filtering record
*b2055c35SXin Li  // reactivities
*b2055c35SXin Li  int lambda_i16_, lambda_i4_, lambda_uv_;
*b2055c35SXin Li  int lambda_mode_, lambda_trellis_, tlambda_;
*b2055c35SXin Li  int lambda_trellis_i16_, lambda_trellis_i4_, lambda_trellis_uv_;
*b2055c35SXin Li
*b2055c35SXin Li  // lambda values for distortion-based evaluation
*b2055c35SXin Li  score_t i4_penalty_;   // penalty for using Intra4
*b2055c35SXin Li} VP8SegmentInfo;
*b2055c35SXin Li
*b2055c35SXin Litypedef int8_t DError[2 /* u/v */][2 /* top or left */];  // diffusion errors
*b2055c35SXin Li
*b2055c35SXin Li// Handy transient struct to accumulate score and info during RD-optimization
*b2055c35SXin Li// and mode evaluation (it is the 'rd' argument of VP8Decimate()).
*b2055c35SXin Litypedef struct {
*b2055c35SXin Li  score_t D, SD;              // Distortion, spectral distortion
*b2055c35SXin Li  score_t H, R, score;        // header bits, rate, score.
*b2055c35SXin Li  int16_t y_dc_levels[16];    // Quantized levels for luma-DC, luma-AC, chroma.
*b2055c35SXin Li  int16_t y_ac_levels[16][16];
*b2055c35SXin Li  int16_t uv_levels[4 + 4][16];   // presumably 4 U + 4 V blocks -- TODO confirm
*b2055c35SXin Li  int mode_i16;               // mode number for intra16 prediction
*b2055c35SXin Li  uint8_t modes_i4[16];       // mode numbers for intra4 predictions
*b2055c35SXin Li  int mode_uv;                // mode number of chroma prediction
*b2055c35SXin Li  uint32_t nz;                // non-zero blocks
*b2055c35SXin Li  int8_t derr[2][3];          // DC diffusion errors for U/V for blocks #1/2/3
*b2055c35SXin Li} VP8ModeScore;
*b2055c35SXin Li
*b2055c35SXin Li// Iterator structure to iterate through macroblocks, pointing to the
*b2055c35SXin Li// right neighbouring data (samples, predictions, contexts, ...).
*b2055c35SXin Litypedef struct {
*b2055c35SXin Li  int x_, y_;                      // position of the current macroblock
*b2055c35SXin Li  uint8_t*      yuv_in_;           // input samples
*b2055c35SXin Li  uint8_t*      yuv_out_;          // output samples
*b2055c35SXin Li  uint8_t*      yuv_out2_;         // secondary buffer swapped with yuv_out_.
*b2055c35SXin Li  uint8_t*      yuv_p_;            // scratch buffer for prediction
*b2055c35SXin Li  VP8Encoder*   enc_;              // back-pointer
*b2055c35SXin Li  VP8MBInfo*    mb_;               // info for the current macroblock
*b2055c35SXin Li  VP8BitWriter* bw_;               // current bit-writer
*b2055c35SXin Li  uint8_t*      preds_;            // intra mode predictors (4x4 blocks)
*b2055c35SXin Li  uint32_t*     nz_;               // non-zero pattern
*b2055c35SXin Li  uint8_t       i4_boundary_[37];  // 32+5 boundary samples needed by intra4x4
*b2055c35SXin Li  uint8_t*      i4_top_;           // pointer to the current top boundary sample
*b2055c35SXin Li  int           i4_;               // current intra4x4 mode being tested
*b2055c35SXin Li  int           top_nz_[9];        // top-non-zero context.
*b2055c35SXin Li  int           left_nz_[9];       // left-non-zero. left_nz[8] is independent.
*b2055c35SXin Li  uint64_t      bit_count_[4][3];  // bit counters for coded levels.
*b2055c35SXin Li  uint64_t      luma_bits_;        // macroblock bit-cost for luma
*b2055c35SXin Li  uint64_t      uv_bits_;          // macroblock bit-cost for chroma
*b2055c35SXin Li  LFStats*      lf_stats_;         // filter stats (borrowed from enc_)
*b2055c35SXin Li  int           do_trellis_;       // if true, perform extra level optimisation
*b2055c35SXin Li  int           count_down_;       // number of mb still to be processed
*b2055c35SXin Li  int           count_down0_;      // starting counter value (for progress)
*b2055c35SXin Li  int           percent0_;         // saved initial progress percent
*b2055c35SXin Li
*b2055c35SXin Li  DError        left_derr_;        // left error diffusion (u/v)
*b2055c35SXin Li  DError*       top_derr_;         // top diffusion error - NULL if disabled
*b2055c35SXin Li
*b2055c35SXin Li  uint8_t* y_left_;    // left luma samples (addressable from index -1 to 15).
*b2055c35SXin Li  uint8_t* u_left_;    // left u samples (addressable from index -1 to 7)
*b2055c35SXin Li  uint8_t* v_left_;    // left v samples (addressable from index -1 to 7)
*b2055c35SXin Li
*b2055c35SXin Li  uint8_t* y_top_;     // top luma samples at position 'x_'
*b2055c35SXin Li  uint8_t* uv_top_;    // top u/v samples at position 'x_', packed as 16 bytes
*b2055c35SXin Li
*b2055c35SXin Li  // backing memory for y_left_/u_left_/v_left_ (plus alignment slack)
*b2055c35SXin Li  uint8_t yuv_left_mem_[17 + 16 + 16 + 8 + WEBP_ALIGN_CST];
*b2055c35SXin Li  // backing memory for yuv_*: three samples areas + the prediction area
*b2055c35SXin Li  uint8_t yuv_mem_[3 * YUV_SIZE_ENC + PRED_SIZE_ENC + WEBP_ALIGN_CST];
*b2055c35SXin Li} VP8EncIterator;
*b2055c35SXin Li
*b2055c35SXin Li  // in iterator.c
*b2055c35SXin Li// Must be called first: sets up 'it' for the encoder 'enc'.
*b2055c35SXin Livoid VP8IteratorInit(VP8Encoder* const enc, VP8EncIterator* const it);
*b2055c35SXin Li// Restarts a scan.
*b2055c35SXin Livoid VP8IteratorReset(VP8EncIterator* const it);
*b2055c35SXin Li// Resets the iterator position to row 'y'.
*b2055c35SXin Livoid VP8IteratorSetRow(VP8EncIterator* const it, int y);
*b2055c35SXin Li// Sets the count down (= number of iterations to go).
*b2055c35SXin Livoid VP8IteratorSetCountDown(VP8EncIterator* const it, int count_down);
*b2055c35SXin Li// Returns true if the iteration is finished.
*b2055c35SXin Liint VP8IteratorIsDone(const VP8EncIterator* const it);
*b2055c35SXin Li// Imports uncompressed samples from source.
*b2055c35SXin Li// If tmp_32 is not NULL, boundary samples are imported too.
*b2055c35SXin Li// tmp_32 is a 32-byte scratch buffer that must be aligned in memory.
*b2055c35SXin Livoid VP8IteratorImport(VP8EncIterator* const it, uint8_t* const tmp_32);
*b2055c35SXin Li// Exports decimated samples.
*b2055c35SXin Livoid VP8IteratorExport(const VP8EncIterator* const it);
*b2055c35SXin Li// Goes to next macroblock. Returns false if not finished. NOTE(review): the polarity looks inverted -- confirm in iterator.c.
*b2055c35SXin Liint VP8IteratorNext(VP8EncIterator* const it);
*b2055c35SXin Li// Saves the yuv_out_ boundary values to top_/left_ arrays for next iterations.
*b2055c35SXin Livoid VP8IteratorSaveBoundary(VP8EncIterator* const it);
*b2055c35SXin Li// Reports progression based on macroblock rows. Returns 0 for user-abort request.
*b2055c35SXin Liint VP8IteratorProgress(const VP8EncIterator* const it, int delta);
*b2055c35SXin Li// Intra4x4 iterations
*b2055c35SXin Livoid VP8IteratorStartI4(VP8EncIterator* const it);
*b2055c35SXin Li// Returns true if not done.
*b2055c35SXin Liint VP8IteratorRotateI4(VP8EncIterator* const it,
*b2055c35SXin Li                        const uint8_t* const yuv_out);
*b2055c35SXin Li
*b2055c35SXin Li// Non-zero context setup/teardown (presumably nz_ <-> top_nz_/left_nz_ -- TODO confirm)
*b2055c35SXin Livoid VP8IteratorNzToBytes(VP8EncIterator* const it);
*b2055c35SXin Livoid VP8IteratorBytesToNz(VP8EncIterator* const it);
*b2055c35SXin Li
*b2055c35SXin Li// Helper functions to set mode, skip and segment properties through 'it'
*b2055c35SXin Livoid VP8SetIntra16Mode(const VP8EncIterator* const it, int mode);
*b2055c35SXin Livoid VP8SetIntra4Mode(const VP8EncIterator* const it, const uint8_t* modes);
*b2055c35SXin Livoid VP8SetIntraUVMode(const VP8EncIterator* const it, int mode);
*b2055c35SXin Livoid VP8SetSkip(const VP8EncIterator* const it, int skip);
*b2055c35SXin Livoid VP8SetSegment(const VP8EncIterator* const it, int segment);
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// Paginated token buffer
*b2055c35SXin Li
*b2055c35SXin Litypedef struct VP8Tokens VP8Tokens;  // struct details in token.c
*b2055c35SXin Li
*b2055c35SXin Litypedef struct {   // only 'error_' remains if DISABLE_TOKEN_BUFFER is defined
*b2055c35SXin Li#if !defined(DISABLE_TOKEN_BUFFER)
*b2055c35SXin Li  VP8Tokens* pages_;        // first page
*b2055c35SXin Li  VP8Tokens** last_page_;   // last page
*b2055c35SXin Li  uint16_t* tokens_;        // set to (*last_page_)->tokens_
*b2055c35SXin Li  int left_;                // how many free tokens left before the page is full
*b2055c35SXin Li  int page_size_;           // number of tokens per page
*b2055c35SXin Li#endif
*b2055c35SXin Li  int error_;         // true in case of malloc error
*b2055c35SXin Li} VP8TBuffer;
*b2055c35SXin Li
*b2055c35SXin Li// Initializes an empty buffer ('page_size': cf. VP8TBuffer's page_size_).
*b2055c35SXin Livoid VP8TBufferInit(VP8TBuffer* const b, int page_size);
*b2055c35SXin Livoid VP8TBufferClear(VP8TBuffer* const b);   // de-allocates the pages' memory
*b2055c35SXin Li
*b2055c35SXin Li#if !defined(DISABLE_TOKEN_BUFFER)
*b2055c35SXin Li
*b2055c35SXin Li// Finalizes the bitstream once the probabilities 'probas' are known.
*b2055c35SXin Li// Deletes the allocated token memory if final_pass is true.
*b2055c35SXin Liint VP8EmitTokens(VP8TBuffer* const b, VP8BitWriter* const bw,
*b2055c35SXin Li                  const uint8_t* const probas, int final_pass);
*b2055c35SXin Li
*b2055c35SXin Li// Records the coding of coefficients without knowing the probabilities yet.
*b2055c35SXin Liint VP8RecordCoeffTokens(int ctx, const struct VP8Residual* const res,
*b2055c35SXin Li                         VP8TBuffer* const tokens);
*b2055c35SXin Li
*b2055c35SXin Li// Estimates the final coded size given a set of 'probas'.
*b2055c35SXin Lisize_t VP8EstimateTokenSize(VP8TBuffer* const b, const uint8_t* const probas);
*b2055c35SXin Li
*b2055c35SXin Li#endif  // !DISABLE_TOKEN_BUFFER
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// VP8Encoder
*b2055c35SXin Li
*b2055c35SXin Listruct VP8Encoder {
*b2055c35SXin Li  const WebPConfig* config_;    // user configuration and parameters
*b2055c35SXin Li  WebPPicture* pic_;            // input / output picture
*b2055c35SXin Li
*b2055c35SXin Li  // headers
*b2055c35SXin Li  VP8EncFilterHeader   filter_hdr_;     // filtering information
*b2055c35SXin Li  VP8EncSegmentHeader  segment_hdr_;    // segment information
*b2055c35SXin Li
*b2055c35SXin Li  int profile_;                      // VP8's profile, deduced from Config.
*b2055c35SXin Li
*b2055c35SXin Li  // dimension, in macroblock units.
*b2055c35SXin Li  int mb_w_, mb_h_;
*b2055c35SXin Li  int preds_w_;   // stride of the *preds_ prediction plane (=4*mb_w + 1)
*b2055c35SXin Li
*b2055c35SXin Li  // number of partitions (1, 2, 4 or 8 = MAX_NUM_PARTITIONS)
*b2055c35SXin Li  int num_parts_;
*b2055c35SXin Li
*b2055c35SXin Li  // per-partition boolean encoders (bit writers).
*b2055c35SXin Li  VP8BitWriter bw_;                         // part0
*b2055c35SXin Li  VP8BitWriter parts_[MAX_NUM_PARTITIONS];  // token partitions
*b2055c35SXin Li  VP8TBuffer tokens_;                       // token buffer
*b2055c35SXin Li
*b2055c35SXin Li  int percent_;                             // for progress
*b2055c35SXin Li
*b2055c35SXin Li  // transparency blob
*b2055c35SXin Li  int has_alpha_;
*b2055c35SXin Li  uint8_t* alpha_data_;       // non-NULL if transparency is present
*b2055c35SXin Li  uint32_t alpha_data_size_;
*b2055c35SXin Li  WebPWorker alpha_worker_;
*b2055c35SXin Li
*b2055c35SXin Li  // quantization info (one set of DC/AC dequant factor per segment)
*b2055c35SXin Li  VP8SegmentInfo dqm_[NUM_MB_SEGMENTS];
*b2055c35SXin Li  int base_quant_;                 // nominal quantizer value. Only used
*b2055c35SXin Li                                   // for relative coding of segments' quant.
*b2055c35SXin Li  int alpha_;                      // global susceptibility (<=> complexity)
*b2055c35SXin Li  int uv_alpha_;                   // U/V quantization susceptibility
*b2055c35SXin Li  // global offset of quantizers, shared by all segments
*b2055c35SXin Li  int dq_y1_dc_;
*b2055c35SXin Li  int dq_y2_dc_, dq_y2_ac_;
*b2055c35SXin Li  int dq_uv_dc_, dq_uv_ac_;
*b2055c35SXin Li
*b2055c35SXin Li  // probabilities and statistics
*b2055c35SXin Li  VP8EncProba proba_;
*b2055c35SXin Li  uint64_t    sse_[4];      // sum of Y/U/V/A squared errors for all macroblocks
*b2055c35SXin Li  uint64_t    sse_count_;   // pixel count for the sse_[] stats
*b2055c35SXin Li  int         coded_size_;
*b2055c35SXin Li  int         residual_bytes_[3][4];
*b2055c35SXin Li  int         block_count_[3];
*b2055c35SXin Li
*b2055c35SXin Li  // quality/speed settings
*b2055c35SXin Li  int method_;               // 0=fastest, 6=best/slowest.
*b2055c35SXin Li  VP8RDLevel rd_opt_level_;  // Deduced from method_.
*b2055c35SXin Li  int max_i4_header_bits_;   // partition #0 safeness factor
*b2055c35SXin Li  int mb_header_limit_;      // rough limit for header bits per MB
*b2055c35SXin Li  int thread_level_;         // derived from config->thread_level
*b2055c35SXin Li  int do_search_;            // derived from config->target_XXX
*b2055c35SXin Li  int use_tokens_;           // if true, use token buffer
*b2055c35SXin Li
*b2055c35SXin Li  // Memory
*b2055c35SXin Li  VP8MBInfo* mb_info_;   // contextual macroblock infos (mb_w_ + 1)
*b2055c35SXin Li  uint8_t*   preds_;     // predictions modes: (4*mb_w+1) * (4*mb_h+1)
*b2055c35SXin Li  uint32_t*  nz_;        // non-zero bit context: mb_w+1
*b2055c35SXin Li  uint8_t*   y_top_;     // top luma samples.
*b2055c35SXin Li  uint8_t*   uv_top_;    // top u/v samples.
*b2055c35SXin Li                         // U and V are packed into 16 bytes (8 U + 8 V)
*b2055c35SXin Li  LFStats*   lf_stats_;  // autofilter stats (if NULL, autofilter is off)
*b2055c35SXin Li  DError*    top_derr_;  // diffusion error (NULL if disabled)
*b2055c35SXin Li};
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li// internal functions. Not public.
*b2055c35SXin Li
*b2055c35SXin Li  // in tree.c
*b2055c35SXin Liextern const uint8_t VP8CoeffsProba0[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
*b2055c35SXin Liextern const uint8_t
*b2055c35SXin Li    VP8CoeffsUpdateProba[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
*b2055c35SXin Li// Resets the token probabilities to their initial (default) values.
*b2055c35SXin Livoid VP8DefaultProbas(VP8Encoder* const enc);
*b2055c35SXin Li// Writes the token probabilities 'probas' using the bit-writer 'bw'.
*b2055c35SXin Livoid VP8WriteProbas(VP8BitWriter* const bw, const VP8EncProba* const probas);
*b2055c35SXin Li// Writes the partition #0 modes (that is: all intra modes).
*b2055c35SXin Livoid VP8CodeIntraModes(VP8Encoder* const enc);
*b2055c35SXin Li
*b2055c35SXin Li  // in syntax.c
*b2055c35SXin Li// Generates the final bitstream by coding the partition0 and headers,
*b2055c35SXin Li// and appending an assembly of all the pre-coded token partitions.
*b2055c35SXin Li// Returns true if everything is ok.
*b2055c35SXin Liint VP8EncWrite(VP8Encoder* const enc);
*b2055c35SXin Li// Releases the memory allocated for bit-writing in VP8EncLoop & seq.
*b2055c35SXin Livoid VP8EncFreeBitWriters(VP8Encoder* const enc);
*b2055c35SXin Li
*b2055c35SXin Li  // in frame.c
*b2055c35SXin Liextern const uint8_t VP8Cat3[];
*b2055c35SXin Liextern const uint8_t VP8Cat4[];
*b2055c35SXin Liextern const uint8_t VP8Cat5[];
*b2055c35SXin Liextern const uint8_t VP8Cat6[];
*b2055c35SXin Li
*b2055c35SXin Li// Forms all four Intra16x16 predictions in the yuv_p_ cache.
*b2055c35SXin Livoid VP8MakeLuma16Preds(const VP8EncIterator* const it);
*b2055c35SXin Li// Forms all four Chroma8x8 predictions in the yuv_p_ cache.
*b2055c35SXin Livoid VP8MakeChroma8Preds(const VP8EncIterator* const it);
*b2055c35SXin Li// Forms all ten Intra4x4 predictions in the yuv_p_ cache
*b2055c35SXin Li// for the 4x4 block it->i4_.
*b2055c35SXin Livoid VP8MakeIntra4Preds(const VP8EncIterator* const it);
*b2055c35SXin Li// Rate calculation
*b2055c35SXin Liint VP8GetCostLuma16(VP8EncIterator* const it, const VP8ModeScore* const rd);
*b2055c35SXin Liint VP8GetCostLuma4(VP8EncIterator* const it, const int16_t levels[16]);
*b2055c35SXin Liint VP8GetCostUV(VP8EncIterator* const it, const VP8ModeScore* const rd);
*b2055c35SXin Li// Main coding calls
*b2055c35SXin Liint VP8EncLoop(VP8Encoder* const enc);
*b2055c35SXin Liint VP8EncTokenLoop(VP8Encoder* const enc);
*b2055c35SXin Li
*b2055c35SXin Li  // in webpenc.c
*b2055c35SXin Li// Assigns an error code to a picture. Returns false for convenience.
*b2055c35SXin Liint WebPEncodingSetError(const WebPPicture* const pic, WebPEncodingError error);
*b2055c35SXin Liint WebPReportProgress(const WebPPicture* const pic,
*b2055c35SXin Li                       int percent, int* const percent_store);  // contract: see webpenc.c
*b2055c35SXin Li
*b2055c35SXin Li  // in analysis.c
*b2055c35SXin Li// Main analysis loop. Decides the segmentations and complexity.
*b2055c35SXin Li// Assigns a first guess for the Intra16 and uvmode_ prediction modes.
*b2055c35SXin Liint VP8EncAnalyze(VP8Encoder* const enc);
*b2055c35SXin Li
*b2055c35SXin Li  // in quant.c
*b2055c35SXin Li// Sets up the segments' quantization values, base_quant_ and filter strengths.
*b2055c35SXin Livoid VP8SetSegmentParams(VP8Encoder* const enc, float quality);
*b2055c35SXin Li// Picks the best modes and fills the levels in 'rd'. Returns true if skipped.
*b2055c35SXin Liint VP8Decimate(VP8EncIterator* WEBP_RESTRICT const it,
*b2055c35SXin Li                VP8ModeScore* WEBP_RESTRICT const rd,
*b2055c35SXin Li                VP8RDLevel rd_opt);
*b2055c35SXin Li
*b2055c35SXin Li  // in alpha.c
*b2055c35SXin Livoid VP8EncInitAlpha(VP8Encoder* const enc);    // initializes alpha compression
*b2055c35SXin Liint VP8EncStartAlpha(VP8Encoder* const enc);    // starts alpha coding process
*b2055c35SXin Liint VP8EncFinishAlpha(VP8Encoder* const enc);   // finalizes compressed data
*b2055c35SXin Liint VP8EncDeleteAlpha(VP8Encoder* const enc);   // deletes compressed data
*b2055c35SXin Li
*b2055c35SXin Li// autofilter
*b2055c35SXin Livoid VP8InitFilter(VP8EncIterator* const it);
*b2055c35SXin Livoid VP8StoreFilterStats(VP8EncIterator* const it);
*b2055c35SXin Livoid VP8AdjustFilterStrength(VP8EncIterator* const it);
*b2055c35SXin Li
*b2055c35SXin Li// Returns the approximate filtering strength needed to smooth an edge
*b2055c35SXin Li// step of 'delta', given a sharpness parameter 'sharpness'.
*b2055c35SXin Liint VP8FilterStrengthFromDelta(int sharpness, int delta);
*b2055c35SXin Li
*b2055c35SXin Li  // misc utils for picture_*.c:
*b2055c35SXin Li
*b2055c35SXin Li// Returns true if 'picture' is non-NULL and dimensions/colorspace are within
*b2055c35SXin Li// their valid ranges. If returning false, the 'error_code' in 'picture' is
*b2055c35SXin Li// updated.
*b2055c35SXin Liint WebPValidatePicture(const WebPPicture* const picture);
*b2055c35SXin Li
*b2055c35SXin Li// Removes the references to the ARGB/YUVA buffers (doesn't free anything).
*b2055c35SXin Livoid WebPPictureResetBuffers(WebPPicture* const picture);
*b2055c35SXin Li
*b2055c35SXin Li// Allocates ARGB buffer according to set width/height (previous one is
*b2055c35SXin Li// always freed). Preserves the YUV(A) buffer. Returns false in case of error
*b2055c35SXin Li// (invalid param, out-of-memory).
*b2055c35SXin Liint WebPPictureAllocARGB(WebPPicture* const picture);
*b2055c35SXin Li
*b2055c35SXin Li// Allocates YUVA buffer according to set width/height (previous one is always
*b2055c35SXin Li// freed). Uses picture->csp to determine whether an alpha buffer is needed.
*b2055c35SXin Li// Preserves the ARGB buffer.
*b2055c35SXin Li// Returns false in case of error (invalid param, out-of-memory).
*b2055c35SXin Liint WebPPictureAllocYUVA(WebPPicture* const picture);
*b2055c35SXin Li
*b2055c35SXin Li// Replaces samples that are fully transparent by 'color' to help compressibility
*b2055c35SXin Li// (no guarantee, though). Assumes pic->use_argb is true.
*b2055c35SXin Livoid WebPReplaceTransparentPixels(WebPPicture* const pic, uint32_t color);
*b2055c35SXin Li
*b2055c35SXin Li//------------------------------------------------------------------------------
*b2055c35SXin Li
*b2055c35SXin Li#ifdef __cplusplus
*b2055c35SXin Li}    // extern "C"
*b2055c35SXin Li#endif
*b2055c35SXin Li
*b2055c35SXin Li#endif  // WEBP_ENC_VP8I_ENC_H_