// Copyright 2011 Google Inc. All Rights Reserved.
//
// Use of this source code is governed by a BSD-style license
// that can be found in the COPYING file in the root of the source
// tree. An additional intellectual property rights grant can be found
// in the file PATENTS. All contributing project authors may
// be found in the AUTHORS file in the root of the source tree.
// -----------------------------------------------------------------------------
//
//   WebP encoder: internal header.
//
// Author: Skal (pascal.massimino@gmail.com)

#ifndef WEBP_ENC_VP8I_ENC_H_
#define WEBP_ENC_VP8I_ENC_H_

#include <string.h>     // for memcpy()
#include "src/dec/common_dec.h"
#include "src/dsp/dsp.h"
#include "src/utils/bit_writer_utils.h"
#include "src/utils/thread_utils.h"
#include "src/utils/utils.h"
#include "src/webp/encode.h"

#ifdef __cplusplus
extern "C" {
#endif

//------------------------------------------------------------------------------
// Various defines and enums

// Encoder version numbers (major / minor / revision).
#define ENC_MAJ_VERSION 1
#define ENC_MIN_VERSION 4
#define ENC_REV_VERSION 0

// Coding limits used to size tables and bound coefficient levels.
enum {
  MAX_LF_LEVELS = 64,       // Maximum loop filter level
  MAX_VARIABLE_LEVEL = 67,  // last (inclusive) level with variable cost
  MAX_LEVEL = 2047          // max level (note: max codable is 2047 + 67)
};

// Rate-distortion optimization levels, ordered from cheapest to most
// thorough. The numeric values are explicit and must stay stable.
typedef enum {
  RD_OPT_NONE        = 0,  // no rd-opt
  RD_OPT_BASIC       = 1,  // basic scoring (no trellis)
  RD_OPT_TRELLIS     = 2,  // perform trellis-quant on the final decision only
  RD_OPT_TRELLIS_ALL = 3   // trellis-quant for every scoring (much slower)
} VP8RDLevel;

// YUV-cache parameters. Cache is 32-bytes wide (= one cacheline).
// The original or reconstructed samples can be accessed using VP8Scan[].
// The predicted blocks can be accessed using offsets to yuv_p_ and
// the arrays VP8*ModeOffsets[].
// * YUV Samples area (yuv_in_/yuv_out_/yuv_out2_)
//   (see VP8Scan[] for accessing the blocks, along with
//   Y_OFF_ENC/U_OFF_ENC/V_OFF_ENC):
//             +----+----+
//  Y_OFF_ENC  |YYYY|UUVV|
//  U_OFF_ENC  |YYYY|UUVV|
//  V_OFF_ENC  |YYYY|....| <- 25% wasted U/V area
//             |YYYY|....|
//             +----+----+
// * Prediction area ('yuv_p_', size = PRED_SIZE_ENC)
//   Intra16 predictions (16x16 block each, two per row):
//         |I16DC16|I16TM16|
//         |I16VE16|I16HE16|
//   Chroma U/V predictions (16x8 block each, two per row):
//         |C8DC8|C8TM8|
//         |C8VE8|C8HE8|
//   Intra 4x4 predictions (4x4 block each)
//         |I4DC4 I4TM4 I4VE4 I4HE4|I4RD4 I4VR4 I4LD4 I4VL4|
//         |I4HD4 I4HU4 I4TMP .....|.......................| <- ~31% wasted
//
// Sizes are expressed in bytes, as a number of BPS-wide rows:
//   YUV_SIZE_ENC  = 16 rows (one 16x16 luma block next to the chroma blocks)
//   PRED_SIZE_ENC = 32 rows (I16) + 16 rows (chroma) + 8 rows (I4)
// The *_OFF_ENC values are byte offsets of each plane within a samples area.
#define YUV_SIZE_ENC (BPS * 16)
#define PRED_SIZE_ENC (32 * BPS + 16 * BPS + 8 * BPS)   // I16+Chroma+I4 preds
#define Y_OFF_ENC    (0)
#define U_OFF_ENC    (16)
#define V_OFF_ENC    (16 + 8)

78*b2055c35SXin Li extern const uint16_t VP8Scan[16];
79*b2055c35SXin Li extern const uint16_t VP8UVModeOffsets[4];
80*b2055c35SXin Li extern const uint16_t VP8I16ModeOffsets[4];
81*b2055c35SXin Li extern const uint16_t VP8I4ModeOffsets[NUM_BMODES];
82*b2055c35SXin Li 
// Layout of prediction blocks: byte offsets into the prediction area
// (rows are BPS bytes wide).
// intra 16x16: two 16-pixel-wide blocks per row, two rows of blocks.
#define I16DC16 (0 * 16 * BPS)
#define I16TM16 (I16DC16 + 16)
#define I16VE16 (1 * 16 * BPS)
#define I16HE16 (I16VE16 + 16)
// chroma 8x8, two U/V blocks side by side (hence: 16x8 each)
#define C8DC8 (2 * 16 * BPS)
#define C8TM8 (C8DC8 + 1 * 16)
#define C8VE8 (2 * 16 * BPS + 8 * BPS)
#define C8HE8 (C8VE8 + 1 * 16)
// intra 4x4: eight 4-pixel-wide blocks on the first row of blocks,
// the remaining ones (plus a temporary slot) on the second.
#define I4DC4 (3 * 16 * BPS +  0)
#define I4TM4 (I4DC4 +  4)
#define I4VE4 (I4DC4 +  8)
#define I4HE4 (I4DC4 + 12)
#define I4RD4 (I4DC4 + 16)
#define I4VR4 (I4DC4 + 20)
#define I4LD4 (I4DC4 + 24)
#define I4VL4 (I4DC4 + 28)
#define I4HD4 (3 * 16 * BPS + 4 * BPS)
#define I4HU4 (I4HD4 + 4)
#define I4TMP (I4HD4 + 8)

typedef int64_t score_t;     // type used for scores, rate, distortion
// Note that MAX_COST is not the maximum allowed by sizeof(score_t),
// in order to allow overflowing computations.
// (i.e. there is headroom above MAX_COST so that sums involving it still
// fit in a score_t.)
#define MAX_COST ((score_t)0x7fffffffffffffLL)

// Number of bits dropped by the final shift in QUANTDIV().
#define QFIX 17
// Shifts 'b' left by (QFIX - 8) bits.
// NOTE(review): presumably rescales a bias given with 8 fractional bits to
// QFIX fractional bits -- confirm against the callers.
#define BIAS(b)  ((b) << (QFIX - 8))
// Fun fact: this is the _only_ line where we're actually being lossy and
// discarding bits.
// Returns (n * iQ + B) >> QFIX, converted to int.
// The product and sum are evaluated in uint32_t, so they wrap modulo 2^32:
// callers must keep 'n * iQ + B' within 32 bits.
static WEBP_INLINE int QUANTDIV(uint32_t n, uint32_t iQ, uint32_t B) {
  return (int)((n * iQ + B) >> QFIX);
}

// Uncomment the following to remove token-buffer code:
// #define DISABLE_TOKEN_BUFFER

// quality below which error-diffusion is enabled
#define ERROR_DIFFUSION_QUALITY 98

126*b2055c35SXin Li //------------------------------------------------------------------------------
127*b2055c35SXin Li // Headers
128*b2055c35SXin Li 
129*b2055c35SXin Li typedef uint32_t proba_t;   // 16b + 16b
130*b2055c35SXin Li typedef uint8_t ProbaArray[NUM_CTX][NUM_PROBAS];
131*b2055c35SXin Li typedef proba_t StatsArray[NUM_CTX][NUM_PROBAS];
132*b2055c35SXin Li typedef uint16_t CostArray[NUM_CTX][MAX_VARIABLE_LEVEL + 1];
133*b2055c35SXin Li typedef const uint16_t* (*CostArrayPtr)[NUM_CTX];   // for easy casting
134*b2055c35SXin Li typedef const uint16_t* CostArrayMap[16][NUM_CTX];
135*b2055c35SXin Li typedef double LFStats[NUM_MB_SEGMENTS][MAX_LF_LEVELS];  // filter stats
136*b2055c35SXin Li 
137*b2055c35SXin Li typedef struct VP8Encoder VP8Encoder;
138*b2055c35SXin Li 
// segment features
typedef struct {
  int num_segments_;      // Actual number of segments. 1 segment only = unused.
  int update_map_;        // whether to update the segment map or not.
                          // must be 0 if there's only 1 segment.
  int size_;              // bit-cost for transmitting the segment map
} VP8EncSegmentHeader;

147*b2055c35SXin Li // Struct collecting all frame-persistent probabilities.
148*b2055c35SXin Li typedef struct {
149*b2055c35SXin Li   uint8_t segments_[3];     // probabilities for segment tree
150*b2055c35SXin Li   uint8_t skip_proba_;      // final probability of being skipped.
151*b2055c35SXin Li   ProbaArray coeffs_[NUM_TYPES][NUM_BANDS];      // 1056 bytes
152*b2055c35SXin Li   StatsArray stats_[NUM_TYPES][NUM_BANDS];       // 4224 bytes
153*b2055c35SXin Li   CostArray level_cost_[NUM_TYPES][NUM_BANDS];   // 13056 bytes
154*b2055c35SXin Li   CostArrayMap remapped_costs_[NUM_TYPES];       // 1536 bytes
155*b2055c35SXin Li   int dirty_;               // if true, need to call VP8CalculateLevelCosts()
156*b2055c35SXin Li   int use_skip_proba_;      // Note: we always use skip_proba for now.
157*b2055c35SXin Li   int nb_skip_;             // number of skipped blocks
158*b2055c35SXin Li } VP8EncProba;
159*b2055c35SXin Li 
// Filter parameters. Not actually used in the code (we don't perform
// the in-loop filtering), but filled from user's config
typedef struct {
  int simple_;             // filtering type: 0=complex, 1=simple
  int level_;              // base filter level [0..63]
  int sharpness_;          // [0..7]
  int i4x4_lf_delta_;      // delta filter level for i4x4 relative to i16x16
} VP8EncFilterHeader;

//------------------------------------------------------------------------------
// Information about the macroblocks.

// Per-macroblock coding decisions, packed into bit-fields.
typedef struct {
  // block type
  unsigned int type_:2;     // 0=i4x4, 1=i16x16
  unsigned int uv_mode_:2;  // chroma prediction mode (2 bits)
  unsigned int skip_:1;     // skip flag (1 bit)
  unsigned int segment_:2;  // segment index (2 bits)
  uint8_t alpha_;      // quantization-susceptibility
} VP8MBInfo;

// Quantization matrix: one entry per coefficient of a 4x4 block.
typedef struct VP8Matrix {
  uint16_t q_[16];        // quantizer steps
  uint16_t iq_[16];       // reciprocals, fixed point.
  uint32_t bias_[16];     // rounding bias
  uint32_t zthresh_[16];  // value below which a coefficient is zeroed
  uint16_t sharpen_[16];  // frequency boosters for slight sharpening
} VP8Matrix;

189*b2055c35SXin Li typedef struct {
190*b2055c35SXin Li   VP8Matrix y1_, y2_, uv_;  // quantization matrices
191*b2055c35SXin Li   int alpha_;      // quant-susceptibility, range [-127,127]. Zero is neutral.
192*b2055c35SXin Li                    // Lower values indicate a lower risk of blurriness.
193*b2055c35SXin Li   int beta_;       // filter-susceptibility, range [0,255].
194*b2055c35SXin Li   int quant_;      // final segment quantizer.
195*b2055c35SXin Li   int fstrength_;  // final in-loop filtering strength
196*b2055c35SXin Li   int max_edge_;   // max edge delta (for filtering strength)
197*b2055c35SXin Li   int min_disto_;  // minimum distortion required to trigger filtering record
198*b2055c35SXin Li   // reactivities
199*b2055c35SXin Li   int lambda_i16_, lambda_i4_, lambda_uv_;
200*b2055c35SXin Li   int lambda_mode_, lambda_trellis_, tlambda_;
201*b2055c35SXin Li   int lambda_trellis_i16_, lambda_trellis_i4_, lambda_trellis_uv_;
202*b2055c35SXin Li 
203*b2055c35SXin Li   // lambda values for distortion-based evaluation
204*b2055c35SXin Li   score_t i4_penalty_;   // penalty for using Intra4
205*b2055c35SXin Li } VP8SegmentInfo;
206*b2055c35SXin Li 
// Diffusion errors, indexed as [u or v][top or left].
typedef int8_t DError[2 /* u/v */][2 /* top or left */];

209*b2055c35SXin Li // Handy transient struct to accumulate score and info during RD-optimization
210*b2055c35SXin Li // and mode evaluation.
211*b2055c35SXin Li typedef struct {
212*b2055c35SXin Li   score_t D, SD;              // Distortion, spectral distortion
213*b2055c35SXin Li   score_t H, R, score;        // header bits, rate, score.
214*b2055c35SXin Li   int16_t y_dc_levels[16];    // Quantized levels for luma-DC, luma-AC, chroma.
215*b2055c35SXin Li   int16_t y_ac_levels[16][16];
216*b2055c35SXin Li   int16_t uv_levels[4 + 4][16];
217*b2055c35SXin Li   int mode_i16;               // mode number for intra16 prediction
218*b2055c35SXin Li   uint8_t modes_i4[16];       // mode numbers for intra4 predictions
219*b2055c35SXin Li   int mode_uv;                // mode number of chroma prediction
220*b2055c35SXin Li   uint32_t nz;                // non-zero blocks
221*b2055c35SXin Li   int8_t derr[2][3];          // DC diffusion errors for U/V for blocks #1/2/3
222*b2055c35SXin Li } VP8ModeScore;
223*b2055c35SXin Li 
224*b2055c35SXin Li // Iterator structure to iterate through macroblocks, pointing to the
225*b2055c35SXin Li // right neighbouring data (samples, predictions, contexts, ...)
226*b2055c35SXin Li typedef struct {
227*b2055c35SXin Li   int x_, y_;                      // current macroblock
228*b2055c35SXin Li   uint8_t*      yuv_in_;           // input samples
229*b2055c35SXin Li   uint8_t*      yuv_out_;          // output samples
230*b2055c35SXin Li   uint8_t*      yuv_out2_;         // secondary buffer swapped with yuv_out_.
231*b2055c35SXin Li   uint8_t*      yuv_p_;            // scratch buffer for prediction
232*b2055c35SXin Li   VP8Encoder*   enc_;              // back-pointer
233*b2055c35SXin Li   VP8MBInfo*    mb_;               // current macroblock
234*b2055c35SXin Li   VP8BitWriter* bw_;               // current bit-writer
235*b2055c35SXin Li   uint8_t*      preds_;            // intra mode predictors (4x4 blocks)
236*b2055c35SXin Li   uint32_t*     nz_;               // non-zero pattern
237*b2055c35SXin Li   uint8_t       i4_boundary_[37];  // 32+5 boundary samples needed by intra4x4
238*b2055c35SXin Li   uint8_t*      i4_top_;           // pointer to the current top boundary sample
239*b2055c35SXin Li   int           i4_;               // current intra4x4 mode being tested
240*b2055c35SXin Li   int           top_nz_[9];        // top-non-zero context.
241*b2055c35SXin Li   int           left_nz_[9];       // left-non-zero. left_nz[8] is independent.
242*b2055c35SXin Li   uint64_t      bit_count_[4][3];  // bit counters for coded levels.
243*b2055c35SXin Li   uint64_t      luma_bits_;        // macroblock bit-cost for luma
244*b2055c35SXin Li   uint64_t      uv_bits_;          // macroblock bit-cost for chroma
245*b2055c35SXin Li   LFStats*      lf_stats_;         // filter stats (borrowed from enc_)
246*b2055c35SXin Li   int           do_trellis_;       // if true, perform extra level optimisation
247*b2055c35SXin Li   int           count_down_;       // number of mb still to be processed
248*b2055c35SXin Li   int           count_down0_;      // starting counter value (for progress)
249*b2055c35SXin Li   int           percent0_;         // saved initial progress percent
250*b2055c35SXin Li 
251*b2055c35SXin Li   DError        left_derr_;        // left error diffusion (u/v)
252*b2055c35SXin Li   DError*       top_derr_;         // top diffusion error - NULL if disabled
253*b2055c35SXin Li 
254*b2055c35SXin Li   uint8_t* y_left_;    // left luma samples (addressable from index -1 to 15).
255*b2055c35SXin Li   uint8_t* u_left_;    // left u samples (addressable from index -1 to 7)
256*b2055c35SXin Li   uint8_t* v_left_;    // left v samples (addressable from index -1 to 7)
257*b2055c35SXin Li 
258*b2055c35SXin Li   uint8_t* y_top_;     // top luma samples at position 'x_'
259*b2055c35SXin Li   uint8_t* uv_top_;    // top u/v samples at position 'x_', packed as 16 bytes
260*b2055c35SXin Li 
261*b2055c35SXin Li   // memory for storing y/u/v_left_
262*b2055c35SXin Li   uint8_t yuv_left_mem_[17 + 16 + 16 + 8 + WEBP_ALIGN_CST];
263*b2055c35SXin Li   // memory for yuv_*
264*b2055c35SXin Li   uint8_t yuv_mem_[3 * YUV_SIZE_ENC + PRED_SIZE_ENC + WEBP_ALIGN_CST];
265*b2055c35SXin Li } VP8EncIterator;
266*b2055c35SXin Li 
267*b2055c35SXin Li   // in iterator.c
268*b2055c35SXin Li // must be called first
269*b2055c35SXin Li void VP8IteratorInit(VP8Encoder* const enc, VP8EncIterator* const it);
270*b2055c35SXin Li // restart a scan
271*b2055c35SXin Li void VP8IteratorReset(VP8EncIterator* const it);
272*b2055c35SXin Li // reset iterator position to row 'y'
273*b2055c35SXin Li void VP8IteratorSetRow(VP8EncIterator* const it, int y);
274*b2055c35SXin Li // set count down (=number of iterations to go)
275*b2055c35SXin Li void VP8IteratorSetCountDown(VP8EncIterator* const it, int count_down);
276*b2055c35SXin Li // return true if iteration is finished
277*b2055c35SXin Li int VP8IteratorIsDone(const VP8EncIterator* const it);
278*b2055c35SXin Li // Import uncompressed samples from source.
279*b2055c35SXin Li // If tmp_32 is not NULL, import boundary samples too.
280*b2055c35SXin Li // tmp_32 is a 32-bytes scratch buffer that must be aligned in memory.
281*b2055c35SXin Li void VP8IteratorImport(VP8EncIterator* const it, uint8_t* const tmp_32);
282*b2055c35SXin Li // export decimated samples
283*b2055c35SXin Li void VP8IteratorExport(const VP8EncIterator* const it);
284*b2055c35SXin Li // go to next macroblock. Returns false if not finished.
285*b2055c35SXin Li int VP8IteratorNext(VP8EncIterator* const it);
286*b2055c35SXin Li // save the yuv_out_ boundary values to top_/left_ arrays for next iterations.
287*b2055c35SXin Li void VP8IteratorSaveBoundary(VP8EncIterator* const it);
288*b2055c35SXin Li // Report progression based on macroblock rows. Return 0 for user-abort request.
289*b2055c35SXin Li int VP8IteratorProgress(const VP8EncIterator* const it, int delta);
290*b2055c35SXin Li // Intra4x4 iterations
291*b2055c35SXin Li void VP8IteratorStartI4(VP8EncIterator* const it);
292*b2055c35SXin Li // returns true if not done.
293*b2055c35SXin Li int VP8IteratorRotateI4(VP8EncIterator* const it,
294*b2055c35SXin Li                         const uint8_t* const yuv_out);
295*b2055c35SXin Li 
296*b2055c35SXin Li // Non-zero context setup/teardown
297*b2055c35SXin Li void VP8IteratorNzToBytes(VP8EncIterator* const it);
298*b2055c35SXin Li void VP8IteratorBytesToNz(VP8EncIterator* const it);
299*b2055c35SXin Li 
300*b2055c35SXin Li // Helper functions to set mode properties
301*b2055c35SXin Li void VP8SetIntra16Mode(const VP8EncIterator* const it, int mode);
302*b2055c35SXin Li void VP8SetIntra4Mode(const VP8EncIterator* const it, const uint8_t* modes);
303*b2055c35SXin Li void VP8SetIntraUVMode(const VP8EncIterator* const it, int mode);
304*b2055c35SXin Li void VP8SetSkip(const VP8EncIterator* const it, int skip);
305*b2055c35SXin Li void VP8SetSegment(const VP8EncIterator* const it, int segment);
306*b2055c35SXin Li 
//------------------------------------------------------------------------------
// Paginated token buffer

typedef struct VP8Tokens VP8Tokens;  // struct details in token.c

// Token buffer handle. When DISABLE_TOKEN_BUFFER is defined, only the
// error flag remains.
typedef struct {
#if !defined(DISABLE_TOKEN_BUFFER)
  VP8Tokens* pages_;        // first page
  VP8Tokens** last_page_;   // last page
  uint16_t* tokens_;        // set to (*last_page_)->tokens_
  int left_;                // how many free tokens left before the page is full
  int page_size_;           // number of tokens per page
#endif
  int error_;         // true in case of malloc error
} VP8TBuffer;

323*b2055c35SXin Li // initialize an empty buffer
324*b2055c35SXin Li void VP8TBufferInit(VP8TBuffer* const b, int page_size);
325*b2055c35SXin Li void VP8TBufferClear(VP8TBuffer* const b);   // de-allocate pages memory
326*b2055c35SXin Li 
327*b2055c35SXin Li #if !defined(DISABLE_TOKEN_BUFFER)
328*b2055c35SXin Li 
329*b2055c35SXin Li // Finalizes bitstream when probabilities are known.
330*b2055c35SXin Li // Deletes the allocated token memory if final_pass is true.
331*b2055c35SXin Li int VP8EmitTokens(VP8TBuffer* const b, VP8BitWriter* const bw,
332*b2055c35SXin Li                   const uint8_t* const probas, int final_pass);
333*b2055c35SXin Li 
334*b2055c35SXin Li // record the coding of coefficients without knowing the probabilities yet
335*b2055c35SXin Li int VP8RecordCoeffTokens(int ctx, const struct VP8Residual* const res,
336*b2055c35SXin Li                          VP8TBuffer* const tokens);
337*b2055c35SXin Li 
338*b2055c35SXin Li // Estimate the final coded size given a set of 'probas'.
339*b2055c35SXin Li size_t VP8EstimateTokenSize(VP8TBuffer* const b, const uint8_t* const probas);
340*b2055c35SXin Li 
341*b2055c35SXin Li #endif  // !DISABLE_TOKEN_BUFFER
342*b2055c35SXin Li 
343*b2055c35SXin Li //------------------------------------------------------------------------------
344*b2055c35SXin Li // VP8Encoder
345*b2055c35SXin Li 
346*b2055c35SXin Li struct VP8Encoder {
347*b2055c35SXin Li   const WebPConfig* config_;    // user configuration and parameters
348*b2055c35SXin Li   WebPPicture* pic_;            // input / output picture
349*b2055c35SXin Li 
350*b2055c35SXin Li   // headers
351*b2055c35SXin Li   VP8EncFilterHeader   filter_hdr_;     // filtering information
352*b2055c35SXin Li   VP8EncSegmentHeader  segment_hdr_;    // segment information
353*b2055c35SXin Li 
354*b2055c35SXin Li   int profile_;                      // VP8's profile, deduced from Config.
355*b2055c35SXin Li 
356*b2055c35SXin Li   // dimension, in macroblock units.
357*b2055c35SXin Li   int mb_w_, mb_h_;
358*b2055c35SXin Li   int preds_w_;   // stride of the *preds_ prediction plane (=4*mb_w + 1)
359*b2055c35SXin Li 
360*b2055c35SXin Li   // number of partitions (1, 2, 4 or 8 = MAX_NUM_PARTITIONS)
361*b2055c35SXin Li   int num_parts_;
362*b2055c35SXin Li 
363*b2055c35SXin Li   // per-partition boolean decoders.
364*b2055c35SXin Li   VP8BitWriter bw_;                         // part0
365*b2055c35SXin Li   VP8BitWriter parts_[MAX_NUM_PARTITIONS];  // token partitions
366*b2055c35SXin Li   VP8TBuffer tokens_;                       // token buffer
367*b2055c35SXin Li 
368*b2055c35SXin Li   int percent_;                             // for progress
369*b2055c35SXin Li 
370*b2055c35SXin Li   // transparency blob
371*b2055c35SXin Li   int has_alpha_;
372*b2055c35SXin Li   uint8_t* alpha_data_;       // non-NULL if transparency is present
373*b2055c35SXin Li   uint32_t alpha_data_size_;
374*b2055c35SXin Li   WebPWorker alpha_worker_;
375*b2055c35SXin Li 
376*b2055c35SXin Li   // quantization info (one set of DC/AC dequant factor per segment)
377*b2055c35SXin Li   VP8SegmentInfo dqm_[NUM_MB_SEGMENTS];
378*b2055c35SXin Li   int base_quant_;                 // nominal quantizer value. Only used
379*b2055c35SXin Li                                    // for relative coding of segments' quant.
380*b2055c35SXin Li   int alpha_;                      // global susceptibility (<=> complexity)
381*b2055c35SXin Li   int uv_alpha_;                   // U/V quantization susceptibility
382*b2055c35SXin Li   // global offset of quantizers, shared by all segments
383*b2055c35SXin Li   int dq_y1_dc_;
384*b2055c35SXin Li   int dq_y2_dc_, dq_y2_ac_;
385*b2055c35SXin Li   int dq_uv_dc_, dq_uv_ac_;
386*b2055c35SXin Li 
387*b2055c35SXin Li   // probabilities and statistics
388*b2055c35SXin Li   VP8EncProba proba_;
389*b2055c35SXin Li   uint64_t    sse_[4];      // sum of Y/U/V/A squared errors for all macroblocks
390*b2055c35SXin Li   uint64_t    sse_count_;   // pixel count for the sse_[] stats
391*b2055c35SXin Li   int         coded_size_;
392*b2055c35SXin Li   int         residual_bytes_[3][4];
393*b2055c35SXin Li   int         block_count_[3];
394*b2055c35SXin Li 
395*b2055c35SXin Li   // quality/speed settings
396*b2055c35SXin Li   int method_;               // 0=fastest, 6=best/slowest.
397*b2055c35SXin Li   VP8RDLevel rd_opt_level_;  // Deduced from method_.
398*b2055c35SXin Li   int max_i4_header_bits_;   // partition #0 safeness factor
399*b2055c35SXin Li   int mb_header_limit_;      // rough limit for header bits per MB
400*b2055c35SXin Li   int thread_level_;         // derived from config->thread_level
401*b2055c35SXin Li   int do_search_;            // derived from config->target_XXX
402*b2055c35SXin Li   int use_tokens_;           // if true, use token buffer
403*b2055c35SXin Li 
404*b2055c35SXin Li   // Memory
405*b2055c35SXin Li   VP8MBInfo* mb_info_;   // contextual macroblock infos (mb_w_ + 1)
406*b2055c35SXin Li   uint8_t*   preds_;     // predictions modes: (4*mb_w+1) * (4*mb_h+1)
407*b2055c35SXin Li   uint32_t*  nz_;        // non-zero bit context: mb_w+1
408*b2055c35SXin Li   uint8_t*   y_top_;     // top luma samples.
409*b2055c35SXin Li   uint8_t*   uv_top_;    // top u/v samples.
410*b2055c35SXin Li                          // U and V are packed into 16 bytes (8 U + 8 V)
411*b2055c35SXin Li   LFStats*   lf_stats_;  // autofilter stats (if NULL, autofilter is off)
412*b2055c35SXin Li   DError*    top_derr_;  // diffusion error (NULL if disabled)
413*b2055c35SXin Li };
414*b2055c35SXin Li 
415*b2055c35SXin Li //------------------------------------------------------------------------------
416*b2055c35SXin Li // internal functions. Not public.
417*b2055c35SXin Li 
418*b2055c35SXin Li   // in tree.c
419*b2055c35SXin Li extern const uint8_t VP8CoeffsProba0[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
420*b2055c35SXin Li extern const uint8_t
421*b2055c35SXin Li     VP8CoeffsUpdateProba[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
422*b2055c35SXin Li // Reset the token probabilities to their initial (default) values
423*b2055c35SXin Li void VP8DefaultProbas(VP8Encoder* const enc);
424*b2055c35SXin Li // Write the token probabilities
425*b2055c35SXin Li void VP8WriteProbas(VP8BitWriter* const bw, const VP8EncProba* const probas);
426*b2055c35SXin Li // Writes the partition #0 modes (that is: all intra modes)
427*b2055c35SXin Li void VP8CodeIntraModes(VP8Encoder* const enc);
428*b2055c35SXin Li 
429*b2055c35SXin Li   // in syntax.c
430*b2055c35SXin Li // Generates the final bitstream by coding the partition0 and headers,
431*b2055c35SXin Li // and appending an assembly of all the pre-coded token partitions.
432*b2055c35SXin Li // Return true if everything is ok.
433*b2055c35SXin Li int VP8EncWrite(VP8Encoder* const enc);
434*b2055c35SXin Li // Release memory allocated for bit-writing in VP8EncLoop & seq.
435*b2055c35SXin Li void VP8EncFreeBitWriters(VP8Encoder* const enc);
436*b2055c35SXin Li 
437*b2055c35SXin Li   // in frame.c
438*b2055c35SXin Li extern const uint8_t VP8Cat3[];
439*b2055c35SXin Li extern const uint8_t VP8Cat4[];
440*b2055c35SXin Li extern const uint8_t VP8Cat5[];
441*b2055c35SXin Li extern const uint8_t VP8Cat6[];
442*b2055c35SXin Li 
443*b2055c35SXin Li // Form all the four Intra16x16 predictions in the yuv_p_ cache
444*b2055c35SXin Li void VP8MakeLuma16Preds(const VP8EncIterator* const it);
445*b2055c35SXin Li // Form all the four Chroma8x8 predictions in the yuv_p_ cache
446*b2055c35SXin Li void VP8MakeChroma8Preds(const VP8EncIterator* const it);
447*b2055c35SXin Li // Form all the ten Intra4x4 predictions in the yuv_p_ cache
448*b2055c35SXin Li // for the 4x4 block it->i4_
449*b2055c35SXin Li void VP8MakeIntra4Preds(const VP8EncIterator* const it);
450*b2055c35SXin Li // Rate calculation
451*b2055c35SXin Li int VP8GetCostLuma16(VP8EncIterator* const it, const VP8ModeScore* const rd);
452*b2055c35SXin Li int VP8GetCostLuma4(VP8EncIterator* const it, const int16_t levels[16]);
453*b2055c35SXin Li int VP8GetCostUV(VP8EncIterator* const it, const VP8ModeScore* const rd);
454*b2055c35SXin Li // Main coding calls
455*b2055c35SXin Li int VP8EncLoop(VP8Encoder* const enc);
456*b2055c35SXin Li int VP8EncTokenLoop(VP8Encoder* const enc);
457*b2055c35SXin Li 
458*b2055c35SXin Li   // in webpenc.c
459*b2055c35SXin Li // Assign an error code to a picture. Return false for convenience.
460*b2055c35SXin Li int WebPEncodingSetError(const WebPPicture* const pic, WebPEncodingError error);
461*b2055c35SXin Li int WebPReportProgress(const WebPPicture* const pic,
462*b2055c35SXin Li                        int percent, int* const percent_store);
463*b2055c35SXin Li 
464*b2055c35SXin Li   // in analysis.c
465*b2055c35SXin Li // Main analysis loop. Decides the segmentations and complexity.
466*b2055c35SXin Li // Assigns a first guess for Intra16 and uvmode_ prediction modes.
467*b2055c35SXin Li int VP8EncAnalyze(VP8Encoder* const enc);
468*b2055c35SXin Li 
469*b2055c35SXin Li   // in quant.c
470*b2055c35SXin Li // Sets up segment's quantization values, base_quant_ and filter strengths.
471*b2055c35SXin Li void VP8SetSegmentParams(VP8Encoder* const enc, float quality);
472*b2055c35SXin Li // Pick best modes and fills the levels. Returns true if skipped.
473*b2055c35SXin Li int VP8Decimate(VP8EncIterator* WEBP_RESTRICT const it,
474*b2055c35SXin Li                 VP8ModeScore* WEBP_RESTRICT const rd,
475*b2055c35SXin Li                 VP8RDLevel rd_opt);
476*b2055c35SXin Li 
477*b2055c35SXin Li   // in alpha.c
478*b2055c35SXin Li void VP8EncInitAlpha(VP8Encoder* const enc);    // initialize alpha compression
479*b2055c35SXin Li int VP8EncStartAlpha(VP8Encoder* const enc);    // start alpha coding process
480*b2055c35SXin Li int VP8EncFinishAlpha(VP8Encoder* const enc);   // finalize compressed data
481*b2055c35SXin Li int VP8EncDeleteAlpha(VP8Encoder* const enc);   // delete compressed data
482*b2055c35SXin Li 
483*b2055c35SXin Li // autofilter
484*b2055c35SXin Li void VP8InitFilter(VP8EncIterator* const it);
485*b2055c35SXin Li void VP8StoreFilterStats(VP8EncIterator* const it);
486*b2055c35SXin Li void VP8AdjustFilterStrength(VP8EncIterator* const it);
487*b2055c35SXin Li 
488*b2055c35SXin Li // returns the approximate filtering strength needed to smooth a edge
489*b2055c35SXin Li // step of 'delta', given a sharpness parameter 'sharpness'.
490*b2055c35SXin Li int VP8FilterStrengthFromDelta(int sharpness, int delta);
491*b2055c35SXin Li 
492*b2055c35SXin Li   // misc utils for picture_*.c:
493*b2055c35SXin Li 
494*b2055c35SXin Li // Returns true if 'picture' is non-NULL and dimensions/colorspace are within
495*b2055c35SXin Li // their valid ranges. If returning false, the 'error_code' in 'picture' is
496*b2055c35SXin Li // updated.
497*b2055c35SXin Li int WebPValidatePicture(const WebPPicture* const picture);
498*b2055c35SXin Li 
499*b2055c35SXin Li // Remove reference to the ARGB/YUVA buffer (doesn't free anything).
500*b2055c35SXin Li void WebPPictureResetBuffers(WebPPicture* const picture);
501*b2055c35SXin Li 
502*b2055c35SXin Li // Allocates ARGB buffer according to set width/height (previous one is
503*b2055c35SXin Li // always free'd). Preserves the YUV(A) buffer. Returns false in case of error
504*b2055c35SXin Li // (invalid param, out-of-memory).
505*b2055c35SXin Li int WebPPictureAllocARGB(WebPPicture* const picture);
506*b2055c35SXin Li 
507*b2055c35SXin Li // Allocates YUVA buffer according to set width/height (previous one is always
508*b2055c35SXin Li // free'd). Uses picture->csp to determine whether an alpha buffer is needed.
509*b2055c35SXin Li // Preserves the ARGB buffer.
510*b2055c35SXin Li // Returns false in case of error (invalid param, out-of-memory).
511*b2055c35SXin Li int WebPPictureAllocYUVA(WebPPicture* const picture);
512*b2055c35SXin Li 
513*b2055c35SXin Li // Replace samples that are fully transparent by 'color' to help compressibility
514*b2055c35SXin Li // (no guarantee, though). Assumes pic->use_argb is true.
515*b2055c35SXin Li void WebPReplaceTransparentPixels(WebPPicture* const pic, uint32_t color);
516*b2055c35SXin Li 
//------------------------------------------------------------------------------

#ifdef __cplusplus
}    // extern "C"
#endif

#endif  // WEBP_ENC_VP8I_ENC_H_