1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // WebP encoder: internal header.
11*b2055c35SXin Li //
12*b2055c35SXin Li // Author: Skal ([email protected])
13*b2055c35SXin Li
14*b2055c35SXin Li #ifndef WEBP_ENC_VP8I_ENC_H_
15*b2055c35SXin Li #define WEBP_ENC_VP8I_ENC_H_
16*b2055c35SXin Li
17*b2055c35SXin Li #include <string.h> // for memcpy()
18*b2055c35SXin Li #include "src/dec/common_dec.h"
19*b2055c35SXin Li #include "src/dsp/dsp.h"
20*b2055c35SXin Li #include "src/utils/bit_writer_utils.h"
21*b2055c35SXin Li #include "src/utils/thread_utils.h"
22*b2055c35SXin Li #include "src/utils/utils.h"
23*b2055c35SXin Li #include "src/webp/encode.h"
24*b2055c35SXin Li
25*b2055c35SXin Li #ifdef __cplusplus
26*b2055c35SXin Li extern "C" {
27*b2055c35SXin Li #endif
28*b2055c35SXin Li
29*b2055c35SXin Li //------------------------------------------------------------------------------
30*b2055c35SXin Li // Various defines and enums
31*b2055c35SXin Li
// Encoder version numbers (major / minor / revision components, going by
// the macro names).
#define ENC_MAJ_VERSION 1
#define ENC_MIN_VERSION 4
#define ENC_REV_VERSION 0
36*b2055c35SXin Li
// Global limits shared by the encoder.
enum {
  MAX_LF_LEVELS = 64,       // Maximum loop filter level
  MAX_VARIABLE_LEVEL = 67,  // last (inclusive) level with variable cost
  MAX_LEVEL = 2047          // max level (note: max codable is 2047 + 67)
};
41*b2055c35SXin Li
// Rate-distortion optimization levels.
// Enumerators are numbered consecutively starting at 0.
typedef enum {
  RD_OPT_NONE = 0,    // (0) no rd-opt
  RD_OPT_BASIC,       // (1) basic scoring (no trellis)
  RD_OPT_TRELLIS,     // (2) perform trellis-quant on the final decision only
  RD_OPT_TRELLIS_ALL  // (3) trellis-quant for every scoring (much slower)
} VP8RDLevel;
48*b2055c35SXin Li
49*b2055c35SXin Li // YUV-cache parameters. Cache is 32-bytes wide (= one cacheline).
50*b2055c35SXin Li // The original or reconstructed samples can be accessed using VP8Scan[].
51*b2055c35SXin Li // The predicted blocks can be accessed using offsets to yuv_p_ and
52*b2055c35SXin Li // the arrays VP8*ModeOffsets[].
53*b2055c35SXin Li // * YUV Samples area (yuv_in_/yuv_out_/yuv_out2_)
54*b2055c35SXin Li // (see VP8Scan[] for accessing the blocks, along with
55*b2055c35SXin Li // Y_OFF_ENC/U_OFF_ENC/V_OFF_ENC):
56*b2055c35SXin Li // +----+----+
57*b2055c35SXin Li // Y_OFF_ENC |YYYY|UUVV|
58*b2055c35SXin Li // U_OFF_ENC |YYYY|UUVV|
59*b2055c35SXin Li // V_OFF_ENC |YYYY|....| <- 25% wasted U/V area
60*b2055c35SXin Li // |YYYY|....|
61*b2055c35SXin Li // +----+----+
62*b2055c35SXin Li // * Prediction area ('yuv_p_', size = PRED_SIZE_ENC)
63*b2055c35SXin Li // Intra16 predictions (16x16 block each, two per row):
64*b2055c35SXin Li // |I16DC16|I16TM16|
65*b2055c35SXin Li // |I16VE16|I16HE16|
66*b2055c35SXin Li // Chroma U/V predictions (16x8 block each, two per row):
67*b2055c35SXin Li // |C8DC8|C8TM8|
68*b2055c35SXin Li // |C8VE8|C8HE8|
69*b2055c35SXin Li // Intra 4x4 predictions (4x4 block each)
70*b2055c35SXin Li // |I4DC4 I4TM4 I4VE4 I4HE4|I4RD4 I4VR4 I4LD4 I4VL4|
71*b2055c35SXin Li // |I4HD4 I4HU4 I4TMP .....|.......................| <- ~31% wasted
// Size of one YUV samples area: 16 rows of BPS bytes.
#define YUV_SIZE_ENC (16 * BPS)
// Size of the prediction area: 32 rows for the Intra16 predictions, 16 rows
// for the chroma predictions and 8 rows for the Intra4 predictions.
#define PRED_SIZE_ENC ((32 + 16 + 8) * BPS)
// Column offsets of the Y, U and V samples within a cache row.
#define Y_OFF_ENC 0
#define U_OFF_ENC 16
#define V_OFF_ENC (U_OFF_ENC + 8)
77*b2055c35SXin Li
// Lookup tables used to address the YUV cache; they are only declared here.
// VP8Scan[] is used to access the original or reconstructed sample blocks.
// The VP8*ModeOffsets[] arrays are used, together with offsets into yuv_p_,
// to access the predicted blocks of each prediction mode.
extern const uint16_t VP8Scan[16];
extern const uint16_t VP8UVModeOffsets[4];
extern const uint16_t VP8I16ModeOffsets[4];
extern const uint16_t VP8I4ModeOffsets[NUM_BMODES];
82*b2055c35SXin Li
// Layout of the prediction blocks inside the prediction area.
// Each offset is written as "first row of the group * BPS + column".

// Intra 16x16: rows [0, 32), two 16-pixel-wide blocks per row.
#define I16DC16 (0 * BPS)
#define I16TM16 (I16DC16 + 16)
#define I16VE16 (16 * BPS)
#define I16HE16 (I16VE16 + 16)

// Chroma 8x8: rows [32, 48). The U and V blocks sit side by side, hence each
// prediction is 16 pixels wide and 8 rows high.
#define C8DC8 (32 * BPS)
#define C8TM8 (C8DC8 + 16)
#define C8VE8 (C8DC8 + 8 * BPS)
#define C8HE8 (C8VE8 + 16)

// Intra 4x4: rows [48, 56), 4-pixel-wide blocks, eight per row.
#define I4DC4 (48 * BPS)
#define I4TM4 (I4DC4 + 4)
#define I4VE4 (I4DC4 + 8)
#define I4HE4 (I4DC4 + 12)
#define I4RD4 (I4DC4 + 16)
#define I4VR4 (I4DC4 + 20)
#define I4LD4 (I4DC4 + 24)
#define I4VL4 (I4DC4 + 28)
#define I4HD4 (I4DC4 + 4 * BPS)
#define I4HU4 (I4HD4 + 4)
#define I4TMP (I4HD4 + 8)
106*b2055c35SXin Li
// Type used for scores, rate and distortion.
typedef int64_t score_t;
// MAX_COST is 2^55 - 1 (0x7fffffffffffff). It is deliberately not the
// maximum value score_t can hold, in order to allow overflowing computations.
#define MAX_COST ((score_t)((1LL << 55) - 1))
111*b2055c35SXin Li
// Number of fractional bits of the fixed-point arithmetic used by QUANTDIV().
#define QFIX 17
// Rescales the bias 'b' by shifting it left by (QFIX - 8) bits.
#define BIAS(b) ((b) << (QFIX - 8))

// Fixed-point division: returns (n * iQ + B) >> QFIX.
// The sum is evaluated in unsigned 32-bit arithmetic, so it wraps modulo 2^32.
// Fun fact: this is the _only_ line where we're actually being lossy and
// discarding bits.
static WEBP_INLINE int QUANTDIV(uint32_t n, uint32_t iQ, uint32_t B) {
  const uint32_t biased_product = n * iQ + B;
  return (int)(biased_product >> QFIX);
}
119*b2055c35SXin Li
// Uncomment the following to remove token-buffer code:
// #define DISABLE_TOKEN_BUFFER

// Quality threshold: error-diffusion is enabled for quality values below it.
#define ERROR_DIFFUSION_QUALITY 98
125*b2055c35SXin Li
126*b2055c35SXin Li //------------------------------------------------------------------------------
127*b2055c35SXin Li // Headers
128*b2055c35SXin Li
// Two 16-bit quantities packed in one 32-bit word ("16b + 16b").
typedef uint32_t proba_t;
// Per-context table of probabilities.
typedef uint8_t ProbaArray[NUM_CTX][NUM_PROBAS];
// Per-context table of statistics, with the same shape as ProbaArray.
typedef proba_t StatsArray[NUM_CTX][NUM_PROBAS];
// Per-context table of costs, one entry per level in [0, MAX_VARIABLE_LEVEL].
typedef uint16_t CostArray[NUM_CTX][MAX_VARIABLE_LEVEL + 1];
// Pointer to an array of NUM_CTX cost-table pointers (for easy casting).
typedef const uint16_t* (*CostArrayPtr)[NUM_CTX];
// 16 x NUM_CTX map of pointers to cost tables.
typedef const uint16_t* CostArrayMap[16][NUM_CTX];
// Filter stats, indexed by segment and then by loop-filter level.
typedef double LFStats[NUM_MB_SEGMENTS][MAX_LF_LEVELS];

// Forward declaration; the structure itself is defined further down.
typedef struct VP8Encoder VP8Encoder;
138*b2055c35SXin Li
// Segment features: describes how segmentation is used for the frame.
typedef struct {
  int num_segments_;  // Actual number of segments. 1 segment only = unused.
  int update_map_;    // Whether to update the segment map or not.
                      // Must be 0 if there's only 1 segment.
  int size_;          // Bit-cost for transmitting the segment map.
} VP8EncSegmentHeader;
146*b2055c35SXin Li
// Struct collecting all frame-persistent probabilities, along with the
// statistics and cost tables associated with them.
typedef struct {
  uint8_t segments_[3];     // probabilities for segment tree
  uint8_t skip_proba_;      // final probability of being skipped.
  ProbaArray coeffs_[NUM_TYPES][NUM_BANDS];      // 1056 bytes
  StatsArray stats_[NUM_TYPES][NUM_BANDS];       // 4224 bytes
  CostArray level_cost_[NUM_TYPES][NUM_BANDS];   // 13056 bytes
  CostArrayMap remapped_costs_[NUM_TYPES];       // 1536 bytes
  int dirty_;               // if true, need to call VP8CalculateLevelCosts()
  int use_skip_proba_;      // Note: we always use skip_proba for now.
  int nb_skip_;             // number of skipped blocks
} VP8EncProba;
159*b2055c35SXin Li
// Filter parameters. Not actually used in the code (we don't perform
// the in-loop filtering), but filled from user's config.
typedef struct {
  int simple_;         // filtering type: 0=complex, 1=simple
  int level_;          // base filter level [0..63]
  int sharpness_;      // [0..7]
  int i4x4_lf_delta_;  // delta filter level for i4x4 relative to i16x16
} VP8EncFilterHeader;
168*b2055c35SXin Li
169*b2055c35SXin Li //------------------------------------------------------------------------------
// Information about the macroblocks.
171*b2055c35SXin Li
// Per-macroblock information: the coding decisions are packed into
// bit-fields, followed by one byte for the quantization susceptibility.
typedef struct {
  unsigned type_ : 2;     // block type: 0=i4x4, 1=i16x16
  unsigned uv_mode_ : 2;  // chroma mode (2 bits)
  unsigned skip_ : 1;     // skip flag (1 bit)
  unsigned segment_ : 2;  // segment (2 bits)
  uint8_t alpha_;         // quantization-susceptibility
} VP8MBInfo;
180*b2055c35SXin Li
// Quantization matrix: each array holds 16 entries.
typedef struct VP8Matrix {
  uint16_t q_[16];        // quantizer steps
  uint16_t iq_[16];       // reciprocals, fixed point.
  uint32_t bias_[16];     // rounding bias
  uint32_t zthresh_[16];  // value below which a coefficient is zeroed
  uint16_t sharpen_[16];  // frequency boosters for slight sharpening
} VP8Matrix;
188*b2055c35SXin Li
189*b2055c35SXin Li typedef struct {
190*b2055c35SXin Li VP8Matrix y1_, y2_, uv_; // quantization matrices
191*b2055c35SXin Li int alpha_; // quant-susceptibility, range [-127,127]. Zero is neutral.
192*b2055c35SXin Li // Lower values indicate a lower risk of blurriness.
193*b2055c35SXin Li int beta_; // filter-susceptibility, range [0,255].
194*b2055c35SXin Li int quant_; // final segment quantizer.
195*b2055c35SXin Li int fstrength_; // final in-loop filtering strength
196*b2055c35SXin Li int max_edge_; // max edge delta (for filtering strength)
197*b2055c35SXin Li int min_disto_; // minimum distortion required to trigger filtering record
198*b2055c35SXin Li // reactivities
199*b2055c35SXin Li int lambda_i16_, lambda_i4_, lambda_uv_;
200*b2055c35SXin Li int lambda_mode_, lambda_trellis_, tlambda_;
201*b2055c35SXin Li int lambda_trellis_i16_, lambda_trellis_i4_, lambda_trellis_uv_;
202*b2055c35SXin Li
203*b2055c35SXin Li // lambda values for distortion-based evaluation
204*b2055c35SXin Li score_t i4_penalty_; // penalty for using Intra4
205*b2055c35SXin Li } VP8SegmentInfo;
206*b2055c35SXin Li
// Diffusion errors: first index selects the plane (u/v), second index selects
// the neighbour (top or left).
typedef int8_t DError[2 /* u/v */][2 /* top or left */];
208*b2055c35SXin Li
209*b2055c35SXin Li // Handy transient struct to accumulate score and info during RD-optimization
210*b2055c35SXin Li // and mode evaluation.
211*b2055c35SXin Li typedef struct {
212*b2055c35SXin Li score_t D, SD; // Distortion, spectral distortion
213*b2055c35SXin Li score_t H, R, score; // header bits, rate, score.
214*b2055c35SXin Li int16_t y_dc_levels[16]; // Quantized levels for luma-DC, luma-AC, chroma.
215*b2055c35SXin Li int16_t y_ac_levels[16][16];
216*b2055c35SXin Li int16_t uv_levels[4 + 4][16];
217*b2055c35SXin Li int mode_i16; // mode number for intra16 prediction
218*b2055c35SXin Li uint8_t modes_i4[16]; // mode numbers for intra4 predictions
219*b2055c35SXin Li int mode_uv; // mode number of chroma prediction
220*b2055c35SXin Li uint32_t nz; // non-zero blocks
221*b2055c35SXin Li int8_t derr[2][3]; // DC diffusion errors for U/V for blocks #1/2/3
222*b2055c35SXin Li } VP8ModeScore;
223*b2055c35SXin Li
224*b2055c35SXin Li // Iterator structure to iterate through macroblocks, pointing to the
225*b2055c35SXin Li // right neighbouring data (samples, predictions, contexts, ...)
226*b2055c35SXin Li typedef struct {
227*b2055c35SXin Li int x_, y_; // current macroblock
228*b2055c35SXin Li uint8_t* yuv_in_; // input samples
229*b2055c35SXin Li uint8_t* yuv_out_; // output samples
230*b2055c35SXin Li uint8_t* yuv_out2_; // secondary buffer swapped with yuv_out_.
231*b2055c35SXin Li uint8_t* yuv_p_; // scratch buffer for prediction
232*b2055c35SXin Li VP8Encoder* enc_; // back-pointer
233*b2055c35SXin Li VP8MBInfo* mb_; // current macroblock
234*b2055c35SXin Li VP8BitWriter* bw_; // current bit-writer
235*b2055c35SXin Li uint8_t* preds_; // intra mode predictors (4x4 blocks)
236*b2055c35SXin Li uint32_t* nz_; // non-zero pattern
237*b2055c35SXin Li uint8_t i4_boundary_[37]; // 32+5 boundary samples needed by intra4x4
238*b2055c35SXin Li uint8_t* i4_top_; // pointer to the current top boundary sample
239*b2055c35SXin Li int i4_; // current intra4x4 mode being tested
240*b2055c35SXin Li int top_nz_[9]; // top-non-zero context.
241*b2055c35SXin Li int left_nz_[9]; // left-non-zero. left_nz[8] is independent.
242*b2055c35SXin Li uint64_t bit_count_[4][3]; // bit counters for coded levels.
243*b2055c35SXin Li uint64_t luma_bits_; // macroblock bit-cost for luma
244*b2055c35SXin Li uint64_t uv_bits_; // macroblock bit-cost for chroma
245*b2055c35SXin Li LFStats* lf_stats_; // filter stats (borrowed from enc_)
246*b2055c35SXin Li int do_trellis_; // if true, perform extra level optimisation
247*b2055c35SXin Li int count_down_; // number of mb still to be processed
248*b2055c35SXin Li int count_down0_; // starting counter value (for progress)
249*b2055c35SXin Li int percent0_; // saved initial progress percent
250*b2055c35SXin Li
251*b2055c35SXin Li DError left_derr_; // left error diffusion (u/v)
252*b2055c35SXin Li DError* top_derr_; // top diffusion error - NULL if disabled
253*b2055c35SXin Li
254*b2055c35SXin Li uint8_t* y_left_; // left luma samples (addressable from index -1 to 15).
255*b2055c35SXin Li uint8_t* u_left_; // left u samples (addressable from index -1 to 7)
256*b2055c35SXin Li uint8_t* v_left_; // left v samples (addressable from index -1 to 7)
257*b2055c35SXin Li
258*b2055c35SXin Li uint8_t* y_top_; // top luma samples at position 'x_'
259*b2055c35SXin Li uint8_t* uv_top_; // top u/v samples at position 'x_', packed as 16 bytes
260*b2055c35SXin Li
261*b2055c35SXin Li // memory for storing y/u/v_left_
262*b2055c35SXin Li uint8_t yuv_left_mem_[17 + 16 + 16 + 8 + WEBP_ALIGN_CST];
263*b2055c35SXin Li // memory for yuv_*
264*b2055c35SXin Li uint8_t yuv_mem_[3 * YUV_SIZE_ENC + PRED_SIZE_ENC + WEBP_ALIGN_CST];
265*b2055c35SXin Li } VP8EncIterator;
266*b2055c35SXin Li
// in iterator.c

// Initializes iterator 'it' for encoder 'enc'. Must be called first.
void VP8IteratorInit(VP8Encoder* const enc, VP8EncIterator* const it);
// Restarts a scan.
void VP8IteratorReset(VP8EncIterator* const it);
// Resets the iterator position to row 'y'.
void VP8IteratorSetRow(VP8EncIterator* const it, int y);
// Sets the count down (= number of iterations to go).
void VP8IteratorSetCountDown(VP8EncIterator* const it, int count_down);
// Returns true if the iteration is finished.
int VP8IteratorIsDone(const VP8EncIterator* const it);
// Imports uncompressed samples from source.
// If tmp_32 is not NULL, boundary samples are imported too.
// tmp_32 is a 32-byte scratch buffer that must be aligned in memory.
void VP8IteratorImport(VP8EncIterator* const it, uint8_t* const tmp_32);
// Exports decimated samples.
void VP8IteratorExport(const VP8EncIterator* const it);
// Goes to the next macroblock. Returns false if not finished.
// NOTE(review): the wording of the return value is ambiguous -- confirm
// against the implementation whether a zero return means the scan is over.
int VP8IteratorNext(VP8EncIterator* const it);
// Saves the yuv_out_ boundary values to top_/left_ arrays for next iterations.
void VP8IteratorSaveBoundary(VP8EncIterator* const it);
// Reports progression based on macroblock rows.
// Returns 0 for a user-abort request.
int VP8IteratorProgress(const VP8EncIterator* const it, int delta);
// Intra4x4 iterations: starts the iteration.
void VP8IteratorStartI4(VP8EncIterator* const it);
// Intra4x4 iterations: rotates to the next step. Returns true if not done.
int VP8IteratorRotateI4(VP8EncIterator* const it,
                        const uint8_t* const yuv_out);

// Non-zero context setup/teardown
void VP8IteratorNzToBytes(VP8EncIterator* const it);
void VP8IteratorBytesToNz(VP8EncIterator* const it);

// Helper functions to set mode properties (intra16 mode, intra4 modes,
// chroma mode, skip flag and segment, respectively).
void VP8SetIntra16Mode(const VP8EncIterator* const it, int mode);
void VP8SetIntra4Mode(const VP8EncIterator* const it, const uint8_t* modes);
void VP8SetIntraUVMode(const VP8EncIterator* const it, int mode);
void VP8SetSkip(const VP8EncIterator* const it, int skip);
void VP8SetSegment(const VP8EncIterator* const it, int segment);
306*b2055c35SXin Li
307*b2055c35SXin Li //------------------------------------------------------------------------------
308*b2055c35SXin Li // Paginated token buffer
309*b2055c35SXin Li
// One page of tokens. Opaque here: struct details are in token.c.
typedef struct VP8Tokens VP8Tokens;

// Paginated token buffer. When DISABLE_TOKEN_BUFFER is defined, only the
// error flag remains.
typedef struct {
#if !defined(DISABLE_TOKEN_BUFFER)
  VP8Tokens* pages_;        // first page
  VP8Tokens** last_page_;   // last page
  uint16_t* tokens_;        // set to (*last_page_)->tokens_
  int left_;                // how many free tokens left before the page is full
  int page_size_;           // number of tokens per page
#endif
  int error_;         // true in case of malloc error
} VP8TBuffer;
322*b2055c35SXin Li
323*b2055c35SXin Li // initialize an empty buffer
324*b2055c35SXin Li void VP8TBufferInit(VP8TBuffer* const b, int page_size);
325*b2055c35SXin Li void VP8TBufferClear(VP8TBuffer* const b); // de-allocate pages memory
326*b2055c35SXin Li
327*b2055c35SXin Li #if !defined(DISABLE_TOKEN_BUFFER)
328*b2055c35SXin Li
329*b2055c35SXin Li // Finalizes bitstream when probabilities are known.
330*b2055c35SXin Li // Deletes the allocated token memory if final_pass is true.
331*b2055c35SXin Li int VP8EmitTokens(VP8TBuffer* const b, VP8BitWriter* const bw,
332*b2055c35SXin Li const uint8_t* const probas, int final_pass);
333*b2055c35SXin Li
334*b2055c35SXin Li // record the coding of coefficients without knowing the probabilities yet
335*b2055c35SXin Li int VP8RecordCoeffTokens(int ctx, const struct VP8Residual* const res,
336*b2055c35SXin Li VP8TBuffer* const tokens);
337*b2055c35SXin Li
338*b2055c35SXin Li // Estimate the final coded size given a set of 'probas'.
339*b2055c35SXin Li size_t VP8EstimateTokenSize(VP8TBuffer* const b, const uint8_t* const probas);
340*b2055c35SXin Li
341*b2055c35SXin Li #endif // !DISABLE_TOKEN_BUFFER
342*b2055c35SXin Li
343*b2055c35SXin Li //------------------------------------------------------------------------------
344*b2055c35SXin Li // VP8Encoder
345*b2055c35SXin Li
346*b2055c35SXin Li struct VP8Encoder {
347*b2055c35SXin Li const WebPConfig* config_; // user configuration and parameters
348*b2055c35SXin Li WebPPicture* pic_; // input / output picture
349*b2055c35SXin Li
350*b2055c35SXin Li // headers
351*b2055c35SXin Li VP8EncFilterHeader filter_hdr_; // filtering information
352*b2055c35SXin Li VP8EncSegmentHeader segment_hdr_; // segment information
353*b2055c35SXin Li
354*b2055c35SXin Li int profile_; // VP8's profile, deduced from Config.
355*b2055c35SXin Li
356*b2055c35SXin Li // dimension, in macroblock units.
357*b2055c35SXin Li int mb_w_, mb_h_;
358*b2055c35SXin Li int preds_w_; // stride of the *preds_ prediction plane (=4*mb_w + 1)
359*b2055c35SXin Li
360*b2055c35SXin Li // number of partitions (1, 2, 4 or 8 = MAX_NUM_PARTITIONS)
361*b2055c35SXin Li int num_parts_;
362*b2055c35SXin Li
363*b2055c35SXin Li // per-partition boolean decoders.
364*b2055c35SXin Li VP8BitWriter bw_; // part0
365*b2055c35SXin Li VP8BitWriter parts_[MAX_NUM_PARTITIONS]; // token partitions
366*b2055c35SXin Li VP8TBuffer tokens_; // token buffer
367*b2055c35SXin Li
368*b2055c35SXin Li int percent_; // for progress
369*b2055c35SXin Li
370*b2055c35SXin Li // transparency blob
371*b2055c35SXin Li int has_alpha_;
372*b2055c35SXin Li uint8_t* alpha_data_; // non-NULL if transparency is present
373*b2055c35SXin Li uint32_t alpha_data_size_;
374*b2055c35SXin Li WebPWorker alpha_worker_;
375*b2055c35SXin Li
376*b2055c35SXin Li // quantization info (one set of DC/AC dequant factor per segment)
377*b2055c35SXin Li VP8SegmentInfo dqm_[NUM_MB_SEGMENTS];
378*b2055c35SXin Li int base_quant_; // nominal quantizer value. Only used
379*b2055c35SXin Li // for relative coding of segments' quant.
380*b2055c35SXin Li int alpha_; // global susceptibility (<=> complexity)
381*b2055c35SXin Li int uv_alpha_; // U/V quantization susceptibility
382*b2055c35SXin Li // global offset of quantizers, shared by all segments
383*b2055c35SXin Li int dq_y1_dc_;
384*b2055c35SXin Li int dq_y2_dc_, dq_y2_ac_;
385*b2055c35SXin Li int dq_uv_dc_, dq_uv_ac_;
386*b2055c35SXin Li
387*b2055c35SXin Li // probabilities and statistics
388*b2055c35SXin Li VP8EncProba proba_;
389*b2055c35SXin Li uint64_t sse_[4]; // sum of Y/U/V/A squared errors for all macroblocks
390*b2055c35SXin Li uint64_t sse_count_; // pixel count for the sse_[] stats
391*b2055c35SXin Li int coded_size_;
392*b2055c35SXin Li int residual_bytes_[3][4];
393*b2055c35SXin Li int block_count_[3];
394*b2055c35SXin Li
395*b2055c35SXin Li // quality/speed settings
396*b2055c35SXin Li int method_; // 0=fastest, 6=best/slowest.
397*b2055c35SXin Li VP8RDLevel rd_opt_level_; // Deduced from method_.
398*b2055c35SXin Li int max_i4_header_bits_; // partition #0 safeness factor
399*b2055c35SXin Li int mb_header_limit_; // rough limit for header bits per MB
400*b2055c35SXin Li int thread_level_; // derived from config->thread_level
401*b2055c35SXin Li int do_search_; // derived from config->target_XXX
402*b2055c35SXin Li int use_tokens_; // if true, use token buffer
403*b2055c35SXin Li
404*b2055c35SXin Li // Memory
405*b2055c35SXin Li VP8MBInfo* mb_info_; // contextual macroblock infos (mb_w_ + 1)
406*b2055c35SXin Li uint8_t* preds_; // predictions modes: (4*mb_w+1) * (4*mb_h+1)
407*b2055c35SXin Li uint32_t* nz_; // non-zero bit context: mb_w+1
408*b2055c35SXin Li uint8_t* y_top_; // top luma samples.
409*b2055c35SXin Li uint8_t* uv_top_; // top u/v samples.
410*b2055c35SXin Li // U and V are packed into 16 bytes (8 U + 8 V)
411*b2055c35SXin Li LFStats* lf_stats_; // autofilter stats (if NULL, autofilter is off)
412*b2055c35SXin Li DError* top_derr_; // diffusion error (NULL if disabled)
413*b2055c35SXin Li };
414*b2055c35SXin Li
415*b2055c35SXin Li //------------------------------------------------------------------------------
416*b2055c35SXin Li // internal functions. Not public.
417*b2055c35SXin Li
// in tree.c

// Constant tables indexed by [type][band][context][proba]. Going by their
// names, they hold the initial coefficient probabilities and the
// probabilities used when coding probability updates.
extern const uint8_t VP8CoeffsProba0[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
extern const uint8_t
    VP8CoeffsUpdateProba[NUM_TYPES][NUM_BANDS][NUM_CTX][NUM_PROBAS];
// Resets the token probabilities to their initial (default) values.
void VP8DefaultProbas(VP8Encoder* const enc);
// Writes the token probabilities 'probas' using bit-writer 'bw'.
void VP8WriteProbas(VP8BitWriter* const bw, const VP8EncProba* const probas);
// Writes the partition #0 modes (that is: all intra modes).
void VP8CodeIntraModes(VP8Encoder* const enc);

// in syntax.c

// Generates the final bitstream by coding the partition0 and headers,
// and appending an assembly of all the pre-coded token partitions.
// Returns true if everything is ok.
int VP8EncWrite(VP8Encoder* const enc);
// Releases the memory allocated for bit-writing in VP8EncLoop & seq.
void VP8EncFreeBitWriters(VP8Encoder* const enc);
436*b2055c35SXin Li
// in frame.c

// Byte tables declared with unspecified length; their contents are not
// visible from this header.
extern const uint8_t VP8Cat3[];
extern const uint8_t VP8Cat4[];
extern const uint8_t VP8Cat5[];
extern const uint8_t VP8Cat6[];

// Forms all the four Intra16x16 predictions in the yuv_p_ cache.
void VP8MakeLuma16Preds(const VP8EncIterator* const it);
// Forms all the four Chroma8x8 predictions in the yuv_p_ cache.
void VP8MakeChroma8Preds(const VP8EncIterator* const it);
// Forms all the ten Intra4x4 predictions in the yuv_p_ cache
// for the 4x4 block it->i4_.
void VP8MakeIntra4Preds(const VP8EncIterator* const it);
// Rate calculation, respectively for intra16 luma, one intra4 luma block
// (given its 16 levels) and chroma.
int VP8GetCostLuma16(VP8EncIterator* const it, const VP8ModeScore* const rd);
int VP8GetCostLuma4(VP8EncIterator* const it, const int16_t levels[16]);
int VP8GetCostUV(VP8EncIterator* const it, const VP8ModeScore* const rd);
// Main coding calls.
int VP8EncLoop(VP8Encoder* const enc);
int VP8EncTokenLoop(VP8Encoder* const enc);
457*b2055c35SXin Li
// in webpenc.c

// Assigns an error code to a picture. Returns false for convenience.
int WebPEncodingSetError(const WebPPicture* const pic, WebPEncodingError error);
// Progress reporting for 'pic', given the new 'percent' value and the
// location 'percent_store' of the stored one.
// NOTE(review): return value and update semantics are not visible from this
// header -- confirm against the implementation.
int WebPReportProgress(const WebPPicture* const pic,
                       int percent, int* const percent_store);

// in analysis.c

// Main analysis loop. Decides the segmentations and complexity.
// Assigns a first guess for Intra16 and uvmode_ prediction modes.
int VP8EncAnalyze(VP8Encoder* const enc);

// in quant.c

// Sets up segment's quantization values, base_quant_ and filter strengths.
void VP8SetSegmentParams(VP8Encoder* const enc, float quality);
// Picks the best modes and fills the levels. Returns true if skipped.
int VP8Decimate(VP8EncIterator* WEBP_RESTRICT const it,
                VP8ModeScore* WEBP_RESTRICT const rd,
                VP8RDLevel rd_opt);

// in alpha.c

void VP8EncInitAlpha(VP8Encoder* const enc);    // initialize alpha compression
int VP8EncStartAlpha(VP8Encoder* const enc);    // start alpha coding process
int VP8EncFinishAlpha(VP8Encoder* const enc);   // finalize compressed data
int VP8EncDeleteAlpha(VP8Encoder* const enc);   // delete compressed data

// autofilter

void VP8InitFilter(VP8EncIterator* const it);
void VP8StoreFilterStats(VP8EncIterator* const it);
void VP8AdjustFilterStrength(VP8EncIterator* const it);

// Returns the approximate filtering strength needed to smooth an edge
// step of 'delta', given a sharpness parameter 'sharpness'.
int VP8FilterStrengthFromDelta(int sharpness, int delta);
491*b2055c35SXin Li
// misc utils for picture_*.c:

// Returns true if 'picture' is non-NULL and dimensions/colorspace are within
// their valid ranges. If returning false, the 'error_code' in 'picture' is
// updated.
int WebPValidatePicture(const WebPPicture* const picture);

// Removes the references to the ARGB/YUVA buffer (doesn't free anything).
void WebPPictureResetBuffers(WebPPicture* const picture);

// Allocates the ARGB buffer according to the set width/height (the previous
// one is always free'd). Preserves the YUV(A) buffer.
// Returns false in case of error (invalid param, out-of-memory).
int WebPPictureAllocARGB(WebPPicture* const picture);

// Allocates the YUVA buffer according to the set width/height (the previous
// one is always free'd). Uses picture->csp to determine whether an alpha
// buffer is needed. Preserves the ARGB buffer.
// Returns false in case of error (invalid param, out-of-memory).
int WebPPictureAllocYUVA(WebPPicture* const picture);

// Replaces samples that are fully transparent by 'color' to help
// compressibility (no guarantee, though). Assumes pic->use_argb is true.
void WebPReplaceTransparentPixels(WebPPicture* const pic, uint32_t color);
516*b2055c35SXin Li
517*b2055c35SXin Li //------------------------------------------------------------------------------
518*b2055c35SXin Li
519*b2055c35SXin Li #ifdef __cplusplus
520*b2055c35SXin Li } // extern "C"
521*b2055c35SXin Li #endif
522*b2055c35SXin Li
523*b2055c35SXin Li #endif // WEBP_ENC_VP8I_ENC_H_
524