1*b2055c35SXin Li // Copyright 2011 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // Paginated token buffer
11*b2055c35SXin Li //
// A 'token' is a bit value associated with a probability that is either fixed
// or determined later, once statistics have been collected.
// For dynamic probabilities, we just record the slot id (idx) of the
// probability value in the final probability array (uint8_t* probas in
// VP8EmitTokens).
16*b2055c35SXin Li //
17*b2055c35SXin Li // Author: Skal ([email protected])
18*b2055c35SXin Li
19*b2055c35SXin Li #include <assert.h>
20*b2055c35SXin Li #include <stdlib.h>
21*b2055c35SXin Li #include <string.h>
22*b2055c35SXin Li
23*b2055c35SXin Li #include "src/enc/cost_enc.h"
24*b2055c35SXin Li #include "src/enc/vp8i_enc.h"
25*b2055c35SXin Li #include "src/utils/utils.h"
26*b2055c35SXin Li
27*b2055c35SXin Li #if !defined(DISABLE_TOKEN_BUFFER)
28*b2055c35SXin Li
29*b2055c35SXin Li // we use pages to reduce the number of memcpy()
30*b2055c35SXin Li #define MIN_PAGE_SIZE 8192 // minimum number of token per page
31*b2055c35SXin Li #define FIXED_PROBA_BIT (1u << 14)
32*b2055c35SXin Li
33*b2055c35SXin Li typedef uint16_t token_t; // bit #15: bit value
34*b2055c35SXin Li // bit #14: flags for constant proba or idx
35*b2055c35SXin Li // bits #0..13: slot or constant proba
36*b2055c35SXin Li struct VP8Tokens {
37*b2055c35SXin Li VP8Tokens* next_; // pointer to next page
38*b2055c35SXin Li };
39*b2055c35SXin Li // Token data is located in memory just after the next_ field.
40*b2055c35SXin Li // This macro is used to return their address and hide the trick.
41*b2055c35SXin Li #define TOKEN_DATA(p) ((const token_t*)&(p)[1])
42*b2055c35SXin Li
43*b2055c35SXin Li //------------------------------------------------------------------------------
44*b2055c35SXin Li
// Puts 'b' into the empty state: no pages, no room left, no error.
// 'page_size' is the requested number of tokens per page; values below
// MIN_PAGE_SIZE are raised to MIN_PAGE_SIZE.
void VP8TBufferInit(VP8TBuffer* const b, int page_size) {
  int tokens_per_page = page_size;
  if (tokens_per_page < MIN_PAGE_SIZE) {
    tokens_per_page = MIN_PAGE_SIZE;
  }
  b->page_size_ = tokens_per_page;
  b->error_ = 0;
  b->left_ = 0;
  b->tokens_ = NULL;
  b->pages_ = NULL;
  // With an empty list, the link to fill next is the list head itself.
  b->last_page_ = &b->pages_;
}
53*b2055c35SXin Li
// Frees every page owned by 'b' and re-initializes it with its current page
// size. Does nothing when 'b' is NULL.
void VP8TBufferClear(VP8TBuffer* const b) {
  VP8Tokens* page;
  if (b == NULL) return;

  page = b->pages_;
  while (page != NULL) {
    VP8Tokens* const doomed = page;
    page = page->next_;  // fetch the link before the page is released
    WebPSafeFree(doomed);
  }
  VP8TBufferInit(b, b->page_size_);
}
65*b2055c35SXin Li
// Allocates a new page, appends it to the page list of 'b' and makes it the
// current write target with page_size_ free slots.
// Returns 1 on success. Returns 0 and sets b->error_ when the buffer is
// already in error state (no allocation is attempted) or the allocation fails.
static int TBufferNewPage(VP8TBuffer* const b) {
  VP8Tokens* fresh = NULL;
  if (b->error_ == 0) {
    // One header immediately followed by page_size_ tokens.
    const size_t bytes = sizeof(*fresh) + b->page_size_ * sizeof(token_t);
    fresh = (VP8Tokens*)WebPSafeMalloc(1ULL, bytes);
  }
  if (fresh == NULL) {
    b->error_ = 1;
    return 0;
  }

  fresh->next_ = NULL;
  *b->last_page_ = fresh;          // hook the page at the tail of the list
  b->last_page_ = &fresh->next_;   // next append goes after this page
  b->tokens_ = (token_t*)TOKEN_DATA(fresh);
  b->left_ = b->page_size_;
  return 1;
}
84*b2055c35SXin Li
85*b2055c35SXin Li //------------------------------------------------------------------------------
86*b2055c35SXin Li
// Flattens (type, band, context) into the index of the first probability slot
// of that triplet; each triplet owns NUM_PROBAS consecutive slots.
#define TOKEN_ID(type, band, context) \
    (NUM_PROBAS * ((context) + NUM_CTX * ((band) + NUM_BANDS * (type))))
89*b2055c35SXin Li
AddToken(VP8TBuffer * const b,uint32_t bit,uint32_t proba_idx,proba_t * const stats)90*b2055c35SXin Li static WEBP_INLINE uint32_t AddToken(VP8TBuffer* const b, uint32_t bit,
91*b2055c35SXin Li uint32_t proba_idx,
92*b2055c35SXin Li proba_t* const stats) {
93*b2055c35SXin Li assert(proba_idx < FIXED_PROBA_BIT);
94*b2055c35SXin Li assert(bit <= 1);
95*b2055c35SXin Li if (b->left_ > 0 || TBufferNewPage(b)) {
96*b2055c35SXin Li const int slot = --b->left_;
97*b2055c35SXin Li b->tokens_[slot] = (bit << 15) | proba_idx;
98*b2055c35SXin Li }
99*b2055c35SXin Li VP8RecordStats(bit, stats);
100*b2055c35SXin Li return bit;
101*b2055c35SXin Li }
102*b2055c35SXin Li
AddConstantToken(VP8TBuffer * const b,uint32_t bit,uint32_t proba)103*b2055c35SXin Li static WEBP_INLINE void AddConstantToken(VP8TBuffer* const b,
104*b2055c35SXin Li uint32_t bit, uint32_t proba) {
105*b2055c35SXin Li assert(proba < 256);
106*b2055c35SXin Li assert(bit <= 1);
107*b2055c35SXin Li if (b->left_ > 0 || TBufferNewPage(b)) {
108*b2055c35SXin Li const int slot = --b->left_;
109*b2055c35SXin Li b->tokens_[slot] = (bit << 15) | FIXED_PROBA_BIT | proba;
110*b2055c35SXin Li }
111*b2055c35SXin Li }
112*b2055c35SXin Li
// Converts the coefficients of 'res' (positions res->first .. 15) into tokens
// appended to 'tokens', updating the statistics in res->stats along the way.
// 'ctx' is the context used for the first coefficient.
// Returns 0 when the block is flagged as empty (res->last < 0), 1 otherwise.
int VP8RecordCoeffTokens(int ctx, const struct VP8Residual* const res,
                         VP8TBuffer* const tokens) {
  const int16_t* const coeffs = res->coeffs;
  const int type = res->coeff_type;
  const int last = res->last;
  int n = res->first;
  uint32_t base_id = TOKEN_ID(type, n, ctx);
  // should be stats[VP8EncBands[n]], but it's equivalent for n=0 or 1
  proba_t* s = res->stats[n][ctx];

  // First token: is there any coefficient at all?
  if (!AddToken(tokens, last >= 0, base_id + 0, s + 0)) {
    return 0;
  }

  while (n < 16) {
    const int c = coeffs[n++];
    const int sign = c < 0;
    const uint32_t v = sign ? -c : c;
    int next_ctx;
    int band;

    if (!AddToken(tokens, v != 0, base_id + 1, s + 1)) {
      // Zero coefficient: no sign and no end-of-block token follow it.
      band = VP8EncBands[n];
      base_id = TOKEN_ID(type, band, 0);  // ctx=0
      s = res->stats[band][0];
      continue;
    }

    if (!AddToken(tokens, v > 1, base_id + 2, s + 2)) {
      next_ctx = 1;  // |coeff| == 1
    } else {
      if (!AddToken(tokens, v > 4, base_id + 3, s + 3)) {
        // v in [2..4]
        if (AddToken(tokens, v != 2, base_id + 4, s + 4)) {
          AddToken(tokens, v == 4, base_id + 5, s + 5);
        }
      } else if (!AddToken(tokens, v > 10, base_id + 6, s + 6)) {
        // v in [5..10]
        if (!AddToken(tokens, v > 6, base_id + 7, s + 7)) {
          AddConstantToken(tokens, v == 6, 159);
        } else {
          AddConstantToken(tokens, v >= 9, 165);
          AddConstantToken(tokens, !(v & 1), 145);
        }
      } else {
        // v > 10: pick one of four categories, then emit the extra bits with
        // the constant probabilities of the matching table.
        const uint32_t offset = v - 3;
        const int cat = (offset < (8 << 1)) ? 0    // VP8Cat3 (3b)
                      : (offset < (8 << 2)) ? 1    // VP8Cat4 (4b)
                      : (offset < (8 << 3)) ? 2    // VP8Cat5 (5b)
                      : 3;                         // VP8Cat6 (11b)
        const int hi = cat >> 1;
        const int lo = cat & 1;
        uint32_t residue;
        int mask;
        const uint8_t* tab;

        AddToken(tokens, hi, base_id + 8, s + 8);
        // NOTE(review): for categories 5 and 6 the selector uses slot
        // base_id + 10 while its statistics are recorded at s + 9. This is
        // kept exactly as found -- confirm it is intended.
        AddToken(tokens, lo, base_id + 9 + hi, s + 9);

        residue = offset - (8u << cat);
        switch (cat) {
          case 0:
            mask = 1 << 2;
            tab = VP8Cat3;
            break;
          case 1:
            mask = 1 << 3;
            tab = VP8Cat4;
            break;
          case 2:
            mask = 1 << 4;
            tab = VP8Cat5;
            break;
          default:
            mask = 1 << 10;
            tab = VP8Cat6;
            break;
        }
        for (; mask != 0; mask >>= 1) {
          AddConstantToken(tokens, !!(residue & mask), *tab++);
        }
      }
      next_ctx = 2;  // |coeff| >= 2
    }

    // Switch to the probabilities of the next position before the
    // end-of-block decision, which is coded in that new context.
    band = VP8EncBands[n];
    base_id = TOKEN_ID(type, band, next_ctx);
    s = res->stats[band][next_ctx];

    AddConstantToken(tokens, sign, 128);
    if (n == 16 || !AddToken(tokens, n <= last, base_id + 0, s + 0)) {
      return 1;   // EOB
    }
  }
  return 1;
}
194*b2055c35SXin Li
195*b2055c35SXin Li #undef TOKEN_ID
196*b2055c35SXin Li
197*b2055c35SXin Li //------------------------------------------------------------------------------
198*b2055c35SXin Li // Final coding pass, with known probabilities
199*b2055c35SXin Li
// Writes all the recorded tokens of 'b' to the bit writer 'bw', in recording
// order. Tokens flagged with FIXED_PROBA_BIT carry their own probability in
// their low 8 bits; the others look their probability up in 'probas' using
// their 14-bit slot index.
// If 'final_pass' is non-zero, each page is freed once written and 'b' is left
// empty and reusable: no pages and no free slot, with page_size_ and error_
// untouched. Otherwise 'b' is left unmodified.
// 'b' must not be in error state. Always returns 1.
int VP8EmitTokens(VP8TBuffer* const b, VP8BitWriter* const bw,
                  const uint8_t* const probas, int final_pass) {
  const VP8Tokens* p = b->pages_;
  assert(!b->error_);
  while (p != NULL) {
    const VP8Tokens* const next = p->next_;
    // Pages are filled from index page_size_ - 1 downward. Only the last page
    // can be partially filled, its valid tokens being [left_, page_size_).
    const int N = (next == NULL) ? b->left_ : 0;
    int n = b->page_size_;
    const token_t* const tokens = TOKEN_DATA(p);
    while (n-- > N) {
      const token_t token = tokens[n];
      const int bit = (token >> 15) & 1;
      if (token & FIXED_PROBA_BIT) {
        VP8PutBit(bw, bit, token & 0xffu);  // constant proba
      } else {
        VP8PutBit(bw, bit, probas[token & 0x3fffu]);
      }
    }
    if (final_pass) WebPSafeFree((void*)p);
    p = next;
  }
  if (final_pass) {
    // All pages are gone: also drop the write cursor and the tail link, which
    // would otherwise keep pointing into the freed last page and let a later
    // AddToken() write into released memory.
    b->pages_ = NULL;
    b->last_page_ = &b->pages_;
    b->tokens_ = NULL;
    b->left_ = 0;
  }
  return 1;
}
224*b2055c35SXin Li
225*b2055c35SXin Li // Size estimation
// Returns the sum of VP8BitCost() over all the tokens recorded in 'b', using
// 'probas' for the tokens that reference a probability slot and the embedded
// 8-bit probability for the others. 'b' is left unmodified and must not be in
// error state.
size_t VP8EstimateTokenSize(VP8TBuffer* const b, const uint8_t* const probas) {
  size_t total = 0;
  const VP8Tokens* page = b->pages_;
  assert(!b->error_);
  for (; page != NULL; page = page->next_) {
    const token_t* const data = TOKEN_DATA(page);
    // Only the last page can be partially filled: its valid tokens start at
    // index left_. All other pages are visited entirely.
    const int first = (page->next_ == NULL) ? b->left_ : 0;
    int i;
    for (i = b->page_size_ - 1; i >= first; --i) {
      const token_t token = data[i];
      const int bit = token & (1 << 15);  // non-zero iff the bit value is 1
      if (token & FIXED_PROBA_BIT) {
        total += VP8BitCost(bit, token & 0xffu);
      } else {
        total += VP8BitCost(bit, probas[token & 0x3fffu]);
      }
    }
  }
  return total;
}
248*b2055c35SXin Li
249*b2055c35SXin Li //------------------------------------------------------------------------------
250*b2055c35SXin Li
251*b2055c35SXin Li #else // DISABLE_TOKEN_BUFFER
252*b2055c35SXin Li
// Variant used when DISABLE_TOKEN_BUFFER is defined: does nothing, both
// arguments are ignored.
void VP8TBufferInit(VP8TBuffer* const b, int page_size) {
  (void)page_size;
  (void)b;
}
// Variant used when DISABLE_TOKEN_BUFFER is defined: does nothing, the
// argument is ignored.
void VP8TBufferClear(VP8TBuffer* const b) {
  (void)b;  // unused
}
260*b2055c35SXin Li
261*b2055c35SXin Li #endif // !DISABLE_TOKEN_BUFFER
262*b2055c35SXin Li
263