1*b2055c35SXin Li // Copyright 2014 Google Inc. All Rights Reserved.
2*b2055c35SXin Li //
3*b2055c35SXin Li // Use of this source code is governed by a BSD-style license
4*b2055c35SXin Li // that can be found in the COPYING file in the root of the source
5*b2055c35SXin Li // tree. An additional intellectual property rights grant can be found
6*b2055c35SXin Li // in the file PATENTS. All contributing project authors may
7*b2055c35SXin Li // be found in the AUTHORS file in the root of the source tree.
8*b2055c35SXin Li // -----------------------------------------------------------------------------
9*b2055c35SXin Li //
10*b2055c35SXin Li // WebPPicture utils for colorspace conversion
11*b2055c35SXin Li //
// Author: Skal (pascal.massimino@gmail.com)
13*b2055c35SXin Li
14*b2055c35SXin Li #include <assert.h>
15*b2055c35SXin Li #include <stdlib.h>
16*b2055c35SXin Li #include <math.h>
17*b2055c35SXin Li
18*b2055c35SXin Li #include "sharpyuv/sharpyuv.h"
19*b2055c35SXin Li #include "sharpyuv/sharpyuv_csp.h"
20*b2055c35SXin Li #include "src/enc/vp8i_enc.h"
21*b2055c35SXin Li #include "src/utils/random_utils.h"
22*b2055c35SXin Li #include "src/utils/utils.h"
23*b2055c35SXin Li #include "src/dsp/dsp.h"
24*b2055c35SXin Li #include "src/dsp/lossless.h"
25*b2055c35SXin Li #include "src/dsp/yuv.h"
26*b2055c35SXin Li #include "src/dsp/cpu.h"
27*b2055c35SXin Li
28*b2055c35SXin Li #if defined(WEBP_USE_THREAD) && !defined(_WIN32)
29*b2055c35SXin Li #include <pthread.h>
30*b2055c35SXin Li #endif
31*b2055c35SXin Li
// Comment out the following line to disable gamma-compression during
// RGB->U/V averaging.
#define USE_GAMMA_COMPRESSION

// When defined, 'x / alpha' is evaluated with a table of reciprocals instead
// of an integer division.
#define USE_INVERSE_ALPHA_TABLE

// CHANNEL_OFFSET(i) is the byte offset, within a uint32_t as stored in memory,
// of its i-th most significant byte.
#if defined(WORDS_BIGENDIAN)
// uint32_t 0xff000000 is stored as ff,00,00,00
#define CHANNEL_OFFSET(i) (i)
#else
// uint32_t 0xff000000 is stored as 00,00,00,ff
#define CHANNEL_OFFSET(i) (3 - (i))
#endif

// Byte offset of the alpha channel (the most significant byte of a sample).
#define ALPHA_OFFSET CHANNEL_OFFSET(0)
47*b2055c35SXin Li
48*b2055c35SXin Li //------------------------------------------------------------------------------
49*b2055c35SXin Li // Detection of non-trivial transparency
50*b2055c35SXin Li
// Walks 'height' rows of 'width' alpha samples, consecutive rows being
// 'y_step' bytes apart. Returns 1 as soon as one row is reported as containing
// a non-0xff value, 0 otherwise (including when 'alpha' is NULL).
// Rows are tested with WebPHasAlpha8b() when 'x_step' is 1, and with
// WebPHasAlpha32b() for any other 'x_step'.
static int CheckNonOpaque(const uint8_t* alpha, int width, int height,
                          int x_step, int y_step) {
  const int use_32b_check = (x_step != 1);
  int rows_left = height;
  if (alpha == NULL) return 0;
  WebPInitAlphaProcessing();
  while (rows_left-- > 0) {
    const int row_has_alpha = use_32b_check ? WebPHasAlpha32b(alpha, width)
                                            : WebPHasAlpha8b(alpha, width);
    if (row_has_alpha) return 1;
    alpha += y_step;
  }
  return 0;
}
67*b2055c35SXin Li
68*b2055c35SXin Li // Checking for the presence of non-opaque alpha.
WebPPictureHasTransparency(const WebPPicture * picture)69*b2055c35SXin Li int WebPPictureHasTransparency(const WebPPicture* picture) {
70*b2055c35SXin Li if (picture == NULL) return 0;
71*b2055c35SXin Li if (picture->use_argb) {
72*b2055c35SXin Li if (picture->argb != NULL) {
73*b2055c35SXin Li return CheckNonOpaque((const uint8_t*)picture->argb + ALPHA_OFFSET,
74*b2055c35SXin Li picture->width, picture->height,
75*b2055c35SXin Li 4, picture->argb_stride * sizeof(*picture->argb));
76*b2055c35SXin Li }
77*b2055c35SXin Li return 0;
78*b2055c35SXin Li }
79*b2055c35SXin Li return CheckNonOpaque(picture->a, picture->width, picture->height,
80*b2055c35SXin Li 1, picture->a_stride);
81*b2055c35SXin Li }
82*b2055c35SXin Li
83*b2055c35SXin Li //------------------------------------------------------------------------------
84*b2055c35SXin Li // Code for gamma correction
85*b2055c35SXin Li
86*b2055c35SXin Li #if defined(USE_GAMMA_COMPRESSION)
87*b2055c35SXin Li
88*b2055c35SXin Li // Gamma correction compensates loss of resolution during chroma subsampling.
89*b2055c35SXin Li #define GAMMA_FIX 12 // fixed-point precision for linear values
90*b2055c35SXin Li #define GAMMA_TAB_FIX 7 // fixed-point fractional bits precision
91*b2055c35SXin Li #define GAMMA_TAB_SIZE (1 << (GAMMA_FIX - GAMMA_TAB_FIX))
92*b2055c35SXin Li static const double kGamma = 0.80;
93*b2055c35SXin Li static const int kGammaScale = ((1 << GAMMA_FIX) - 1);
94*b2055c35SXin Li static const int kGammaTabScale = (1 << GAMMA_TAB_FIX);
95*b2055c35SXin Li static const int kGammaTabRounder = (1 << GAMMA_TAB_FIX >> 1);
96*b2055c35SXin Li
97*b2055c35SXin Li static int kLinearToGammaTab[GAMMA_TAB_SIZE + 1];
98*b2055c35SXin Li static uint16_t kGammaToLinearTab[256];
99*b2055c35SXin Li static volatile int kGammaTablesOk = 0;
100*b2055c35SXin Li static void InitGammaTables(void);
101*b2055c35SXin Li extern VP8CPUInfo VP8GetCPUInfo;
102*b2055c35SXin Li
WEBP_DSP_INIT_FUNC(InitGammaTables)103*b2055c35SXin Li WEBP_DSP_INIT_FUNC(InitGammaTables) {
104*b2055c35SXin Li if (!kGammaTablesOk) {
105*b2055c35SXin Li int v;
106*b2055c35SXin Li const double scale = (double)(1 << GAMMA_TAB_FIX) / kGammaScale;
107*b2055c35SXin Li const double norm = 1. / 255.;
108*b2055c35SXin Li for (v = 0; v <= 255; ++v) {
109*b2055c35SXin Li kGammaToLinearTab[v] =
110*b2055c35SXin Li (uint16_t)(pow(norm * v, kGamma) * kGammaScale + .5);
111*b2055c35SXin Li }
112*b2055c35SXin Li for (v = 0; v <= GAMMA_TAB_SIZE; ++v) {
113*b2055c35SXin Li kLinearToGammaTab[v] = (int)(255. * pow(scale * v, 1. / kGamma) + .5);
114*b2055c35SXin Li }
115*b2055c35SXin Li kGammaTablesOk = 1;
116*b2055c35SXin Li }
117*b2055c35SXin Li }
118*b2055c35SXin Li
GammaToLinear(uint8_t v)119*b2055c35SXin Li static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) {
120*b2055c35SXin Li return kGammaToLinearTab[v];
121*b2055c35SXin Li }
122*b2055c35SXin Li
Interpolate(int v)123*b2055c35SXin Li static WEBP_INLINE int Interpolate(int v) {
124*b2055c35SXin Li const int tab_pos = v >> (GAMMA_TAB_FIX + 2); // integer part
125*b2055c35SXin Li const int x = v & ((kGammaTabScale << 2) - 1); // fractional part
126*b2055c35SXin Li const int v0 = kLinearToGammaTab[tab_pos];
127*b2055c35SXin Li const int v1 = kLinearToGammaTab[tab_pos + 1];
128*b2055c35SXin Li const int y = v1 * x + v0 * ((kGammaTabScale << 2) - x); // interpolate
129*b2055c35SXin Li assert(tab_pos + 1 < GAMMA_TAB_SIZE + 1);
130*b2055c35SXin Li return y;
131*b2055c35SXin Li }
132*b2055c35SXin Li
133*b2055c35SXin Li // Convert a linear value 'v' to YUV_FIX+2 fixed-point precision
134*b2055c35SXin Li // U/V value, suitable for RGBToU/V calls.
LinearToGamma(uint32_t base_value,int shift)135*b2055c35SXin Li static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) {
136*b2055c35SXin Li const int y = Interpolate(base_value << shift); // final uplifted value
137*b2055c35SXin Li return (y + kGammaTabRounder) >> GAMMA_TAB_FIX; // descale
138*b2055c35SXin Li }
139*b2055c35SXin Li
140*b2055c35SXin Li #else
141*b2055c35SXin Li
InitGammaTables(void)142*b2055c35SXin Li static void InitGammaTables(void) {}
GammaToLinear(uint8_t v)143*b2055c35SXin Li static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { return v; }
LinearToGamma(uint32_t base_value,int shift)144*b2055c35SXin Li static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) {
145*b2055c35SXin Li return (int)(base_value << shift);
146*b2055c35SXin Li }
147*b2055c35SXin Li
148*b2055c35SXin Li #endif // USE_GAMMA_COMPRESSION
149*b2055c35SXin Li
150*b2055c35SXin Li //------------------------------------------------------------------------------
151*b2055c35SXin Li // RGB -> YUV conversion
152*b2055c35SXin Li
// Returns VP8RGBToY() of (r, g, b). The last argument is YUV_HALF when no
// random generator is supplied, and YUV_FIX random bits drawn from 'rg'
// otherwise (dithering).
static int RGBToY(int r, int g, int b, VP8Random* const rg) {
  if (rg != NULL) {
    return VP8RGBToY(r, g, b, VP8RandomBits(rg, YUV_FIX));
  }
  return VP8RGBToY(r, g, b, YUV_HALF);
}
157*b2055c35SXin Li
// Returns VP8RGBToU() of (r, g, b). The last argument is (YUV_HALF << 2) when
// no random generator is supplied, and YUV_FIX + 2 random bits drawn from 'rg'
// otherwise (dithering).
static int RGBToU(int r, int g, int b, VP8Random* const rg) {
  if (rg != NULL) {
    return VP8RGBToU(r, g, b, VP8RandomBits(rg, YUV_FIX + 2));
  }
  return VP8RGBToU(r, g, b, YUV_HALF << 2);
}
162*b2055c35SXin Li
// Returns VP8RGBToV() of (r, g, b). The last argument is (YUV_HALF << 2) when
// no random generator is supplied, and YUV_FIX + 2 random bits drawn from 'rg'
// otherwise (dithering).
static int RGBToV(int r, int g, int b, VP8Random* const rg) {
  if (rg != NULL) {
    return VP8RGBToV(r, g, b, VP8RandomBits(rg, YUV_FIX + 2));
  }
  return VP8RGBToV(r, g, b, YUV_HALF << 2);
}
167*b2055c35SXin Li
168*b2055c35SXin Li //------------------------------------------------------------------------------
169*b2055c35SXin Li // Sharp RGB->YUV conversion
170*b2055c35SXin Li
// The iterative (sharp) conversion is turned off for pictures whose width or
// height is below this value.
static const int kMinDimensionIterativeConversion = 4;
172*b2055c35SXin Li
173*b2055c35SXin Li //------------------------------------------------------------------------------
174*b2055c35SXin Li // Main function
175*b2055c35SXin Li
// Converts the 8-bit R/G/B samples (pixels 'step' bytes apart, rows
// 'rgb_stride' bytes apart) into the 8-bit Y/U/V planes of 'picture' with
// SharpYuvConvert(), using the kSharpYuvMatrixWebp conversion matrix.
// Returns the non-zero result of SharpYuvConvert() on success. On failure,
// VP8_ENC_ERROR_OUT_OF_MEMORY is recorded through WebPEncodingSetError() and
// that call's return value is returned.
static int PreprocessARGB(const uint8_t* r_ptr,
                          const uint8_t* g_ptr,
                          const uint8_t* b_ptr,
                          int step, int rgb_stride,
                          WebPPicture* const picture) {
  const int ok = SharpYuvConvert(
      r_ptr, g_ptr, b_ptr, step, rgb_stride, /*rgb_bit_depth=*/8,
      picture->y, picture->y_stride,
      picture->u, picture->uv_stride,
      picture->v, picture->uv_stride,
      /*yuv_bit_depth=*/8,
      picture->width, picture->height,
      SharpYuvGetConversionMatrix(kSharpYuvMatrixWebp));
  return ok ? ok
            : WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY);
}
191*b2055c35SXin Li
192*b2055c35SXin Li //------------------------------------------------------------------------------
193*b2055c35SXin Li // "Fast" regular RGB->YUV
194*b2055c35SXin Li
// NOTE: the macros below pick up 'rgb_stride' (distance in bytes to the row
// underneath) from the scope in which they are expanded.

// Gamma-aware sum of the four samples of a 2x2 block; horizontally adjacent
// samples are 'step' bytes apart.
#define SUM4(ptr, step) LinearToGamma(                   \
    GammaToLinear((ptr)[0]) +                            \
    GammaToLinear((ptr)[(step)]) +                       \
    GammaToLinear((ptr)[rgb_stride]) +                   \
    GammaToLinear((ptr)[rgb_stride + (step)]), 0)

// Same for a 1x2 column; the sum is shifted left by one to compensate for
// having only two samples.
#define SUM2(ptr)                                                        \
    LinearToGamma(GammaToLinear((ptr)[0]) + GammaToLinear((ptr)[rgb_stride]), 1)

// Plain sums of two vertically adjacent alpha values, and of a 2x2 block of
// them (the next pixel being 4 bytes further).
#define SUM2ALPHA(ptr) ((ptr)[0] + (ptr)[rgb_stride])
#define SUM4ALPHA(ptr) (SUM2ALPHA(ptr) + SUM2ALPHA((ptr) + 4))
206*b2055c35SXin Li
207*b2055c35SXin Li #if defined(USE_INVERSE_ALPHA_TABLE)
208*b2055c35SXin Li
// Number of fractional bits of the reciprocals stored in kInvAlpha[].
static const int kAlphaFix = 19;

// kInvAlpha[a] holds (1 << kAlphaFix) / a, so that
// (v * kInvAlpha[a]) >> kAlphaFix equals v / a in most (99.6%) cases.
// The table and kAlphaFix are tuned very tightly to fit 32b arithmetic: they
// rely on the operands of 'v / a' being derived as
//   v = (a0.p0 + a1.p1 + a2.p2 + a3.p3) and a = a0 + a1 + a2 + a3
// with ai in [0..255] and pi in [0..1<<GAMMA_FIX). The constraint to avoid
// overflow is: GAMMA_FIX + kAlphaFix <= 31.
static const uint32_t kInvAlpha[4 * 0xff + 1] = {
  0,  /* alpha = 0 */
  524288, 262144, 174762, 131072, 104857, 87381, 74898, 65536,
  58254, 52428, 47662, 43690, 40329, 37449, 34952, 32768,
  30840, 29127, 27594, 26214, 24966, 23831, 22795, 21845,
  20971, 20164, 19418, 18724, 18078, 17476, 16912, 16384,
  15887, 15420, 14979, 14563, 14169, 13797, 13443, 13107,
  12787, 12483, 12192, 11915, 11650, 11397, 11155, 10922,
  10699, 10485, 10280, 10082, 9892, 9709, 9532, 9362,
  9198, 9039, 8886, 8738, 8594, 8456, 8322, 8192,
  8065, 7943, 7825, 7710, 7598, 7489, 7384, 7281,
  7182, 7084, 6990, 6898, 6808, 6721, 6636, 6553,
  6472, 6393, 6316, 6241, 6168, 6096, 6026, 5957,
  5890, 5825, 5761, 5698, 5637, 5577, 5518, 5461,
  5405, 5349, 5295, 5242, 5190, 5140, 5090, 5041,
  4993, 4946, 4899, 4854, 4809, 4766, 4723, 4681,
  4639, 4599, 4559, 4519, 4481, 4443, 4405, 4369,
  4332, 4297, 4262, 4228, 4194, 4161, 4128, 4096,
  4064, 4032, 4002, 3971, 3942, 3912, 3883, 3855,
  3826, 3799, 3771, 3744, 3718, 3692, 3666, 3640,
  3615, 3591, 3566, 3542, 3518, 3495, 3472, 3449,
  3426, 3404, 3382, 3360, 3339, 3318, 3297, 3276,
  3256, 3236, 3216, 3196, 3177, 3158, 3139, 3120,
  3102, 3084, 3066, 3048, 3030, 3013, 2995, 2978,
  2962, 2945, 2928, 2912, 2896, 2880, 2864, 2849,
  2833, 2818, 2803, 2788, 2774, 2759, 2744, 2730,
  2716, 2702, 2688, 2674, 2661, 2647, 2634, 2621,
  2608, 2595, 2582, 2570, 2557, 2545, 2532, 2520,
  2508, 2496, 2484, 2473, 2461, 2449, 2438, 2427,
  2416, 2404, 2394, 2383, 2372, 2361, 2351, 2340,
  2330, 2319, 2309, 2299, 2289, 2279, 2269, 2259,
  2250, 2240, 2231, 2221, 2212, 2202, 2193, 2184,
  2175, 2166, 2157, 2148, 2139, 2131, 2122, 2114,
  2105, 2097, 2088, 2080, 2072, 2064, 2056, 2048,
  2040, 2032, 2024, 2016, 2008, 2001, 1993, 1985,
  1978, 1971, 1963, 1956, 1949, 1941, 1934, 1927,
  1920, 1913, 1906, 1899, 1892, 1885, 1879, 1872,
  1865, 1859, 1852, 1846, 1839, 1833, 1826, 1820,
  1814, 1807, 1801, 1795, 1789, 1783, 1777, 1771,
  1765, 1759, 1753, 1747, 1741, 1736, 1730, 1724,
  1718, 1713, 1707, 1702, 1696, 1691, 1685, 1680,
  1675, 1669, 1664, 1659, 1653, 1648, 1643, 1638,
  1633, 1628, 1623, 1618, 1613, 1608, 1603, 1598,
  1593, 1588, 1583, 1579, 1574, 1569, 1565, 1560,
  1555, 1551, 1546, 1542, 1537, 1533, 1528, 1524,
  1519, 1515, 1510, 1506, 1502, 1497, 1493, 1489,
  1485, 1481, 1476, 1472, 1468, 1464, 1460, 1456,
  1452, 1448, 1444, 1440, 1436, 1432, 1428, 1424,
  1420, 1416, 1413, 1409, 1405, 1401, 1398, 1394,
  1390, 1387, 1383, 1379, 1376, 1372, 1368, 1365,
  1361, 1358, 1354, 1351, 1347, 1344, 1340, 1337,
  1334, 1330, 1327, 1323, 1320, 1317, 1314, 1310,
  1307, 1304, 1300, 1297, 1294, 1291, 1288, 1285,
  1281, 1278, 1275, 1272, 1269, 1266, 1263, 1260,
  1257, 1254, 1251, 1248, 1245, 1242, 1239, 1236,
  1233, 1230, 1227, 1224, 1222, 1219, 1216, 1213,
  1210, 1208, 1205, 1202, 1199, 1197, 1194, 1191,
  1188, 1186, 1183, 1180, 1178, 1175, 1172, 1170,
  1167, 1165, 1162, 1159, 1157, 1154, 1152, 1149,
  1147, 1144, 1142, 1139, 1137, 1134, 1132, 1129,
  1127, 1125, 1122, 1120, 1117, 1115, 1113, 1110,
  1108, 1106, 1103, 1101, 1099, 1096, 1094, 1092,
  1089, 1087, 1085, 1083, 1081, 1078, 1076, 1074,
  1072, 1069, 1067, 1065, 1063, 1061, 1059, 1057,
  1054, 1052, 1050, 1048, 1046, 1044, 1042, 1040,
  1038, 1036, 1034, 1032, 1030, 1028, 1026, 1024,
  1022, 1020, 1018, 1016, 1014, 1012, 1010, 1008,
  1006, 1004, 1002, 1000, 998, 996, 994, 992,
  991, 989, 987, 985, 983, 981, 979, 978,
  976, 974, 972, 970, 969, 967, 965, 963,
  961, 960, 958, 956, 954, 953, 951, 949,
  948, 946, 944, 942, 941, 939, 937, 936,
  934, 932, 931, 929, 927, 926, 924, 923,
  921, 919, 918, 916, 914, 913, 911, 910,
  908, 907, 905, 903, 902, 900, 899, 897,
  896, 894, 893, 891, 890, 888, 887, 885,
  884, 882, 881, 879, 878, 876, 875, 873,
  872, 870, 869, 868, 866, 865, 863, 862,
  860, 859, 858, 856, 855, 853, 852, 851,
  849, 848, 846, 845, 844, 842, 841, 840,
  838, 837, 836, 834, 833, 832, 830, 829,
  828, 826, 825, 824, 823, 821, 820, 819,
  817, 816, 815, 814, 812, 811, 810, 809,
  807, 806, 805, 804, 802, 801, 800, 799,
  798, 796, 795, 794, 793, 791, 790, 789,
  788, 787, 786, 784, 783, 782, 781, 780,
  779, 777, 776, 775, 774, 773, 772, 771,
  769, 768, 767, 766, 765, 764, 763, 762,
  760, 759, 758, 757, 756, 755, 754, 753,
  752, 751, 750, 748, 747, 746, 745, 744,
  743, 742, 741, 740, 739, 738, 737, 736,
  735, 734, 733, 732, 731, 730, 729, 728,
  727, 726, 725, 724, 723, 722, 721, 720,
  719, 718, 717, 716, 715, 714, 713, 712,
  711, 710, 709, 708, 707, 706, 705, 704,
  703, 702, 701, 700, 699, 699, 698, 697,
  696, 695, 694, 693, 692, 691, 690, 689,
  688, 688, 687, 686, 685, 684, 683, 682,
  681, 680, 680, 679, 678, 677, 676, 675,
  674, 673, 673, 672, 671, 670, 669, 668,
  667, 667, 666, 665, 664, 663, 662, 661,
  661, 660, 659, 658, 657, 657, 656, 655,
  654, 653, 652, 652, 651, 650, 649, 648,
  648, 647, 646, 645, 644, 644, 643, 642,
  641, 640, 640, 639, 638, 637, 637, 636,
  635, 634, 633, 633, 632, 631, 630, 630,
  629, 628, 627, 627, 626, 625, 624, 624,
  623, 622, 621, 621, 620, 619, 618, 618,
  617, 616, 616, 615, 614, 613, 613, 612,
  611, 611, 610, 609, 608, 608, 607, 606,
  606, 605, 604, 604, 603, 602, 601, 601,
  600, 599, 599, 598, 597, 597, 596, 595,
  595, 594, 593, 593, 592, 591, 591, 590,
  589, 589, 588, 587, 587, 586, 585, 585,
  584, 583, 583, 582, 581, 581, 580, 579,
  579, 578, 578, 577, 576, 576, 575, 574,
  574, 573, 572, 572, 571, 571, 570, 569,
  569, 568, 568, 567, 566, 566, 565, 564,
  564, 563, 563, 562, 561, 561, 560, 560,
  559, 558, 558, 557, 557, 556, 555, 555,
  554, 554, 553, 553, 552, 551, 551, 550,
  550, 549, 548, 548, 547, 547, 546, 546,
  545, 544, 544, 543, 543, 542, 542, 541,
  541, 540, 539, 539, 538, 538, 537, 537,
  536, 536, 535, 534, 534, 533, 533, 532,
  532, 531, 531, 530, 530, 529, 529, 528,
  527, 527, 526, 526, 525, 525, 524, 524,
  523, 523, 522, 522, 521, 521, 520, 520,
  519, 519, 518, 518, 517, 517, 516, 516,
  515, 515, 514, 514
};
348*b2055c35SXin Li
349*b2055c35SXin Li // Note that LinearToGamma() expects the values to be premultiplied by 4,
350*b2055c35SXin Li // so we incorporate this factor 4 inside the DIVIDE_BY_ALPHA macro directly.
351*b2055c35SXin Li #define DIVIDE_BY_ALPHA(sum, a) (((sum) * kInvAlpha[(a)]) >> (kAlphaFix - 2))
352*b2055c35SXin Li
353*b2055c35SXin Li #else
354*b2055c35SXin Li
355*b2055c35SXin Li #define DIVIDE_BY_ALPHA(sum, a) (4 * (sum) / (a))
356*b2055c35SXin Li
357*b2055c35SXin Li #endif // USE_INVERSE_ALPHA_TABLE
358*b2055c35SXin Li
LinearToGammaWeighted(const uint8_t * src,const uint8_t * a_ptr,uint32_t total_a,int step,int rgb_stride)359*b2055c35SXin Li static WEBP_INLINE int LinearToGammaWeighted(const uint8_t* src,
360*b2055c35SXin Li const uint8_t* a_ptr,
361*b2055c35SXin Li uint32_t total_a, int step,
362*b2055c35SXin Li int rgb_stride) {
363*b2055c35SXin Li const uint32_t sum =
364*b2055c35SXin Li a_ptr[0] * GammaToLinear(src[0]) +
365*b2055c35SXin Li a_ptr[step] * GammaToLinear(src[step]) +
366*b2055c35SXin Li a_ptr[rgb_stride] * GammaToLinear(src[rgb_stride]) +
367*b2055c35SXin Li a_ptr[rgb_stride + step] * GammaToLinear(src[rgb_stride + step]);
368*b2055c35SXin Li assert(total_a > 0 && total_a <= 4 * 0xff);
369*b2055c35SXin Li #if defined(USE_INVERSE_ALPHA_TABLE)
370*b2055c35SXin Li assert((uint64_t)sum * kInvAlpha[total_a] < ((uint64_t)1 << 32));
371*b2055c35SXin Li #endif
372*b2055c35SXin Li return LinearToGamma(DIVIDE_BY_ALPHA(sum, total_a), 0);
373*b2055c35SXin Li }
374*b2055c35SXin Li
ConvertRowToY(const uint8_t * const r_ptr,const uint8_t * const g_ptr,const uint8_t * const b_ptr,int step,uint8_t * const dst_y,int width,VP8Random * const rg)375*b2055c35SXin Li static WEBP_INLINE void ConvertRowToY(const uint8_t* const r_ptr,
376*b2055c35SXin Li const uint8_t* const g_ptr,
377*b2055c35SXin Li const uint8_t* const b_ptr,
378*b2055c35SXin Li int step,
379*b2055c35SXin Li uint8_t* const dst_y,
380*b2055c35SXin Li int width,
381*b2055c35SXin Li VP8Random* const rg) {
382*b2055c35SXin Li int i, j;
383*b2055c35SXin Li for (i = 0, j = 0; i < width; i += 1, j += step) {
384*b2055c35SXin Li dst_y[i] = RGBToY(r_ptr[j], g_ptr[j], b_ptr[j], rg);
385*b2055c35SXin Li }
386*b2055c35SXin Li }
387*b2055c35SXin Li
AccumulateRGBA(const uint8_t * const r_ptr,const uint8_t * const g_ptr,const uint8_t * const b_ptr,const uint8_t * const a_ptr,int rgb_stride,uint16_t * dst,int width)388*b2055c35SXin Li static WEBP_INLINE void AccumulateRGBA(const uint8_t* const r_ptr,
389*b2055c35SXin Li const uint8_t* const g_ptr,
390*b2055c35SXin Li const uint8_t* const b_ptr,
391*b2055c35SXin Li const uint8_t* const a_ptr,
392*b2055c35SXin Li int rgb_stride,
393*b2055c35SXin Li uint16_t* dst, int width) {
394*b2055c35SXin Li int i, j;
395*b2055c35SXin Li // we loop over 2x2 blocks and produce one R/G/B/A value for each.
396*b2055c35SXin Li for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * 4, dst += 4) {
397*b2055c35SXin Li const uint32_t a = SUM4ALPHA(a_ptr + j);
398*b2055c35SXin Li int r, g, b;
399*b2055c35SXin Li if (a == 4 * 0xff || a == 0) {
400*b2055c35SXin Li r = SUM4(r_ptr + j, 4);
401*b2055c35SXin Li g = SUM4(g_ptr + j, 4);
402*b2055c35SXin Li b = SUM4(b_ptr + j, 4);
403*b2055c35SXin Li } else {
404*b2055c35SXin Li r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 4, rgb_stride);
405*b2055c35SXin Li g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 4, rgb_stride);
406*b2055c35SXin Li b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 4, rgb_stride);
407*b2055c35SXin Li }
408*b2055c35SXin Li dst[0] = r;
409*b2055c35SXin Li dst[1] = g;
410*b2055c35SXin Li dst[2] = b;
411*b2055c35SXin Li dst[3] = a;
412*b2055c35SXin Li }
413*b2055c35SXin Li if (width & 1) {
414*b2055c35SXin Li const uint32_t a = 2u * SUM2ALPHA(a_ptr + j);
415*b2055c35SXin Li int r, g, b;
416*b2055c35SXin Li if (a == 4 * 0xff || a == 0) {
417*b2055c35SXin Li r = SUM2(r_ptr + j);
418*b2055c35SXin Li g = SUM2(g_ptr + j);
419*b2055c35SXin Li b = SUM2(b_ptr + j);
420*b2055c35SXin Li } else {
421*b2055c35SXin Li r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 0, rgb_stride);
422*b2055c35SXin Li g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 0, rgb_stride);
423*b2055c35SXin Li b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 0, rgb_stride);
424*b2055c35SXin Li }
425*b2055c35SXin Li dst[0] = r;
426*b2055c35SXin Li dst[1] = g;
427*b2055c35SXin Li dst[2] = b;
428*b2055c35SXin Li dst[3] = a;
429*b2055c35SXin Li }
430*b2055c35SXin Li }
431*b2055c35SXin Li
AccumulateRGB(const uint8_t * const r_ptr,const uint8_t * const g_ptr,const uint8_t * const b_ptr,int step,int rgb_stride,uint16_t * dst,int width)432*b2055c35SXin Li static WEBP_INLINE void AccumulateRGB(const uint8_t* const r_ptr,
433*b2055c35SXin Li const uint8_t* const g_ptr,
434*b2055c35SXin Li const uint8_t* const b_ptr,
435*b2055c35SXin Li int step, int rgb_stride,
436*b2055c35SXin Li uint16_t* dst, int width) {
437*b2055c35SXin Li int i, j;
438*b2055c35SXin Li for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * step, dst += 4) {
439*b2055c35SXin Li dst[0] = SUM4(r_ptr + j, step);
440*b2055c35SXin Li dst[1] = SUM4(g_ptr + j, step);
441*b2055c35SXin Li dst[2] = SUM4(b_ptr + j, step);
442*b2055c35SXin Li // MemorySanitizer may raise false positives with data that passes through
443*b2055c35SXin Li // RGBA32PackedToPlanar_16b_SSE41() due to incorrect modeling of shuffles.
444*b2055c35SXin Li // See https://crbug.com/webp/573.
445*b2055c35SXin Li #ifdef WEBP_MSAN
446*b2055c35SXin Li dst[3] = 0;
447*b2055c35SXin Li #endif
448*b2055c35SXin Li }
449*b2055c35SXin Li if (width & 1) {
450*b2055c35SXin Li dst[0] = SUM2(r_ptr + j);
451*b2055c35SXin Li dst[1] = SUM2(g_ptr + j);
452*b2055c35SXin Li dst[2] = SUM2(b_ptr + j);
453*b2055c35SXin Li #ifdef WEBP_MSAN
454*b2055c35SXin Li dst[3] = 0;
455*b2055c35SXin Li #endif
456*b2055c35SXin Li }
457*b2055c35SXin Li }
458*b2055c35SXin Li
ConvertRowsToUV(const uint16_t * rgb,uint8_t * const dst_u,uint8_t * const dst_v,int width,VP8Random * const rg)459*b2055c35SXin Li static WEBP_INLINE void ConvertRowsToUV(const uint16_t* rgb,
460*b2055c35SXin Li uint8_t* const dst_u,
461*b2055c35SXin Li uint8_t* const dst_v,
462*b2055c35SXin Li int width,
463*b2055c35SXin Li VP8Random* const rg) {
464*b2055c35SXin Li int i;
465*b2055c35SXin Li for (i = 0; i < width; i += 1, rgb += 4) {
466*b2055c35SXin Li const int r = rgb[0], g = rgb[1], b = rgb[2];
467*b2055c35SXin Li dst_u[i] = RGBToU(r, g, b, rg);
468*b2055c35SXin Li dst_v[i] = RGBToV(r, g, b, rg);
469*b2055c35SXin Li }
470*b2055c35SXin Li }
471*b2055c35SXin Li
472*b2055c35SXin Li extern void SharpYuvInit(VP8CPUInfo cpu_info_func);
473*b2055c35SXin Li
ImportYUVAFromRGBA(const uint8_t * r_ptr,const uint8_t * g_ptr,const uint8_t * b_ptr,const uint8_t * a_ptr,int step,int rgb_stride,float dithering,int use_iterative_conversion,WebPPicture * const picture)474*b2055c35SXin Li static int ImportYUVAFromRGBA(const uint8_t* r_ptr,
475*b2055c35SXin Li const uint8_t* g_ptr,
476*b2055c35SXin Li const uint8_t* b_ptr,
477*b2055c35SXin Li const uint8_t* a_ptr,
478*b2055c35SXin Li int step, // bytes per pixel
479*b2055c35SXin Li int rgb_stride, // bytes per scanline
480*b2055c35SXin Li float dithering,
481*b2055c35SXin Li int use_iterative_conversion,
482*b2055c35SXin Li WebPPicture* const picture) {
483*b2055c35SXin Li int y;
484*b2055c35SXin Li const int width = picture->width;
485*b2055c35SXin Li const int height = picture->height;
486*b2055c35SXin Li const int has_alpha = CheckNonOpaque(a_ptr, width, height, step, rgb_stride);
487*b2055c35SXin Li const int is_rgb = (r_ptr < b_ptr); // otherwise it's bgr
488*b2055c35SXin Li
489*b2055c35SXin Li picture->colorspace = has_alpha ? WEBP_YUV420A : WEBP_YUV420;
490*b2055c35SXin Li picture->use_argb = 0;
491*b2055c35SXin Li
492*b2055c35SXin Li // disable smart conversion if source is too small (overkill).
493*b2055c35SXin Li if (width < kMinDimensionIterativeConversion ||
494*b2055c35SXin Li height < kMinDimensionIterativeConversion) {
495*b2055c35SXin Li use_iterative_conversion = 0;
496*b2055c35SXin Li }
497*b2055c35SXin Li
498*b2055c35SXin Li if (!WebPPictureAllocYUVA(picture)) {
499*b2055c35SXin Li return 0;
500*b2055c35SXin Li }
501*b2055c35SXin Li if (has_alpha) {
502*b2055c35SXin Li assert(step == 4);
503*b2055c35SXin Li #if defined(USE_GAMMA_COMPRESSION) && defined(USE_INVERSE_ALPHA_TABLE)
504*b2055c35SXin Li assert(kAlphaFix + GAMMA_FIX <= 31);
505*b2055c35SXin Li #endif
506*b2055c35SXin Li }
507*b2055c35SXin Li
508*b2055c35SXin Li if (use_iterative_conversion) {
509*b2055c35SXin Li SharpYuvInit(VP8GetCPUInfo);
510*b2055c35SXin Li if (!PreprocessARGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, picture)) {
511*b2055c35SXin Li return 0;
512*b2055c35SXin Li }
513*b2055c35SXin Li if (has_alpha) {
514*b2055c35SXin Li WebPExtractAlpha(a_ptr, rgb_stride, width, height,
515*b2055c35SXin Li picture->a, picture->a_stride);
516*b2055c35SXin Li }
517*b2055c35SXin Li } else {
518*b2055c35SXin Li const int uv_width = (width + 1) >> 1;
519*b2055c35SXin Li int use_dsp = (step == 3); // use special function in this case
520*b2055c35SXin Li // temporary storage for accumulated R/G/B values during conversion to U/V
521*b2055c35SXin Li uint16_t* const tmp_rgb =
522*b2055c35SXin Li (uint16_t*)WebPSafeMalloc(4 * uv_width, sizeof(*tmp_rgb));
523*b2055c35SXin Li uint8_t* dst_y = picture->y;
524*b2055c35SXin Li uint8_t* dst_u = picture->u;
525*b2055c35SXin Li uint8_t* dst_v = picture->v;
526*b2055c35SXin Li uint8_t* dst_a = picture->a;
527*b2055c35SXin Li
528*b2055c35SXin Li VP8Random base_rg;
529*b2055c35SXin Li VP8Random* rg = NULL;
530*b2055c35SXin Li if (dithering > 0.) {
531*b2055c35SXin Li VP8InitRandom(&base_rg, dithering);
532*b2055c35SXin Li rg = &base_rg;
533*b2055c35SXin Li use_dsp = 0; // can't use dsp in this case
534*b2055c35SXin Li }
535*b2055c35SXin Li WebPInitConvertARGBToYUV();
536*b2055c35SXin Li InitGammaTables();
537*b2055c35SXin Li
538*b2055c35SXin Li if (tmp_rgb == NULL) {
539*b2055c35SXin Li return WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY);
540*b2055c35SXin Li }
541*b2055c35SXin Li
542*b2055c35SXin Li // Downsample Y/U/V planes, two rows at a time
543*b2055c35SXin Li for (y = 0; y < (height >> 1); ++y) {
544*b2055c35SXin Li int rows_have_alpha = has_alpha;
545*b2055c35SXin Li if (use_dsp) {
546*b2055c35SXin Li if (is_rgb) {
547*b2055c35SXin Li WebPConvertRGB24ToY(r_ptr, dst_y, width);
548*b2055c35SXin Li WebPConvertRGB24ToY(r_ptr + rgb_stride,
549*b2055c35SXin Li dst_y + picture->y_stride, width);
550*b2055c35SXin Li } else {
551*b2055c35SXin Li WebPConvertBGR24ToY(b_ptr, dst_y, width);
552*b2055c35SXin Li WebPConvertBGR24ToY(b_ptr + rgb_stride,
553*b2055c35SXin Li dst_y + picture->y_stride, width);
554*b2055c35SXin Li }
555*b2055c35SXin Li } else {
556*b2055c35SXin Li ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg);
557*b2055c35SXin Li ConvertRowToY(r_ptr + rgb_stride,
558*b2055c35SXin Li g_ptr + rgb_stride,
559*b2055c35SXin Li b_ptr + rgb_stride, step,
560*b2055c35SXin Li dst_y + picture->y_stride, width, rg);
561*b2055c35SXin Li }
562*b2055c35SXin Li dst_y += 2 * picture->y_stride;
563*b2055c35SXin Li if (has_alpha) {
564*b2055c35SXin Li rows_have_alpha &= !WebPExtractAlpha(a_ptr, rgb_stride, width, 2,
565*b2055c35SXin Li dst_a, picture->a_stride);
566*b2055c35SXin Li dst_a += 2 * picture->a_stride;
567*b2055c35SXin Li }
568*b2055c35SXin Li // Collect averaged R/G/B(/A)
569*b2055c35SXin Li if (!rows_have_alpha) {
570*b2055c35SXin Li AccumulateRGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, tmp_rgb, width);
571*b2055c35SXin Li } else {
572*b2055c35SXin Li AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, rgb_stride, tmp_rgb, width);
573*b2055c35SXin Li }
574*b2055c35SXin Li // Convert to U/V
575*b2055c35SXin Li if (rg == NULL) {
576*b2055c35SXin Li WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width);
577*b2055c35SXin Li } else {
578*b2055c35SXin Li ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg);
579*b2055c35SXin Li }
580*b2055c35SXin Li dst_u += picture->uv_stride;
581*b2055c35SXin Li dst_v += picture->uv_stride;
582*b2055c35SXin Li r_ptr += 2 * rgb_stride;
583*b2055c35SXin Li b_ptr += 2 * rgb_stride;
584*b2055c35SXin Li g_ptr += 2 * rgb_stride;
585*b2055c35SXin Li if (has_alpha) a_ptr += 2 * rgb_stride;
586*b2055c35SXin Li }
587*b2055c35SXin Li if (height & 1) { // extra last row
588*b2055c35SXin Li int row_has_alpha = has_alpha;
589*b2055c35SXin Li if (use_dsp) {
590*b2055c35SXin Li if (r_ptr < b_ptr) {
591*b2055c35SXin Li WebPConvertRGB24ToY(r_ptr, dst_y, width);
592*b2055c35SXin Li } else {
593*b2055c35SXin Li WebPConvertBGR24ToY(b_ptr, dst_y, width);
594*b2055c35SXin Li }
595*b2055c35SXin Li } else {
596*b2055c35SXin Li ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg);
597*b2055c35SXin Li }
598*b2055c35SXin Li if (row_has_alpha) {
599*b2055c35SXin Li row_has_alpha &= !WebPExtractAlpha(a_ptr, 0, width, 1, dst_a, 0);
600*b2055c35SXin Li }
601*b2055c35SXin Li // Collect averaged R/G/B(/A)
602*b2055c35SXin Li if (!row_has_alpha) {
603*b2055c35SXin Li // Collect averaged R/G/B
604*b2055c35SXin Li AccumulateRGB(r_ptr, g_ptr, b_ptr, step, /* rgb_stride = */ 0,
605*b2055c35SXin Li tmp_rgb, width);
606*b2055c35SXin Li } else {
607*b2055c35SXin Li AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, /* rgb_stride = */ 0,
608*b2055c35SXin Li tmp_rgb, width);
609*b2055c35SXin Li }
610*b2055c35SXin Li if (rg == NULL) {
611*b2055c35SXin Li WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width);
612*b2055c35SXin Li } else {
613*b2055c35SXin Li ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg);
614*b2055c35SXin Li }
615*b2055c35SXin Li }
616*b2055c35SXin Li WebPSafeFree(tmp_rgb);
617*b2055c35SXin Li }
618*b2055c35SXin Li return 1;
619*b2055c35SXin Li }
620*b2055c35SXin Li
621*b2055c35SXin Li #undef SUM4
622*b2055c35SXin Li #undef SUM2
623*b2055c35SXin Li #undef SUM4ALPHA
624*b2055c35SXin Li #undef SUM2ALPHA
625*b2055c35SXin Li
//------------------------------------------------------------------------------
// call for ARGB->YUVA conversion
628*b2055c35SXin Li
// Converts the samples stored in picture->argb to YUV(A) 4:2:0 by handing the
// four interleaved channel pointers (pixel step of 4 bytes, row stride of
// 4 * picture->argb_stride bytes) to ImportYUVAFromRGBA().
//   colorspace: only the bits selected by WEBP_CSP_UV_MASK are inspected; they
//               must be equal to WEBP_YUV420.
//   dithering, use_iterative_conversion: forwarded unchanged.
// Returns 0 if 'picture' is NULL. Reports VP8_ENC_ERROR_NULL_PARAMETER through
// WebPEncodingSetError() if picture->argb is NULL, and
// VP8_ENC_ERROR_INVALID_CONFIGURATION if the colorspace is not 4:2:0.
// Otherwise returns the result of ImportYUVAFromRGBA().
static int PictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace,
                             float dithering, int use_iterative_conversion) {
  if (picture == NULL) return 0;
  if (picture->argb == NULL) {
    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
  } else if ((colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) {
    return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION);
  } else {
    // CHANNEL_OFFSET() maps a logical channel index (0=A, 1=R, 2=G, 3=B) to
    // its byte position inside a uint32_t ARGB sample for the host endianness.
    const uint8_t* const argb = (const uint8_t*)picture->argb;
    const uint8_t* const a = argb + CHANNEL_OFFSET(0);
    const uint8_t* const r = argb + CHANNEL_OFFSET(1);
    const uint8_t* const g = argb + CHANNEL_OFFSET(2);
    const uint8_t* const b = argb + CHANNEL_OFFSET(3);

    picture->colorspace = WEBP_YUV420;
    return ImportYUVAFromRGBA(r, g, b, a, 4, 4 * picture->argb_stride,
                              dithering, use_iterative_conversion, picture);
  }
}
648*b2055c35SXin Li
// Public entry point: ARGB -> YUV(A) conversion with the given 'dithering'
// strength and the iterative conversion disabled. Returns the result of
// PictureARGBToYUVA().
int WebPPictureARGBToYUVADithered(WebPPicture* picture, WebPEncCSP colorspace,
                                  float dithering) {
  return PictureARGBToYUVA(picture, colorspace, dithering, 0);
}
653*b2055c35SXin Li
// Public entry point: ARGB -> YUV(A) conversion with no dithering (0.f) and
// the iterative conversion disabled. Returns the result of
// PictureARGBToYUVA().
int WebPPictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace) {
  return PictureARGBToYUVA(picture, colorspace, 0.f, 0);
}
657*b2055c35SXin Li
// Public entry point: ARGB -> YUV(A) conversion targeting WEBP_YUV420 with no
// dithering and the iterative conversion enabled
// (use_iterative_conversion = 1). Returns the result of PictureARGBToYUVA().
int WebPPictureSharpARGBToYUVA(WebPPicture* picture) {
  return PictureARGBToYUVA(picture, WEBP_YUV420, 0.f, 1);
}
661*b2055c35SXin Li // for backward compatibility
WebPPictureSmartARGBToYUVA(WebPPicture * picture)662*b2055c35SXin Li int WebPPictureSmartARGBToYUVA(WebPPicture* picture) {
663*b2055c35SXin Li return WebPPictureSharpARGBToYUVA(picture);
664*b2055c35SXin Li }
665*b2055c35SXin Li
//------------------------------------------------------------------------------
// call for YUVA -> ARGB conversion
668*b2055c35SXin Li
// Converts the Y/U/V(/A) planes of 'picture' into a freshly allocated ARGB
// buffer and switches the picture to ARGB mode (picture->use_argb = 1).
// Returns 0 if 'picture' is NULL or if WebPPictureAllocARGB() fails.
// Reports VP8_ENC_ERROR_NULL_PARAMETER through WebPEncodingSetError() if any
// of the y/u/v planes is NULL, or if the colorspace has WEBP_CSP_ALPHA_BIT set
// while picture->a is NULL, and VP8_ENC_ERROR_INVALID_CONFIGURATION if the
// colorspace is not 4:2:0. Returns 1 on success.
int WebPPictureYUVAToARGB(WebPPicture* picture) {
  if (picture == NULL) return 0;
  if (picture->y == NULL || picture->u == NULL || picture->v == NULL) {
    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
  }
  if ((picture->colorspace & WEBP_CSP_ALPHA_BIT) && picture->a == NULL) {
    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
  }
  if ((picture->colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) {
    return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION);
  }
  // Allocate a new argb buffer (discarding the previous one).
  if (!WebPPictureAllocARGB(picture)) return 0;
  picture->use_argb = 1;

  // Convert
  {
    int y;
    const int width = picture->width;
    const int height = picture->height;
    // picture->argb_stride counts uint32_t samples; 'dst' is walked in bytes.
    const int argb_stride = 4 * picture->argb_stride;
    uint8_t* dst = (uint8_t*)picture->argb;
    const uint8_t* cur_u = picture->u, *cur_v = picture->v, *cur_y = picture->y;
    WebPUpsampleLinePairFunc upsample =
        WebPGetLinePairConverter(ALPHA_OFFSET > 0);

    // First row, with replicated top samples.
    upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width);
    cur_y += picture->y_stride;
    dst += argb_stride;
    // Center rows: each iteration emits two luma rows, using the previous
    // chroma row as 'top' and the next chroma row as 'current'.
    for (y = 1; y + 1 < height; y += 2) {
      const uint8_t* const top_u = cur_u;
      const uint8_t* const top_v = cur_v;
      cur_u += picture->uv_stride;
      cur_v += picture->uv_stride;
      upsample(cur_y, cur_y + picture->y_stride, top_u, top_v, cur_u, cur_v,
               dst, dst + argb_stride, width);
      cur_y += 2 * picture->y_stride;
      dst += 2 * argb_stride;
    }
    // Last row (if needed), with replicated bottom samples.
    if (height > 1 && !(height & 1)) {
      upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width);
    }
    // Insert alpha values if needed, in replacement for the default 0xff ones.
    if (picture->colorspace & WEBP_CSP_ALPHA_BIT) {
      for (y = 0; y < height; ++y) {
        uint32_t* const argb_dst = picture->argb + y * picture->argb_stride;
        const uint8_t* const src = picture->a + y * picture->a_stride;
        int x;
        for (x = 0; x < width; ++x) {
          // Keep the 24 color bits, overwrite the top 8 bits with alpha.
          argb_dst[x] = (argb_dst[x] & 0x00ffffffu) | ((uint32_t)src[x] << 24);
        }
      }
    }
  }
  return 1;
}
728*b2055c35SXin Li
//------------------------------------------------------------------------------
// automatic import / conversion
731*b2055c35SXin Li
// Imports interleaved 8-bit samples from 'rgb' into 'picture'.
//   rgb_stride:   distance in bytes between two consecutive rows. Only its
//                 magnitude is validated.
//   step:         distance in bytes between two consecutive pixels
//                 (callers in this file pass 3 or 4).
//   swap_rb:      non-zero if the input byte order is b,g,r(,a) instead of
//                 r,g,b(,a).
//   import_alpha: non-zero if the 4th byte of each pixel is to be imported as
//                 alpha (requires step == 4).
// If picture->use_argb is zero, the samples are handed to
// ImportYUVAFromRGBA() (no dithering, no iterative conversion) and its result
// is returned. Otherwise the picture is (re)allocated with WebPPictureAlloc()
// and picture->argb is filled row by row.
// Returns 0 if 'rgb_stride' is too small for one row of pixels or if the
// allocation fails, 1 on success.
static int Import(WebPPicture* const picture,
                  const uint8_t* rgb, int rgb_stride,
                  int step, int swap_rb, int import_alpha) {
  int y;
  // swap_rb -> b,g,r,a , !swap_rb -> r,g,b,a
  const uint8_t* r_ptr = rgb + (swap_rb ? 2 : 0);
  const uint8_t* g_ptr = rgb + 1;
  const uint8_t* b_ptr = rgb + (swap_rb ? 0 : 2);
  const int width = picture->width;
  const int height = picture->height;
  // Number of bytes actually read from one row: 'width - 1' whole pixel steps
  // plus the channels consumed from the last pixel. Using 'step' here (rather
  // than 3 bytes per pixel) matters for the RGBX/BGRX case, where step is 4
  // although only three channels are imported.
  const int min_stride = (width - 1) * step + (import_alpha ? 4 : 3);

  if (abs(rgb_stride) < min_stride) return 0;

  if (!picture->use_argb) {
    const uint8_t* a_ptr = import_alpha ? rgb + 3 : NULL;
    return ImportYUVAFromRGBA(r_ptr, g_ptr, b_ptr, a_ptr, step, rgb_stride,
                              0.f /* no dithering */, 0, picture);
  }
  if (!WebPPictureAlloc(picture)) return 0;

  VP8LDspInit();
  WebPInitAlphaProcessing();

  if (import_alpha) {
    // dst[] byte order is {a,r,g,b} for big-endian, {b,g,r,a} for little endian
    uint32_t* dst = picture->argb;
    // When the input byte order already matches dst[], rows can be copied
    // verbatim.
    const int do_copy = (ALPHA_OFFSET == 3) && swap_rb;
    assert(step == 4);
    if (do_copy) {
      for (y = 0; y < height; ++y) {
        memcpy(dst, rgb, width * 4);
        rgb += rgb_stride;
        dst += picture->argb_stride;
      }
    } else {
      for (y = 0; y < height; ++y) {
#ifdef WORDS_BIGENDIAN
        // BGRA or RGBA input order.
        const uint8_t* a_ptr = rgb + 3;
        WebPPackARGB(a_ptr, r_ptr, g_ptr, b_ptr, width, dst);
        r_ptr += rgb_stride;
        g_ptr += rgb_stride;
        b_ptr += rgb_stride;
#else
        // RGBA input order. Need to swap R and B.
        VP8LConvertBGRAToRGBA((const uint32_t*)rgb, width, (uint8_t*)dst);
#endif
        rgb += rgb_stride;
        dst += picture->argb_stride;
      }
    }
  } else {
    uint32_t* dst = picture->argb;
    assert(step >= 3);
    for (y = 0; y < height; ++y) {
      WebPPackRGB(r_ptr, g_ptr, b_ptr, width, step, dst);
      r_ptr += rgb_stride;
      g_ptr += rgb_stride;
      b_ptr += rgb_stride;
      dst += picture->argb_stride;
    }
  }
  return 1;
}
796*b2055c35SXin Li
// Public API
798*b2055c35SXin Li
799*b2055c35SXin Li #if !defined(WEBP_REDUCE_CSP)
800*b2055c35SXin Li
// Imports packed 3-byte B,G,R samples (step 3, R/B swapped, no alpha) into
// 'picture'. Returns 0 if 'picture' or 'bgr' is NULL, otherwise the result of
// Import().
int WebPPictureImportBGR(WebPPicture* picture,
                         const uint8_t* bgr, int bgr_stride) {
  return (picture != NULL && bgr != NULL)
             ? Import(picture, bgr, bgr_stride, 3, 1, 0)
             : 0;
}
807*b2055c35SXin Li
// Imports 4-byte B,G,R,A samples (step 4, R/B swapped, alpha imported) into
// 'picture'. Returns 0 if 'picture' or 'bgra' is NULL, otherwise the result of
// Import().
int WebPPictureImportBGRA(WebPPicture* picture,
                          const uint8_t* bgra, int bgra_stride) {
  return (picture != NULL && bgra != NULL)
             ? Import(picture, bgra, bgra_stride, 4, 1, 1)
             : 0;
}
814*b2055c35SXin Li
815*b2055c35SXin Li
// Imports 4-byte B,G,R,X samples (step 4, R/B swapped, 4th byte not imported)
// into 'picture'. Returns 0 if 'picture' or 'bgrx' is NULL, otherwise the
// result of Import().
int WebPPictureImportBGRX(WebPPicture* picture,
                          const uint8_t* bgrx, int bgrx_stride) {
  return (picture != NULL && bgrx != NULL)
             ? Import(picture, bgrx, bgrx_stride, 4, 1, 0)
             : 0;
}
822*b2055c35SXin Li
823*b2055c35SXin Li #endif // WEBP_REDUCE_CSP
824*b2055c35SXin Li
// Imports packed 3-byte R,G,B samples (step 3, no R/B swap, no alpha) into
// 'picture'. Returns 0 if 'picture' or 'rgb' is NULL, otherwise the result of
// Import().
int WebPPictureImportRGB(WebPPicture* picture,
                         const uint8_t* rgb, int rgb_stride) {
  return (picture != NULL && rgb != NULL)
             ? Import(picture, rgb, rgb_stride, 3, 0, 0)
             : 0;
}
831*b2055c35SXin Li
// Imports 4-byte R,G,B,A samples (step 4, no R/B swap, alpha imported) into
// 'picture'. Returns 0 if 'picture' or 'rgba' is NULL, otherwise the result of
// Import().
int WebPPictureImportRGBA(WebPPicture* picture,
                          const uint8_t* rgba, int rgba_stride) {
  return (picture != NULL && rgba != NULL)
             ? Import(picture, rgba, rgba_stride, 4, 0, 1)
             : 0;
}
838*b2055c35SXin Li
// Imports 4-byte R,G,B,X samples (step 4, no R/B swap, 4th byte not imported)
// into 'picture'. Returns 0 if 'picture' or 'rgbx' is NULL, otherwise the
// result of Import().
int WebPPictureImportRGBX(WebPPicture* picture,
                          const uint8_t* rgbx, int rgbx_stride) {
  return (picture != NULL && rgbx != NULL)
             ? Import(picture, rgbx, rgbx_stride, 4, 0, 0)
             : 0;
}
845*b2055c35SXin Li
//------------------------------------------------------------------------------
847