picture_csp_enc.c source code [engine/third_party/libwebp/src/enc/picture_csp_enc.c]

1	// Copyright 2014 Google Inc. All Rights Reserved.
2	//
3	// Use of this source code is governed by a BSD-style license
4	// that can be found in the COPYING file in the root of the source
5	// tree. An additional intellectual property rights grant can be found
6	// in the file PATENTS. All contributing project authors may
7	// be found in the AUTHORS file in the root of the source tree.
8	// -----------------------------------------------------------------------------
9	//
10	// WebPPicture utils for colorspace conversion
11	//
12	// Author: Skal (pascal.massimino@gmail.com)
13
14	#include <assert.h>
15	#include <stdlib.h>
16	#include <math.h>
17
18	#include "./vp8i_enc.h"
19	#include "../utils/random_utils.h"
20	#include "../utils/utils.h"
21	#include "../dsp/yuv.h"
22
// Comment out the following define to disable gamma-compression during
// RGB->U/V averaging.
24	#define USE_GAMMA_COMPRESSION
25
26	// If defined, use table to compute x / alpha.
27	#define USE_INVERSE_ALPHA_TABLE
28
// Endianness probe: the 32-bit constant 0xff000000 is overlaid with a 4-byte
// array so the in-memory position of its top (alpha) byte can be inspected.
static const union {
  uint32_t argb;
  uint8_t bytes[4];
} test_endian = { 0xff000000u };
// Non-zero when the alpha byte of a uint32_t ARGB value is stored last in
// memory (i.e. at byte offset 3).
#define ALPHA_IS_LAST (test_endian.bytes[3] == 0xff)
34
35	//------------------------------------------------------------------------------
36	// Detection of non-trivial transparency
37
// Returns true if alpha[] has non-0xff values.
//   alpha:  first alpha sample, or NULL (then 0 is returned).
//   width:  number of samples inspected per row.
//   height: number of rows inspected.
//   x_step: distance, in bytes, between two consecutive samples of a row.
//   y_step: distance, in bytes, between the starts of two consecutive rows.
static int CheckNonOpaque(const uint8_t* alpha, int width, int height,
                          int x_step, int y_step) {
  int x, y;
  if (alpha == NULL) return 0;
  for (y = 0; y < height; ++y) {
    for (x = 0; x < width * x_step; x += x_step) {
      if (alpha[x] != 0xff) return 1;  // TODO(skal): check 4/8 bytes at a time.
    }
    alpha += y_step;
  }
  return 0;
}
51
52	// Checking for the presence of non-opaque alpha.
53	int WebPPictureHasTransparency(const WebPPicture* picture) {
54	if (picture == NULL) return `0`;
55	if (!picture->use_argb) {
56	return CheckNonOpaque(picture->a, picture->width, picture->height,
57	`1`, picture->a_stride);
58	} else {
59	int x, y;
60	const uint32_t* argb = picture->argb;
61	if (argb == NULL) return `0`;
62	for (y = `0`; y < picture->height; ++y) {
63	for (x = `0`; x < picture->width; ++x) {
64	if (argb[x] < `0xff000000u`) return `1`; // test any alpha values != 0xff
65	}
66	argb += picture->argb_stride;
67	}
68	}
69	return `0`;
70	}
71
72	//------------------------------------------------------------------------------
73	// Code for gamma correction
74
75	#if defined(USE_GAMMA_COMPRESSION)
76
// gamma-compensates loss of resolution during chroma subsampling
#define kGamma 0.80      // for now we use a different gamma value than kGammaF
#define kGammaFix 12     // fixed-point precision for linear values
#define kGammaScale ((1 << kGammaFix) - 1)
#define kGammaTabFix 7   // fixed-point fractional bits precision
#define kGammaTabScale (1 << kGammaTabFix)
#define kGammaTabRounder (kGammaTabScale >> 1)
#define kGammaTabSize (1 << (kGammaFix - kGammaTabFix))

// Lookup tables filled by InitGammaTables(); kGammaTablesOk is set to 1 once
// they have been populated.
static int kLinearToGammaTab[kGammaTabSize + 1];
static uint16_t kGammaToLinearTab[256];
static volatile int kGammaTablesOk = 0;
89
90	static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) {
91	if (!kGammaTablesOk) {
92	int v;
93	const double scale = (double)(`1` << kGammaTabFix) / kGammaScale;
94	const double norm = `1.` / `255.`;
95	for (v = `0`; v <= `255`; ++v) {
96	kGammaToLinearTab[v] =
97	(uint16_t)(pow(norm * v, kGamma) * kGammaScale + `.5`);
98	}
99	for (v = `0`; v <= kGammaTabSize; ++v) {
100	kLinearToGammaTab[v] = (int)(`255.` * pow(scale * v, `1.` / kGamma) + `.5`);
101	}
102	kGammaTablesOk = `1`;
103	}
104	}
105
106	static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) {
107	return kGammaToLinearTab[v];
108	}
109
110	static WEBP_INLINE int Interpolate(int v) {
111	const int tab_pos = v >> (kGammaTabFix + `2`); // integer part
112	const int x = v & ((kGammaTabScale << `2`) - `1`); // fractional part
113	const int v0 = kLinearToGammaTab[tab_pos];
114	const int v1 = kLinearToGammaTab[tab_pos + `1`];
115	const int y = v1 * x + v0 * ((kGammaTabScale << `2`) - x); // interpolate
116	assert(tab_pos + `1` < kGammaTabSize + `1`);
117	return y;
118	}
119
120	// Convert a linear value 'v' to YUV_FIX+2 fixed-point precision
121	// U/V value, suitable for RGBToU/V calls.
122	static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) {
123	const int y = Interpolate(base_value << shift); // final uplifted value
124	return (y + kGammaTabRounder) >> kGammaTabFix; // descale
125	}
126
127	#else
128
129	static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) {}
130	static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { return v; }
131	static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) {
132	return (int)(base_value << shift);
133	}
134
135	#endif // USE_GAMMA_COMPRESSION
136
137	//------------------------------------------------------------------------------
138	// RGB -> YUV conversion
139
140	static int RGBToY(int r, int g, int b, VP8Random* const rg) {
141	return (rg == NULL) ? VP8RGBToY(r, g, b, YUV_HALF)
142	: VP8RGBToY(r, g, b, VP8RandomBits(rg, YUV_FIX));
143	}
144
145	static int RGBToU(int r, int g, int b, VP8Random* const rg) {
146	return (rg == NULL) ? VP8RGBToU(r, g, b, YUV_HALF << `2`)
147	: VP8RGBToU(r, g, b, VP8RandomBits(rg, YUV_FIX + `2`));
148	}
149
150	static int RGBToV(int r, int g, int b, VP8Random* const rg) {
151	return (rg == NULL) ? VP8RGBToV(r, g, b, YUV_HALF << `2`)
152	: VP8RGBToV(r, g, b, VP8RandomBits(rg, YUV_FIX + `2`));
153	}
154
155	//------------------------------------------------------------------------------
156	// Sharp RGB->YUV conversion
157
// Maximum number of refinement passes, and minimum picture dimension for
// which the iterative conversion is used.
static const int kNumIterations = 4;
static const int kMinDimensionIterativeConversion = 4;

// We could use SFIX=0 and only uint8_t for fixed_y_t, but it produces some
// banding sometimes. Better use extra precision.
#define SFIX 2                // fixed-point precision of RGB and Y/W
typedef int16_t fixed_t;      // signed type with extra SFIX precision for UV
typedef uint16_t fixed_y_t;   // unsigned type with extra SFIX precision for W

#define SHALF (1 << SFIX >> 1)                 // half a unit at SFIX precision
#define MAX_Y_T ((256 << SFIX) - 1)            // largest fixed_y_t sample value
#define SROUNDER (1 << (YUV_FIX + SFIX - 1))   // rounder for the final descale
170
171	#if defined(USE_GAMMA_COMPRESSION)
172
173	// float variant of gamma-correction
174	// We use tables of different size and precision for the Rec709
175	// transfer function.
176	#define kGammaF (1./0.45)
177	static float kGammaToLinearTabF[MAX_Y_T + `1`]; // size scales with Y_FIX
178	static float kLinearToGammaTabF[kGammaTabSize + `2`];
179	static volatile int kGammaTablesFOk = `0`;
180
181	static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) {
182	if (!kGammaTablesFOk) {
183	int v;
184	const double norm = `1.` / MAX_Y_T;
185	const double scale = `1.` / kGammaTabSize;
186	const double a = `0.099`;
187	const double thresh = `0.018`;
188	for (v = `0`; v <= MAX_Y_T; ++v) {
189	const double g = norm * v;
190	if (g <= thresh * `4.5`) {
191	kGammaToLinearTabF[v] = (float)(g / `4.5`);
192	} else {
193	const double a_rec = `1.` / (`1.` + a);
194	kGammaToLinearTabF[v] = (float)pow(a_rec * (g + a), kGammaF);
195	}
196	}
197	for (v = `0`; v <= kGammaTabSize; ++v) {
198	const double g = scale * v;
199	double value;
200	if (g <= thresh) {
201	value = `4.5` * g;
202	} else {
203	value = (`1.` + a) * pow(g, `1.` / kGammaF) - a;
204	}
205	kLinearToGammaTabF[v] = (float)(MAX_Y_T * value);
206	}
207	// to prevent small rounding errors to cause read-overflow:
208	kLinearToGammaTabF[kGammaTabSize + `1`] = kLinearToGammaTabF[kGammaTabSize];
209	kGammaTablesFOk = `1`;
210	}
211	}
212
213	static WEBP_INLINE float GammaToLinearF(int v) {
214	return kGammaToLinearTabF[v];
215	}
216
217	static WEBP_INLINE int LinearToGammaF(float value) {
218	const float v = value * kGammaTabSize;
219	const int tab_pos = (int)v;
220	const float x = v - (float)tab_pos; // fractional part
221	const float v0 = kLinearToGammaTabF[tab_pos + `0`];
222	const float v1 = kLinearToGammaTabF[tab_pos + `1`];
223	const float y = v1 * x + v0 * (`1.f` - x); // interpolate
224	return (int)(y + `.5`);
225	}
226
227	#else
228
229	static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) {}
230	static WEBP_INLINE float GammaToLinearF(int v) {
231	const float norm = `1.f` / MAX_Y_T;
232	return norm * v;
233	}
234	static WEBP_INLINE int LinearToGammaF(float value) {
235	return (int)(MAX_Y_T * value + `.5`);
236	}
237
238	#endif // USE_GAMMA_COMPRESSION
239
240	//------------------------------------------------------------------------------
241
242	static uint8_t clip_8b(fixed_t v) {
243	return (!(v & ~`0xff`)) ? (uint8_t)v : (v < `0`) ? `0u` : `255u`;
244	}
245
246	static fixed_y_t clip_y(int y) {
247	return (!(y & ~MAX_Y_T)) ? (fixed_y_t)y : (y < `0`) ? `0` : MAX_Y_T;
248	}
249
250	//------------------------------------------------------------------------------
251
252	static int RGBToGray(int r, int g, int b) {
253	const int luma = `13933` * r + `46871` * g + `4732` * b + YUV_HALF;
254	return (luma >> YUV_FIX);
255	}
256
// Float weighted sum of r/g/b; the three weights add up to 1.
static float RGBToGrayF(float r, float g, float b) {
  return (float)(0.2126 * r + 0.7152 * g + 0.0722 * b);
}
260
// Averages four gamma-encoded samples in linear space and returns the
// gamma-encoded result.
static int ScaleDown(int a, int b, int c, int d) {
  const float A = GammaToLinearF(a);
  const float B = GammaToLinearF(b);
  const float C = GammaToLinearF(c);
  const float D = GammaToLinearF(d);
  return LinearToGammaF(0.25f * (A + B + C + D));
}
268
269	static WEBP_INLINE void UpdateW(const fixed_y_t* src, fixed_y_t* dst, int w) {
270	int i;
271	for (i = `0`; i < w; ++i) {
272	const float R = GammaToLinearF(src[`0` * w + i]);
273	const float G = GammaToLinearF(src[`1` * w + i]);
274	const float B = GammaToLinearF(src[`2` * w + i]);
275	const float Y = RGBToGrayF(R, G, B);
276	dst[i] = (fixed_y_t)LinearToGammaF(Y);
277	}
278	}
279
280	static void UpdateChroma(const fixed_y_t* src1, const fixed_y_t* src2,
281	fixed_t* dst, int uv_w) {
282	int i;
283	for (i = `0`; i < uv_w; ++i) {
284	const int r = ScaleDown(src1[`0` * uv_w + `0`], src1[`0` * uv_w + `1`],
285	src2[`0` * uv_w + `0`], src2[`0` * uv_w + `1`]);
286	const int g = ScaleDown(src1[`2` * uv_w + `0`], src1[`2` * uv_w + `1`],
287	src2[`2` * uv_w + `0`], src2[`2` * uv_w + `1`]);
288	const int b = ScaleDown(src1[`4` * uv_w + `0`], src1[`4` * uv_w + `1`],
289	src2[`4` * uv_w + `0`], src2[`4` * uv_w + `1`]);
290	const int W = RGBToGray(r, g, b);
291	dst[`0` * uv_w] = (fixed_t)(r - W);
292	dst[`1` * uv_w] = (fixed_t)(g - W);
293	dst[`2` * uv_w] = (fixed_t)(b - W);
294	dst += `1`;
295	src1 += `2`;
296	src2 += `2`;
297	}
298	}
299
300	static void StoreGray(const fixed_y_t* rgb, fixed_y_t* y, int w) {
301	int i;
302	for (i = `0`; i < w; ++i) {
303	y[i] = RGBToGray(rgb[`0` * w + i], rgb[`1` * w + i], rgb[`2` * w + i]);
304	}
305	}
306
307	//------------------------------------------------------------------------------
308
309	static WEBP_INLINE fixed_y_t Filter2(int A, int B, int W0) {
310	const int v0 = (A * `3` + B + `2`) >> `2`;
311	return clip_y(v0 + W0);
312	}
313
314	//------------------------------------------------------------------------------
315
316	static WEBP_INLINE fixed_y_t UpLift(uint8_t a) { // 8bit -> SFIX
317	return ((fixed_y_t)a << SFIX) \| SHALF;
318	}
319
320	static void ImportOneRow(const uint8_t* const r_ptr,
321	const uint8_t* const g_ptr,
322	const uint8_t* const b_ptr,
323	int step,
324	int pic_width,
325	fixed_y_t* const dst) {
326	int i;
327	const int w = (pic_width + `1`) & ~`1`;
328	for (i = `0`; i < pic_width; ++i) {
329	const int off = i * step;
330	dst[i + `0` * w] = UpLift(r_ptr[off]);
331	dst[i + `1` * w] = UpLift(g_ptr[off]);
332	dst[i + `2` * w] = UpLift(b_ptr[off]);
333	}
334	if (pic_width & `1`) { // replicate rightmost pixel
335	dst[pic_width + `0` * w] = dst[pic_width + `0` * w - `1`];
336	dst[pic_width + `1` * w] = dst[pic_width + `1` * w - `1`];
337	dst[pic_width + `2` * w] = dst[pic_width + `2` * w - `1`];
338	}
339	}
340
341	static void InterpolateTwoRows(const fixed_y_t* const best_y,
342	const fixed_t* prev_uv,
343	const fixed_t* cur_uv,
344	const fixed_t* next_uv,
345	int w,
346	fixed_y_t* out1,
347	fixed_y_t* out2) {
348	const int uv_w = w >> `1`;
349	const int len = (w - `1`) >> `1`; // length to filter
350	int k = `3`;
351	while (k-- > `0`) { // process each R/G/B segments in turn
352	// special boundary case for i==0
353	out1[`0`] = Filter2(cur_uv[`0`], prev_uv[`0`], best_y[`0`]);
354	out2[`0`] = Filter2(cur_uv[`0`], next_uv[`0`], best_y[w]);
355
356	WebPSharpYUVFilterRow(cur_uv, prev_uv, len, best_y + `0` + `1`, out1 + `1`);
357	WebPSharpYUVFilterRow(cur_uv, next_uv, len, best_y + w + `1`, out2 + `1`);
358
359	// special boundary case for i == w - 1 when w is even
360	if (!(w & `1`)) {
361	out1[w - `1`] = Filter2(cur_uv[uv_w - `1`], prev_uv[uv_w - `1`],
362	best_y[w - `1` + `0`]);
363	out2[w - `1`] = Filter2(cur_uv[uv_w - `1`], next_uv[uv_w - `1`],
364	best_y[w - `1` + w]);
365	}
366	out1 += w;
367	out2 += w;
368	prev_uv += uv_w;
369	cur_uv += uv_w;
370	next_uv += uv_w;
371	}
372	}
373
374	static WEBP_INLINE uint8_t ConvertRGBToY(int r, int g, int b) {
375	const int luma = `16839` * r + `33059` * g + `6420` * b + SROUNDER;
376	return clip_8b(`16` + (luma >> (YUV_FIX + SFIX)));
377	}
378
379	static WEBP_INLINE uint8_t ConvertRGBToU(int r, int g, int b) {
380	const int u = -`9719` * r - `19081` * g + `28800` * b + SROUNDER;
381	return clip_8b(`128` + (u >> (YUV_FIX + SFIX)));
382	}
383
384	static WEBP_INLINE uint8_t ConvertRGBToV(int r, int g, int b) {
385	const int v = +`28800` * r - `24116` * g - `4684` * b + SROUNDER;
386	return clip_8b(`128` + (v >> (YUV_FIX + SFIX)));
387	}
388
389	static int ConvertWRGBToYUV(const fixed_y_t* best_y, const fixed_t* best_uv,
390	WebPPicture* const picture) {
391	int i, j;
392	uint8_t* dst_y = picture->y;
393	uint8_t* dst_u = picture->u;
394	uint8_t* dst_v = picture->v;
395	const fixed_t* const best_uv_base = best_uv;
396	const int w = (picture->width + `1`) & ~`1`;
397	const int h = (picture->height + `1`) & ~`1`;
398	const int uv_w = w >> `1`;
399	const int uv_h = h >> `1`;
400	for (best_uv = best_uv_base, j = `0`; j < picture->height; ++j) {
401	for (i = `0`; i < picture->width; ++i) {
402	const int off = (i >> `1`);
403	const int W = best_y[i];
404	const int r = best_uv[off + `0` * uv_w] + W;
405	const int g = best_uv[off + `1` * uv_w] + W;
406	const int b = best_uv[off + `2` * uv_w] + W;
407	dst_y[i] = ConvertRGBToY(r, g, b);
408	}
409	best_y += w;
410	best_uv += (j & `1`) * `3` * uv_w;
411	dst_y += picture->y_stride;
412	}
413	for (best_uv = best_uv_base, j = `0`; j < uv_h; ++j) {
414	for (i = `0`; i < uv_w; ++i) {
415	const int off = i;
416	const int r = best_uv[off + `0` * uv_w];
417	const int g = best_uv[off + `1` * uv_w];
418	const int b = best_uv[off + `2` * uv_w];
419	dst_u[i] = ConvertRGBToU(r, g, b);
420	dst_v[i] = ConvertRGBToV(r, g, b);
421	}
422	best_uv += `3` * uv_w;
423	dst_u += picture->uv_stride;
424	dst_v += picture->uv_stride;
425	}
426	return `1`;
427	}
428
429	//------------------------------------------------------------------------------
430	// Main function
431
432	#define SAFE_ALLOC(W, H, T) ((T)WebPSafeMalloc((W) (H), sizeof(T)))
433
434	static int PreprocessARGB(const uint8_t* r_ptr,
435	const uint8_t* g_ptr,
436	const uint8_t* b_ptr,
437	int step, int rgb_stride,
438	WebPPicture* const picture) {
439	// we expand the right/bottom border if needed
440	const int w = (picture->width + `1`) & ~`1`;
441	const int h = (picture->height + `1`) & ~`1`;
442	const int uv_w = w >> `1`;
443	const int uv_h = h >> `1`;
444	uint64_t prev_diff_y_sum = ~`0`;
445	int j, iter;
446
447	// TODO(skal): allocate one big memory chunk. But for now, it's easier
448	// for valgrind debugging to have several chunks.
449	fixed_y_t* const tmp_buffer = SAFE_ALLOC(w * `3`, `2`, fixed_y_t); // scratch
450	fixed_y_t* const best_y_base = SAFE_ALLOC(w, h, fixed_y_t);
451	fixed_y_t* const target_y_base = SAFE_ALLOC(w, h, fixed_y_t);
452	fixed_y_t* const best_rgb_y = SAFE_ALLOC(w, `2`, fixed_y_t);
453	fixed_t* const best_uv_base = SAFE_ALLOC(uv_w * `3`, uv_h, fixed_t);
454	fixed_t* const target_uv_base = SAFE_ALLOC(uv_w * `3`, uv_h, fixed_t);
455	fixed_t* const best_rgb_uv = SAFE_ALLOC(uv_w * `3`, `1`, fixed_t);
456	fixed_y_t* best_y = best_y_base;
457	fixed_y_t* target_y = target_y_base;
458	fixed_t* best_uv = best_uv_base;
459	fixed_t* target_uv = target_uv_base;
460	const uint64_t diff_y_threshold = (uint64_t)(`3.0` * w * h);
461	int ok;
462
463	if (best_y_base == NULL \|\| best_uv_base == NULL \|\|
464	target_y_base == NULL \|\| target_uv_base == NULL \|\|
465	best_rgb_y == NULL \|\| best_rgb_uv == NULL \|\|
466	tmp_buffer == NULL) {
467	ok = WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY);
468	goto End;
469	}
470	assert(picture->width >= kMinDimensionIterativeConversion);
471	assert(picture->height >= kMinDimensionIterativeConversion);
472
473	WebPInitConvertARGBToYUV();
474
475	// Import RGB samples to W/RGB representation.
476	for (j = `0`; j < picture->height; j += `2`) {
477	const int is_last_row = (j == picture->height - `1`);
478	fixed_y_t* const src1 = tmp_buffer + `0` * w;
479	fixed_y_t* const src2 = tmp_buffer + `3` * w;
480
481	// prepare two rows of input
482	ImportOneRow(r_ptr, g_ptr, b_ptr, step, picture->width, src1);
483	if (!is_last_row) {
484	ImportOneRow(r_ptr + rgb_stride, g_ptr + rgb_stride, b_ptr + rgb_stride,
485	step, picture->width, src2);
486	} else {
487	memcpy(src2, src1, `3` * w * sizeof(*src2));
488	}
489	StoreGray(src1, best_y + `0`, w);
490	StoreGray(src2, best_y + w, w);
491
492	UpdateW(src1, target_y, w);
493	UpdateW(src2, target_y + w, w);
494	UpdateChroma(src1, src2, target_uv, uv_w);
495	memcpy(best_uv, target_uv, `3` * uv_w * sizeof(*best_uv));
496	best_y += `2` * w;
497	best_uv += `3` * uv_w;
498	target_y += `2` * w;
499	target_uv += `3` * uv_w;
500	r_ptr += `2` * rgb_stride;
501	g_ptr += `2` * rgb_stride;
502	b_ptr += `2` * rgb_stride;
503	}
504
505	// Iterate and resolve clipping conflicts.
506	for (iter = `0`; iter < kNumIterations; ++iter) {
507	const fixed_t* cur_uv = best_uv_base;
508	const fixed_t* prev_uv = best_uv_base;
509	uint64_t diff_y_sum = `0`;
510
511	best_y = best_y_base;
512	best_uv = best_uv_base;
513	target_y = target_y_base;
514	target_uv = target_uv_base;
515	for (j = `0`; j < h; j += `2`) {
516	fixed_y_t* const src1 = tmp_buffer + `0` * w;
517	fixed_y_t* const src2 = tmp_buffer + `3` * w;
518	{
519	const fixed_t* const next_uv = cur_uv + ((j < h - `2`) ? `3` * uv_w : `0`);
520	InterpolateTwoRows(best_y, prev_uv, cur_uv, next_uv, w, src1, src2);
521	prev_uv = cur_uv;
522	cur_uv = next_uv;
523	}
524
525	UpdateW(src1, best_rgb_y + `0` * w, w);
526	UpdateW(src2, best_rgb_y + `1` * w, w);
527	UpdateChroma(src1, src2, best_rgb_uv, uv_w);
528
529	// update two rows of Y and one row of RGB
530	diff_y_sum += WebPSharpYUVUpdateY(target_y, best_rgb_y, best_y, `2` * w);
531	WebPSharpYUVUpdateRGB(target_uv, best_rgb_uv, best_uv, `3` * uv_w);
532
533	best_y += `2` * w;
534	best_uv += `3` * uv_w;
535	target_y += `2` * w;
536	target_uv += `3` * uv_w;
537	}
538	// test exit condition
539	if (iter > `0`) {
540	if (diff_y_sum < diff_y_threshold) break;
541	if (diff_y_sum > prev_diff_y_sum) break;
542	}
543	prev_diff_y_sum = diff_y_sum;
544	}
545	// final reconstruction
546	ok = ConvertWRGBToYUV(best_y_base, best_uv_base, picture);
547
548	End:
549	WebPSafeFree(best_y_base);
550	WebPSafeFree(best_uv_base);
551	WebPSafeFree(target_y_base);
552	WebPSafeFree(target_uv_base);
553	WebPSafeFree(best_rgb_y);
554	WebPSafeFree(best_rgb_uv);
555	WebPSafeFree(tmp_buffer);
556	return ok;
557	}
558	#undef SAFE_ALLOC
559
560	//------------------------------------------------------------------------------
561	// "Fast" regular RGB->YUV
562
// Helpers for 2x2 (SUM4) and 1x2 (SUM2) accumulation. They read the variable
// 'rgb_stride' from the scope in which they are expanded.
// SUM4: gamma-compressed sum of the four samples of a 2x2 block.
#define SUM4(ptr, step) LinearToGamma(                     \
    GammaToLinear((ptr)[0]) +                              \
    GammaToLinear((ptr)[(step)]) +                         \
    GammaToLinear((ptr)[rgb_stride]) +                     \
    GammaToLinear((ptr)[rgb_stride + (step)]), 0)

// SUM2: same for a 1x2 column; the shift of 1 doubles the two-sample sum.
#define SUM2(ptr) \
    LinearToGamma(GammaToLinear((ptr)[0]) + GammaToLinear((ptr)[rgb_stride]), 1)

// Plain (non gamma-corrected) sums of alpha samples. SUM4ALPHA assumes the
// horizontally adjacent sample is 4 bytes away.
#define SUM2ALPHA(ptr) ((ptr)[0] + (ptr)[rgb_stride])
#define SUM4ALPHA(ptr) (SUM2ALPHA(ptr) + SUM2ALPHA((ptr) + 4))
574
575	#if defined(USE_INVERSE_ALPHA_TABLE)
576
static const int kAlphaFix = 19;
// Following table is (1 << kAlphaFix) / a. The (v * kInvAlpha[a]) >> kAlphaFix
// formula is then equal to v / a in most (99.6%) cases. Note that this table
// and constant are adjusted very tightly to fit 32b arithmetic.
// In particular, they use the fact that the operands for 'v / a' are actually
// derived as v = (a0.p0 + a1.p1 + a2.p2 + a3.p3) and a = a0 + a1 + a2 + a3
// with ai in [0..255] and pi in [0..1<<kGammaFix). The constraint to avoid
// overflow is: kGammaFix + kAlphaFix <= 31.
static const uint32_t kInvAlpha[4 * 0xff + 1] = {
  0,  /* alpha = 0 */
  524288, 262144, 174762, 131072, 104857, 87381, 74898, 65536,
  58254, 52428, 47662, 43690, 40329, 37449, 34952, 32768,
  30840, 29127, 27594, 26214, 24966, 23831, 22795, 21845,
  20971, 20164, 19418, 18724, 18078, 17476, 16912, 16384,
  15887, 15420, 14979, 14563, 14169, 13797, 13443, 13107,
  12787, 12483, 12192, 11915, 11650, 11397, 11155, 10922,
  10699, 10485, 10280, 10082, 9892, 9709, 9532, 9362,
  9198, 9039, 8886, 8738, 8594, 8456, 8322, 8192,
  8065, 7943, 7825, 7710, 7598, 7489, 7384, 7281,
  7182, 7084, 6990, 6898, 6808, 6721, 6636, 6553,
  6472, 6393, 6316, 6241, 6168, 6096, 6026, 5957,
  5890, 5825, 5761, 5698, 5637, 5577, 5518, 5461,
  5405, 5349, 5295, 5242, 5190, 5140, 5090, 5041,
  4993, 4946, 4899, 4854, 4809, 4766, 4723, 4681,
  4639, 4599, 4559, 4519, 4481, 4443, 4405, 4369,
  4332, 4297, 4262, 4228, 4194, 4161, 4128, 4096,
  4064, 4032, 4002, 3971, 3942, 3912, 3883, 3855,
  3826, 3799, 3771, 3744, 3718, 3692, 3666, 3640,
  3615, 3591, 3566, 3542, 3518, 3495, 3472, 3449,
  3426, 3404, 3382, 3360, 3339, 3318, 3297, 3276,
  3256, 3236, 3216, 3196, 3177, 3158, 3139, 3120,
  3102, 3084, 3066, 3048, 3030, 3013, 2995, 2978,
  2962, 2945, 2928, 2912, 2896, 2880, 2864, 2849,
  2833, 2818, 2803, 2788, 2774, 2759, 2744, 2730,
  2716, 2702, 2688, 2674, 2661, 2647, 2634, 2621,
  2608, 2595, 2582, 2570, 2557, 2545, 2532, 2520,
  2508, 2496, 2484, 2473, 2461, 2449, 2438, 2427,
  2416, 2404, 2394, 2383, 2372, 2361, 2351, 2340,
  2330, 2319, 2309, 2299, 2289, 2279, 2269, 2259,
  2250, 2240, 2231, 2221, 2212, 2202, 2193, 2184,
  2175, 2166, 2157, 2148, 2139, 2131, 2122, 2114,
  2105, 2097, 2088, 2080, 2072, 2064, 2056, 2048,
  2040, 2032, 2024, 2016, 2008, 2001, 1993, 1985,
  1978, 1971, 1963, 1956, 1949, 1941, 1934, 1927,
  1920, 1913, 1906, 1899, 1892, 1885, 1879, 1872,
  1865, 1859, 1852, 1846, 1839, 1833, 1826, 1820,
  1814, 1807, 1801, 1795, 1789, 1783, 1777, 1771,
  1765, 1759, 1753, 1747, 1741, 1736, 1730, 1724,
  1718, 1713, 1707, 1702, 1696, 1691, 1685, 1680,
  1675, 1669, 1664, 1659, 1653, 1648, 1643, 1638,
  1633, 1628, 1623, 1618, 1613, 1608, 1603, 1598,
  1593, 1588, 1583, 1579, 1574, 1569, 1565, 1560,
  1555, 1551, 1546, 1542, 1537, 1533, 1528, 1524,
  1519, 1515, 1510, 1506, 1502, 1497, 1493, 1489,
  1485, 1481, 1476, 1472, 1468, 1464, 1460, 1456,
  1452, 1448, 1444, 1440, 1436, 1432, 1428, 1424,
  1420, 1416, 1413, 1409, 1405, 1401, 1398, 1394,
  1390, 1387, 1383, 1379, 1376, 1372, 1368, 1365,
  1361, 1358, 1354, 1351, 1347, 1344, 1340, 1337,
  1334, 1330, 1327, 1323, 1320, 1317, 1314, 1310,
  1307, 1304, 1300, 1297, 1294, 1291, 1288, 1285,
  1281, 1278, 1275, 1272, 1269, 1266, 1263, 1260,
  1257, 1254, 1251, 1248, 1245, 1242, 1239, 1236,
  1233, 1230, 1227, 1224, 1222, 1219, 1216, 1213,
  1210, 1208, 1205, 1202, 1199, 1197, 1194, 1191,
  1188, 1186, 1183, 1180, 1178, 1175, 1172, 1170,
  1167, 1165, 1162, 1159, 1157, 1154, 1152, 1149,
  1147, 1144, 1142, 1139, 1137, 1134, 1132, 1129,
  1127, 1125, 1122, 1120, 1117, 1115, 1113, 1110,
  1108, 1106, 1103, 1101, 1099, 1096, 1094, 1092,
  1089, 1087, 1085, 1083, 1081, 1078, 1076, 1074,
  1072, 1069, 1067, 1065, 1063, 1061, 1059, 1057,
  1054, 1052, 1050, 1048, 1046, 1044, 1042, 1040,
  1038, 1036, 1034, 1032, 1030, 1028, 1026, 1024,
  1022, 1020, 1018, 1016, 1014, 1012, 1010, 1008,
  1006, 1004, 1002, 1000, 998, 996, 994, 992,
  991, 989, 987, 985, 983, 981, 979, 978,
  976, 974, 972, 970, 969, 967, 965, 963,
  961, 960, 958, 956, 954, 953, 951, 949,
  948, 946, 944, 942, 941, 939, 937, 936,
  934, 932, 931, 929, 927, 926, 924, 923,
  921, 919, 918, 916, 914, 913, 911, 910,
  908, 907, 905, 903, 902, 900, 899, 897,
  896, 894, 893, 891, 890, 888, 887, 885,
  884, 882, 881, 879, 878, 876, 875, 873,
  872, 870, 869, 868, 866, 865, 863, 862,
  860, 859, 858, 856, 855, 853, 852, 851,
  849, 848, 846, 845, 844, 842, 841, 840,
  838, 837, 836, 834, 833, 832, 830, 829,
  828, 826, 825, 824, 823, 821, 820, 819,
  817, 816, 815, 814, 812, 811, 810, 809,
  807, 806, 805, 804, 802, 801, 800, 799,
  798, 796, 795, 794, 793, 791, 790, 789,
  788, 787, 786, 784, 783, 782, 781, 780,
  779, 777, 776, 775, 774, 773, 772, 771,
  769, 768, 767, 766, 765, 764, 763, 762,
  760, 759, 758, 757, 756, 755, 754, 753,
  752, 751, 750, 748, 747, 746, 745, 744,
  743, 742, 741, 740, 739, 738, 737, 736,
  735, 734, 733, 732, 731, 730, 729, 728,
  727, 726, 725, 724, 723, 722, 721, 720,
  719, 718, 717, 716, 715, 714, 713, 712,
  711, 710, 709, 708, 707, 706, 705, 704,
  703, 702, 701, 700, 699, 699, 698, 697,
  696, 695, 694, 693, 692, 691, 690, 689,
  688, 688, 687, 686, 685, 684, 683, 682,
  681, 680, 680, 679, 678, 677, 676, 675,
  674, 673, 673, 672, 671, 670, 669, 668,
  667, 667, 666, 665, 664, 663, 662, 661,
  661, 660, 659, 658, 657, 657, 656, 655,
  654, 653, 652, 652, 651, 650, 649, 648,
  648, 647, 646, 645, 644, 644, 643, 642,
  641, 640, 640, 639, 638, 637, 637, 636,
  635, 634, 633, 633, 632, 631, 630, 630,
  629, 628, 627, 627, 626, 625, 624, 624,
  623, 622, 621, 621, 620, 619, 618, 618,
  617, 616, 616, 615, 614, 613, 613, 612,
  611, 611, 610, 609, 608, 608, 607, 606,
  606, 605, 604, 604, 603, 602, 601, 601,
  600, 599, 599, 598, 597, 597, 596, 595,
  595, 594, 593, 593, 592, 591, 591, 590,
  589, 589, 588, 587, 587, 586, 585, 585,
  584, 583, 583, 582, 581, 581, 580, 579,
  579, 578, 578, 577, 576, 576, 575, 574,
  574, 573, 572, 572, 571, 571, 570, 569,
  569, 568, 568, 567, 566, 566, 565, 564,
  564, 563, 563, 562, 561, 561, 560, 560,
  559, 558, 558, 557, 557, 556, 555, 555,
  554, 554, 553, 553, 552, 551, 551, 550,
  550, 549, 548, 548, 547, 547, 546, 546,
  545, 544, 544, 543, 543, 542, 542, 541,
  541, 540, 539, 539, 538, 538, 537, 537,
  536, 536, 535, 534, 534, 533, 533, 532,
  532, 531, 531, 530, 530, 529, 529, 528,
  527, 527, 526, 526, 525, 525, 524, 524,
  523, 523, 522, 522, 521, 521, 520, 520,
  519, 519, 518, 518, 517, 517, 516, 516,
  515, 515, 514, 514
};
716
717	// Note that LinearToGamma() expects the values to be premultiplied by 4,
718	// so we incorporate this factor 4 inside the DIVIDE_BY_ALPHA macro directly.
719	#define DIVIDE_BY_ALPHA(sum, a) (((sum) * kInvAlpha[(a)]) >> (kAlphaFix - 2))
720
721	#else
722
723	#define DIVIDE_BY_ALPHA(sum, a) (4 * (sum) / (a))
724
725	#endif // USE_INVERSE_ALPHA_TABLE
726
727	static WEBP_INLINE int LinearToGammaWeighted(const uint8_t* src,
728	const uint8_t* a_ptr,
729	uint32_t total_a, int step,
730	int rgb_stride) {
731	const uint32_t sum =
732	a_ptr[`0`] * GammaToLinear(src[`0`]) +
733	a_ptr[step] * GammaToLinear(src[step]) +
734	a_ptr[rgb_stride] * GammaToLinear(src[rgb_stride]) +
735	a_ptr[rgb_stride + step] * GammaToLinear(src[rgb_stride + step]);
736	assert(total_a > `0` && total_a <= `4` * `0xff`);
737	#if defined(USE_INVERSE_ALPHA_TABLE)
738	assert((uint64_t)sum * kInvAlpha[total_a] < ((uint64_t)`1` << `32`));
739	#endif
740	return LinearToGamma(DIVIDE_BY_ALPHA(sum, total_a), `0`);
741	}
742
743	static WEBP_INLINE void ConvertRowToY(const uint8_t* const r_ptr,
744	const uint8_t* const g_ptr,
745	const uint8_t* const b_ptr,
746	int step,
747	uint8_t* const dst_y,
748	int width,
749	VP8Random* const rg) {
750	int i, j;
751	for (i = `0`, j = `0`; i < width; i += `1`, j += step) {
752	dst_y[i] = RGBToY(r_ptr[j], g_ptr[j], b_ptr[j], rg);
753	}
754	}
755
756	static WEBP_INLINE void AccumulateRGBA(const uint8_t* const r_ptr,
757	const uint8_t* const g_ptr,
758	const uint8_t* const b_ptr,
759	const uint8_t* const a_ptr,
760	int rgb_stride,
761	uint16_t* dst, int width) {
762	int i, j;
763	// we loop over 2x2 blocks and produce one R/G/B/A value for each.
764	for (i = `0`, j = `0`; i < (width >> `1`); i += `1`, j += `2` * `4`, dst += `4`) {
765	const uint32_t a = SUM4ALPHA(a_ptr + j);
766	int r, g, b;
767	if (a == `4` * `0xff` \|\| a == `0`) {
768	r = SUM4(r_ptr + j, `4`);
769	g = SUM4(g_ptr + j, `4`);
770	b = SUM4(b_ptr + j, `4`);
771	} else {
772	r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, `4`, rgb_stride);
773	g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, `4`, rgb_stride);
774	b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, `4`, rgb_stride);
775	}
776	dst[`0`] = r;
777	dst[`1`] = g;
778	dst[`2`] = b;
779	dst[`3`] = a;
780	}
781	if (width & `1`) {
782	const uint32_t a = `2u` * SUM2ALPHA(a_ptr + j);
783	int r, g, b;
784	if (a == `4` * `0xff` \|\| a == `0`) {
785	r = SUM2(r_ptr + j);
786	g = SUM2(g_ptr + j);
787	b = SUM2(b_ptr + j);
788	} else {
789	r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, `0`, rgb_stride);
790	g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, `0`, rgb_stride);
791	b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, `0`, rgb_stride);
792	}
793	dst[`0`] = r;
794	dst[`1`] = g;
795	dst[`2`] = b;
796	dst[`3`] = a;
797	}
798	}
799
800	static WEBP_INLINE void AccumulateRGB(const uint8_t* const r_ptr,
801	const uint8_t* const g_ptr,
802	const uint8_t* const b_ptr,
803	int step, int rgb_stride,
804	uint16_t* dst, int width) {
805	int i, j;
806	for (i = `0`, j = `0`; i < (width >> `1`); i += `1`, j += `2` * step, dst += `4`) {
807	dst[`0`] = SUM4(r_ptr + j, step);
808	dst[`1`] = SUM4(g_ptr + j, step);
809	dst[`2`] = SUM4(b_ptr + j, step);
810	}
811	if (width & `1`) {
812	dst[`0`] = SUM2(r_ptr + j);
813	dst[`1`] = SUM2(g_ptr + j);
814	dst[`2`] = SUM2(b_ptr + j);
815	}
816	}
817
818	static WEBP_INLINE void ConvertRowsToUV(const uint16_t* rgb,
819	uint8_t* const dst_u,
820	uint8_t* const dst_v,
821	int width,
822	VP8Random* const rg) {
823	int i;
824	for (i = `0`; i < width; i += `1`, rgb += `4`) {
825	const int r = rgb[`0`], g = rgb[`1`], b = rgb[`2`];
826	dst_u[i] = RGBToU(r, g, b, rg);
827	dst_v[i] = RGBToV(r, g, b, rg);
828	}
829	}
830
831	static int ImportYUVAFromRGBA(const uint8_t* r_ptr,
832	const uint8_t* g_ptr,
833	const uint8_t* b_ptr,
834	const uint8_t* a_ptr,
835	int step, // bytes per pixel
836	int rgb_stride, // bytes per scanline
837	float dithering,
838	int use_iterative_conversion,
839	WebPPicture* const picture) {
840	int y;
841	const int width = picture->width;
842	const int height = picture->height;
843	const int has_alpha = CheckNonOpaque(a_ptr, width, height, step, rgb_stride);
844	const int is_rgb = (r_ptr < b_ptr); // otherwise it's bgr
845
846	picture->colorspace = has_alpha ? WEBP_YUV420A : WEBP_YUV420;
847	picture->use_argb = `0`;
848
849	// disable smart conversion if source is too small (overkill).
850	if (width < kMinDimensionIterativeConversion \|\|
851	height < kMinDimensionIterativeConversion) {
852	use_iterative_conversion = `0`;
853	}
854
855	if (!WebPPictureAllocYUVA(picture, width, height)) {
856	return `0`;
857	}
858	if (has_alpha) {
859	WebPInitAlphaProcessing();
860	assert(step == `4`);
861	#if defined(USE_GAMMA_COMPRESSION) && defined(USE_INVERSE_ALPHA_TABLE)
862	assert(kAlphaFix + kGammaFix <= `31`);
863	#endif
864	}
865
866	if (use_iterative_conversion) {
867	InitGammaTablesF();
868	if (!PreprocessARGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, picture)) {
869	return `0`;
870	}
871	if (has_alpha) {
872	WebPExtractAlpha(a_ptr, rgb_stride, width, height,
873	picture->a, picture->a_stride);
874	}
875	} else {
876	const int uv_width = (width + `1`) >> `1`;
877	int use_dsp = (step == `3`); // use special function in this case
878	// temporary storage for accumulated R/G/B values during conversion to U/V
879	uint16_t* const tmp_rgb =
880	(uint16_t)WebPSafeMalloc(`4` uv_width, sizeof(*tmp_rgb));
881	uint8_t* dst_y = picture->y;
882	uint8_t* dst_u = picture->u;
883	uint8_t* dst_v = picture->v;
884	uint8_t* dst_a = picture->a;
885
886	VP8Random base_rg;
887	VP8Random* rg = NULL;
888	if (dithering > `0.`) {
889	VP8InitRandom(&base_rg, dithering);
890	rg = &base_rg;
891	use_dsp = `0`; // can't use dsp in this case
892	}
893	WebPInitConvertARGBToYUV();
894	InitGammaTables();
895
896	if (tmp_rgb == NULL) return `0`; // malloc error
897
898	// Downsample Y/U/V planes, two rows at a time
899	for (y = `0`; y < (height >> `1`); ++y) {
900	int rows_have_alpha = has_alpha;
901	if (use_dsp) {
902	if (is_rgb) {
903	WebPConvertRGB24ToY(r_ptr, dst_y, width);
904	WebPConvertRGB24ToY(r_ptr + rgb_stride,
905	dst_y + picture->y_stride, width);
906	} else {
907	WebPConvertBGR24ToY(b_ptr, dst_y, width);
908	WebPConvertBGR24ToY(b_ptr + rgb_stride,
909	dst_y + picture->y_stride, width);
910	}
911	} else {
912	ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg);
913	ConvertRowToY(r_ptr + rgb_stride,
914	g_ptr + rgb_stride,
915	b_ptr + rgb_stride, step,
916	dst_y + picture->y_stride, width, rg);
917	}
918	dst_y += `2` * picture->y_stride;
919	if (has_alpha) {
920	rows_have_alpha &= !WebPExtractAlpha(a_ptr, rgb_stride, width, `2`,
921	dst_a, picture->a_stride);
922	dst_a += `2` * picture->a_stride;
923	}
924	// Collect averaged R/G/B(/A)
925	if (!rows_have_alpha) {
926	AccumulateRGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, tmp_rgb, width);
927	} else {
928	AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, rgb_stride, tmp_rgb, width);
929	}
930	// Convert to U/V
931	if (rg == NULL) {
932	WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width);
933	} else {
934	ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg);
935	}
936	dst_u += picture->uv_stride;
937	dst_v += picture->uv_stride;
938	r_ptr += `2` * rgb_stride;
939	b_ptr += `2` * rgb_stride;
940	g_ptr += `2` * rgb_stride;
941	if (has_alpha) a_ptr += `2` * rgb_stride;
942	}
943	if (height & `1`) { // extra last row
944	int row_has_alpha = has_alpha;
945	if (use_dsp) {
946	if (r_ptr < b_ptr) {
947	WebPConvertRGB24ToY(r_ptr, dst_y, width);
948	} else {
949	WebPConvertBGR24ToY(b_ptr, dst_y, width);
950	}
951	} else {
952	ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg);
953	}
954	if (row_has_alpha) {
955	row_has_alpha &= !WebPExtractAlpha(a_ptr, `0`, width, `1`, dst_a, `0`);
956	}
957	// Collect averaged R/G/B(/A)
958	if (!row_has_alpha) {
959	// Collect averaged R/G/B
960	AccumulateRGB(r_ptr, g_ptr, b_ptr, step, / rgb_stride = / `0`,
961	tmp_rgb, width);
962	} else {
963	AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, / rgb_stride = / `0`,
964	tmp_rgb, width);
965	}
966	if (rg == NULL) {
967	WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width);
968	} else {
969	ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg);
970	}
971	}
972	WebPSafeFree(tmp_rgb);
973	}
974	return `1`;
975	}
976
977	#undef SUM4
978	#undef SUM2
979	#undef SUM4ALPHA
980	#undef SUM2ALPHA
981
982	//------------------------------------------------------------------------------
983	// call for ARGB->YUVA conversion
984
985	static int PictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace,
986	float dithering, int use_iterative_conversion) {
987	if (picture == NULL) return `0`;
988	if (picture->argb == NULL) {
989	return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
990	} else if ((colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) {
991	return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION);
992	} else {
993	const uint8_t* const argb = (const uint8_t*)picture->argb;
994	const uint8_t* const r = ALPHA_IS_LAST ? argb + `2` : argb + `1`;
995	const uint8_t* const g = ALPHA_IS_LAST ? argb + `1` : argb + `2`;
996	const uint8_t* const b = ALPHA_IS_LAST ? argb + `0` : argb + `3`;
997	const uint8_t* const a = ALPHA_IS_LAST ? argb + `3` : argb + `0`;
998
999	picture->colorspace = WEBP_YUV420;
1000	return ImportYUVAFromRGBA(r, g, b, a, `4`, `4` * picture->argb_stride,
1001	dithering, use_iterative_conversion, picture);
1002	}
1003	}
1004
1005	int WebPPictureARGBToYUVADithered(WebPPicture* picture, WebPEncCSP colorspace,
1006	float dithering) {
1007	return PictureARGBToYUVA(picture, colorspace, dithering, `0`);
1008	}
1009
1010	int WebPPictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace) {
1011	return PictureARGBToYUVA(picture, colorspace, `0.f`, `0`);
1012	}
1013
1014	int WebPPictureSharpARGBToYUVA(WebPPicture* picture) {
1015	return PictureARGBToYUVA(picture, WEBP_YUV420, `0.f`, `1`);
1016	}
1017	// for backward compatibility
1018	int WebPPictureSmartARGBToYUVA(WebPPicture* picture) {
1019	return WebPPictureSharpARGBToYUVA(picture);
1020	}
1021
1022	//------------------------------------------------------------------------------
1023	// call for YUVA -> ARGB conversion
1024
1025	int WebPPictureYUVAToARGB(WebPPicture* picture) {
1026	if (picture == NULL) return `0`;
1027	if (picture->y == NULL \|\| picture->u == NULL \|\| picture->v == NULL) {
1028	return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
1029	}
1030	if ((picture->colorspace & WEBP_CSP_ALPHA_BIT) && picture->a == NULL) {
1031	return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
1032	}
1033	if ((picture->colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) {
1034	return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION);
1035	}
1036	// Allocate a new argb buffer (discarding the previous one).
1037	if (!WebPPictureAllocARGB(picture, picture->width, picture->height)) return `0`;
1038	picture->use_argb = `1`;
1039
1040	// Convert
1041	{
1042	int y;
1043	const int width = picture->width;
1044	const int height = picture->height;
1045	const int argb_stride = `4` * picture->argb_stride;
1046	uint8_t* dst = (uint8_t*)picture->argb;
1047	const uint8_t cur_u = picture->u, cur_v = picture->v, *cur_y = picture->y;
1048	WebPUpsampleLinePairFunc upsample = WebPGetLinePairConverter(ALPHA_IS_LAST);
1049
1050	// First row, with replicated top samples.
1051	upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width);
1052	cur_y += picture->y_stride;
1053	dst += argb_stride;
1054	// Center rows.
1055	for (y = `1`; y + `1` < height; y += `2`) {
1056	const uint8_t* const top_u = cur_u;
1057	const uint8_t* const top_v = cur_v;
1058	cur_u += picture->uv_stride;
1059	cur_v += picture->uv_stride;
1060	upsample(cur_y, cur_y + picture->y_stride, top_u, top_v, cur_u, cur_v,
1061	dst, dst + argb_stride, width);
1062	cur_y += `2` * picture->y_stride;
1063	dst += `2` * argb_stride;
1064	}
1065	// Last row (if needed), with replicated bottom samples.
1066	if (height > `1` && !(height & `1`)) {
1067	upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width);
1068	}
1069	// Insert alpha values if needed, in replacement for the default 0xff ones.
1070	if (picture->colorspace & WEBP_CSP_ALPHA_BIT) {
1071	for (y = `0`; y < height; ++y) {
1072	uint32_t* const argb_dst = picture->argb + y * picture->argb_stride;
1073	const uint8_t* const src = picture->a + y * picture->a_stride;
1074	int x;
1075	for (x = `0`; x < width; ++x) {
1076	argb_dst[x] = (argb_dst[x] & `0x00ffffffu`) \| ((uint32_t)src[x] << `24`);
1077	}
1078	}
1079	}
1080	}
1081	return `1`;
1082	}
1083
1084	//------------------------------------------------------------------------------
1085	// automatic import / conversion
1086
1087	static int Import(WebPPicture* const picture,
1088	const uint8_t* const rgb, int rgb_stride,
1089	int step, int swap_rb, int import_alpha) {
1090	int y;
1091	const uint8_t* r_ptr = rgb + (swap_rb ? `2` : `0`);
1092	const uint8_t* g_ptr = rgb + `1`;
1093	const uint8_t* b_ptr = rgb + (swap_rb ? `0` : `2`);
1094	const uint8_t* a_ptr = import_alpha ? rgb + `3` : NULL;
1095	const int width = picture->width;
1096	const int height = picture->height;
1097
1098	if (!picture->use_argb) {
1099	return ImportYUVAFromRGBA(r_ptr, g_ptr, b_ptr, a_ptr, step, rgb_stride,
1100	`0.f` / no dithering /, `0`, picture);
1101	}
1102	if (!WebPPictureAlloc(picture)) return `0`;
1103
1104	VP8EncDspARGBInit();
1105
1106	if (import_alpha) {
1107	uint32_t* dst = picture->argb;
1108	assert(step == `4`);
1109	for (y = `0`; y < height; ++y) {
1110	VP8PackARGB(a_ptr, r_ptr, g_ptr, b_ptr, width, dst);
1111	a_ptr += rgb_stride;
1112	r_ptr += rgb_stride;
1113	g_ptr += rgb_stride;
1114	b_ptr += rgb_stride;
1115	dst += picture->argb_stride;
1116	}
1117	} else {
1118	uint32_t* dst = picture->argb;
1119	assert(step >= `3`);
1120	for (y = `0`; y < height; ++y) {
1121	VP8PackRGB(r_ptr, g_ptr, b_ptr, width, step, dst);
1122	r_ptr += rgb_stride;
1123	g_ptr += rgb_stride;
1124	b_ptr += rgb_stride;
1125	dst += picture->argb_stride;
1126	}
1127	}
1128	return `1`;
1129	}
1130
1131	// Public API
1132
1133	int WebPPictureImportRGB(WebPPicture* picture,
1134	const uint8_t* rgb, int rgb_stride) {
1135	return (picture != NULL && rgb != NULL)
1136	? Import(picture, rgb, rgb_stride, `3`, `0`, `0`)
1137	: `0`;
1138	}
1139
1140	int WebPPictureImportBGR(WebPPicture* picture,
1141	const uint8_t* rgb, int rgb_stride) {
1142	return (picture != NULL && rgb != NULL)
1143	? Import(picture, rgb, rgb_stride, `3`, `1`, `0`)
1144	: `0`;
1145	}
1146
1147	int WebPPictureImportRGBA(WebPPicture* picture,
1148	const uint8_t* rgba, int rgba_stride) {
1149	return (picture != NULL && rgba != NULL)
1150	? Import(picture, rgba, rgba_stride, `4`, `0`, `1`)
1151	: `0`;
1152	}
1153
1154	int WebPPictureImportBGRA(WebPPicture* picture,
1155	const uint8_t* rgba, int rgba_stride) {
1156	return (picture != NULL && rgba != NULL)
1157	? Import(picture, rgba, rgba_stride, `4`, `1`, `1`)
1158	: `0`;
1159	}
1160
1161	int WebPPictureImportRGBX(WebPPicture* picture,
1162	const uint8_t* rgba, int rgba_stride) {
1163	return (picture != NULL && rgba != NULL)
1164	? Import(picture, rgba, rgba_stride, `4`, `0`, `0`)
1165	: `0`;
1166	}
1167
1168	int WebPPictureImportBGRX(WebPPicture* picture,
1169	const uint8_t* rgba, int rgba_stride) {
1170	return (picture != NULL && rgba != NULL)
1171	? Import(picture, rgba, rgba_stride, `4`, `1`, `0`)
1172	: `0`;
1173	}
1174
1175	//------------------------------------------------------------------------------
1176

Browse the source code of engine/third_party/libwebp/src/enc/picture_csp_enc.c