1 | // Copyright 2014 Google Inc. All Rights Reserved. |
2 | // |
3 | // Use of this source code is governed by a BSD-style license |
4 | // that can be found in the COPYING file in the root of the source |
5 | // tree. An additional intellectual property rights grant can be found |
6 | // in the file PATENTS. All contributing project authors may |
7 | // be found in the AUTHORS file in the root of the source tree. |
8 | // ----------------------------------------------------------------------------- |
9 | // |
10 | // WebPPicture utils for colorspace conversion |
11 | // |
12 | // Author: Skal (pascal.massimino@gmail.com) |
13 | |
14 | #include <assert.h> |
15 | #include <stdlib.h> |
16 | #include <math.h> |
17 | |
18 | #include "./vp8i_enc.h" |
19 | #include "../utils/random_utils.h" |
20 | #include "../utils/utils.h" |
21 | #include "../dsp/yuv.h" |
22 | |
23 | // Uncomment to disable gamma-compression during RGB->U/V averaging |
24 | #define USE_GAMMA_COMPRESSION |
25 | |
26 | // If defined, use table to compute x / alpha. |
27 | #define USE_INVERSE_ALPHA_TABLE |
28 | |
29 | static const union { |
30 | uint32_t argb; |
31 | uint8_t bytes[4]; |
32 | } test_endian = { 0xff000000u }; |
33 | #define ALPHA_IS_LAST (test_endian.bytes[3] == 0xff) |
34 | |
35 | //------------------------------------------------------------------------------ |
36 | // Detection of non-trivial transparency |
37 | |
38 | // Returns true if alpha[] has non-0xff values. |
39 | static int CheckNonOpaque(const uint8_t* alpha, int width, int height, |
40 | int x_step, int y_step) { |
41 | if (alpha == NULL) return 0; |
42 | while (height-- > 0) { |
43 | int x; |
44 | for (x = 0; x < width * x_step; x += x_step) { |
45 | if (alpha[x] != 0xff) return 1; // TODO(skal): check 4/8 bytes at a time. |
46 | } |
47 | alpha += y_step; |
48 | } |
49 | return 0; |
50 | } |
51 | |
52 | // Checking for the presence of non-opaque alpha. |
53 | int WebPPictureHasTransparency(const WebPPicture* picture) { |
54 | if (picture == NULL) return 0; |
55 | if (!picture->use_argb) { |
56 | return CheckNonOpaque(picture->a, picture->width, picture->height, |
57 | 1, picture->a_stride); |
58 | } else { |
59 | int x, y; |
60 | const uint32_t* argb = picture->argb; |
61 | if (argb == NULL) return 0; |
62 | for (y = 0; y < picture->height; ++y) { |
63 | for (x = 0; x < picture->width; ++x) { |
64 | if (argb[x] < 0xff000000u) return 1; // test any alpha values != 0xff |
65 | } |
66 | argb += picture->argb_stride; |
67 | } |
68 | } |
69 | return 0; |
70 | } |
71 | |
72 | //------------------------------------------------------------------------------ |
73 | // Code for gamma correction |
74 | |
75 | #if defined(USE_GAMMA_COMPRESSION) |
76 | |
77 | // gamma-compensates loss of resolution during chroma subsampling |
78 | #define kGamma 0.80 // for now we use a different gamma value than kGammaF |
79 | #define kGammaFix 12 // fixed-point precision for linear values |
80 | #define kGammaScale ((1 << kGammaFix) - 1) |
81 | #define kGammaTabFix 7 // fixed-point fractional bits precision |
82 | #define kGammaTabScale (1 << kGammaTabFix) |
83 | #define kGammaTabRounder (kGammaTabScale >> 1) |
84 | #define kGammaTabSize (1 << (kGammaFix - kGammaTabFix)) |
85 | |
86 | static int kLinearToGammaTab[kGammaTabSize + 1]; |
87 | static uint16_t kGammaToLinearTab[256]; |
88 | static volatile int kGammaTablesOk = 0; |
89 | |
90 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) { |
91 | if (!kGammaTablesOk) { |
92 | int v; |
93 | const double scale = (double)(1 << kGammaTabFix) / kGammaScale; |
94 | const double norm = 1. / 255.; |
95 | for (v = 0; v <= 255; ++v) { |
96 | kGammaToLinearTab[v] = |
97 | (uint16_t)(pow(norm * v, kGamma) * kGammaScale + .5); |
98 | } |
99 | for (v = 0; v <= kGammaTabSize; ++v) { |
100 | kLinearToGammaTab[v] = (int)(255. * pow(scale * v, 1. / kGamma) + .5); |
101 | } |
102 | kGammaTablesOk = 1; |
103 | } |
104 | } |
105 | |
106 | static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { |
107 | return kGammaToLinearTab[v]; |
108 | } |
109 | |
110 | static WEBP_INLINE int Interpolate(int v) { |
111 | const int tab_pos = v >> (kGammaTabFix + 2); // integer part |
112 | const int x = v & ((kGammaTabScale << 2) - 1); // fractional part |
113 | const int v0 = kLinearToGammaTab[tab_pos]; |
114 | const int v1 = kLinearToGammaTab[tab_pos + 1]; |
115 | const int y = v1 * x + v0 * ((kGammaTabScale << 2) - x); // interpolate |
116 | assert(tab_pos + 1 < kGammaTabSize + 1); |
117 | return y; |
118 | } |
119 | |
120 | // Convert a linear value 'v' to YUV_FIX+2 fixed-point precision |
121 | // U/V value, suitable for RGBToU/V calls. |
122 | static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) { |
123 | const int y = Interpolate(base_value << shift); // final uplifted value |
124 | return (y + kGammaTabRounder) >> kGammaTabFix; // descale |
125 | } |
126 | |
127 | #else |
128 | |
129 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) {} |
130 | static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { return v; } |
131 | static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) { |
132 | return (int)(base_value << shift); |
133 | } |
134 | |
135 | #endif // USE_GAMMA_COMPRESSION |
136 | |
137 | //------------------------------------------------------------------------------ |
138 | // RGB -> YUV conversion |
139 | |
140 | static int RGBToY(int r, int g, int b, VP8Random* const rg) { |
141 | return (rg == NULL) ? VP8RGBToY(r, g, b, YUV_HALF) |
142 | : VP8RGBToY(r, g, b, VP8RandomBits(rg, YUV_FIX)); |
143 | } |
144 | |
145 | static int RGBToU(int r, int g, int b, VP8Random* const rg) { |
146 | return (rg == NULL) ? VP8RGBToU(r, g, b, YUV_HALF << 2) |
147 | : VP8RGBToU(r, g, b, VP8RandomBits(rg, YUV_FIX + 2)); |
148 | } |
149 | |
150 | static int RGBToV(int r, int g, int b, VP8Random* const rg) { |
151 | return (rg == NULL) ? VP8RGBToV(r, g, b, YUV_HALF << 2) |
152 | : VP8RGBToV(r, g, b, VP8RandomBits(rg, YUV_FIX + 2)); |
153 | } |
154 | |
155 | //------------------------------------------------------------------------------ |
156 | // Sharp RGB->YUV conversion |
157 | |
158 | static const int kNumIterations = 4; |
159 | static const int kMinDimensionIterativeConversion = 4; |
160 | |
161 | // We could use SFIX=0 and only uint8_t for fixed_y_t, but it produces some |
162 | // banding sometimes. Better use extra precision. |
163 | #define SFIX 2 // fixed-point precision of RGB and Y/W |
164 | typedef int16_t fixed_t; // signed type with extra SFIX precision for UV |
165 | typedef uint16_t fixed_y_t; // unsigned type with extra SFIX precision for W |
166 | |
167 | #define SHALF (1 << SFIX >> 1) |
168 | #define MAX_Y_T ((256 << SFIX) - 1) |
169 | #define SROUNDER (1 << (YUV_FIX + SFIX - 1)) |
170 | |
171 | #if defined(USE_GAMMA_COMPRESSION) |
172 | |
173 | // float variant of gamma-correction |
174 | // We use tables of different size and precision for the Rec709 |
175 | // transfer function. |
176 | #define kGammaF (1./0.45) |
177 | static float kGammaToLinearTabF[MAX_Y_T + 1]; // size scales with Y_FIX |
178 | static float kLinearToGammaTabF[kGammaTabSize + 2]; |
179 | static volatile int kGammaTablesFOk = 0; |
180 | |
181 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) { |
182 | if (!kGammaTablesFOk) { |
183 | int v; |
184 | const double norm = 1. / MAX_Y_T; |
185 | const double scale = 1. / kGammaTabSize; |
186 | const double a = 0.099; |
187 | const double thresh = 0.018; |
188 | for (v = 0; v <= MAX_Y_T; ++v) { |
189 | const double g = norm * v; |
190 | if (g <= thresh * 4.5) { |
191 | kGammaToLinearTabF[v] = (float)(g / 4.5); |
192 | } else { |
193 | const double a_rec = 1. / (1. + a); |
194 | kGammaToLinearTabF[v] = (float)pow(a_rec * (g + a), kGammaF); |
195 | } |
196 | } |
197 | for (v = 0; v <= kGammaTabSize; ++v) { |
198 | const double g = scale * v; |
199 | double value; |
200 | if (g <= thresh) { |
201 | value = 4.5 * g; |
202 | } else { |
203 | value = (1. + a) * pow(g, 1. / kGammaF) - a; |
204 | } |
205 | kLinearToGammaTabF[v] = (float)(MAX_Y_T * value); |
206 | } |
207 | // to prevent small rounding errors to cause read-overflow: |
208 | kLinearToGammaTabF[kGammaTabSize + 1] = kLinearToGammaTabF[kGammaTabSize]; |
209 | kGammaTablesFOk = 1; |
210 | } |
211 | } |
212 | |
213 | static WEBP_INLINE float GammaToLinearF(int v) { |
214 | return kGammaToLinearTabF[v]; |
215 | } |
216 | |
217 | static WEBP_INLINE int LinearToGammaF(float value) { |
218 | const float v = value * kGammaTabSize; |
219 | const int tab_pos = (int)v; |
220 | const float x = v - (float)tab_pos; // fractional part |
221 | const float v0 = kLinearToGammaTabF[tab_pos + 0]; |
222 | const float v1 = kLinearToGammaTabF[tab_pos + 1]; |
223 | const float y = v1 * x + v0 * (1.f - x); // interpolate |
224 | return (int)(y + .5); |
225 | } |
226 | |
227 | #else |
228 | |
229 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) {} |
230 | static WEBP_INLINE float GammaToLinearF(int v) { |
231 | const float norm = 1.f / MAX_Y_T; |
232 | return norm * v; |
233 | } |
234 | static WEBP_INLINE int LinearToGammaF(float value) { |
235 | return (int)(MAX_Y_T * value + .5); |
236 | } |
237 | |
238 | #endif // USE_GAMMA_COMPRESSION |
239 | |
240 | //------------------------------------------------------------------------------ |
241 | |
242 | static uint8_t clip_8b(fixed_t v) { |
243 | return (!(v & ~0xff)) ? (uint8_t)v : (v < 0) ? 0u : 255u; |
244 | } |
245 | |
246 | static fixed_y_t clip_y(int y) { |
247 | return (!(y & ~MAX_Y_T)) ? (fixed_y_t)y : (y < 0) ? 0 : MAX_Y_T; |
248 | } |
249 | |
250 | //------------------------------------------------------------------------------ |
251 | |
252 | static int RGBToGray(int r, int g, int b) { |
253 | const int luma = 13933 * r + 46871 * g + 4732 * b + YUV_HALF; |
254 | return (luma >> YUV_FIX); |
255 | } |
256 | |
257 | static float RGBToGrayF(float r, float g, float b) { |
258 | return (float)(0.2126 * r + 0.7152 * g + 0.0722 * b); |
259 | } |
260 | |
261 | static int ScaleDown(int a, int b, int c, int d) { |
262 | const float A = GammaToLinearF(a); |
263 | const float B = GammaToLinearF(b); |
264 | const float C = GammaToLinearF(c); |
265 | const float D = GammaToLinearF(d); |
266 | return LinearToGammaF(0.25f * (A + B + C + D)); |
267 | } |
268 | |
269 | static WEBP_INLINE void UpdateW(const fixed_y_t* src, fixed_y_t* dst, int w) { |
270 | int i; |
271 | for (i = 0; i < w; ++i) { |
272 | const float R = GammaToLinearF(src[0 * w + i]); |
273 | const float G = GammaToLinearF(src[1 * w + i]); |
274 | const float B = GammaToLinearF(src[2 * w + i]); |
275 | const float Y = RGBToGrayF(R, G, B); |
276 | dst[i] = (fixed_y_t)LinearToGammaF(Y); |
277 | } |
278 | } |
279 | |
280 | static void UpdateChroma(const fixed_y_t* src1, const fixed_y_t* src2, |
281 | fixed_t* dst, int uv_w) { |
282 | int i; |
283 | for (i = 0; i < uv_w; ++i) { |
284 | const int r = ScaleDown(src1[0 * uv_w + 0], src1[0 * uv_w + 1], |
285 | src2[0 * uv_w + 0], src2[0 * uv_w + 1]); |
286 | const int g = ScaleDown(src1[2 * uv_w + 0], src1[2 * uv_w + 1], |
287 | src2[2 * uv_w + 0], src2[2 * uv_w + 1]); |
288 | const int b = ScaleDown(src1[4 * uv_w + 0], src1[4 * uv_w + 1], |
289 | src2[4 * uv_w + 0], src2[4 * uv_w + 1]); |
290 | const int W = RGBToGray(r, g, b); |
291 | dst[0 * uv_w] = (fixed_t)(r - W); |
292 | dst[1 * uv_w] = (fixed_t)(g - W); |
293 | dst[2 * uv_w] = (fixed_t)(b - W); |
294 | dst += 1; |
295 | src1 += 2; |
296 | src2 += 2; |
297 | } |
298 | } |
299 | |
300 | static void StoreGray(const fixed_y_t* rgb, fixed_y_t* y, int w) { |
301 | int i; |
302 | for (i = 0; i < w; ++i) { |
303 | y[i] = RGBToGray(rgb[0 * w + i], rgb[1 * w + i], rgb[2 * w + i]); |
304 | } |
305 | } |
306 | |
307 | //------------------------------------------------------------------------------ |
308 | |
309 | static WEBP_INLINE fixed_y_t Filter2(int A, int B, int W0) { |
310 | const int v0 = (A * 3 + B + 2) >> 2; |
311 | return clip_y(v0 + W0); |
312 | } |
313 | |
314 | //------------------------------------------------------------------------------ |
315 | |
316 | static WEBP_INLINE fixed_y_t UpLift(uint8_t a) { // 8bit -> SFIX |
317 | return ((fixed_y_t)a << SFIX) | SHALF; |
318 | } |
319 | |
320 | static void ImportOneRow(const uint8_t* const r_ptr, |
321 | const uint8_t* const g_ptr, |
322 | const uint8_t* const b_ptr, |
323 | int step, |
324 | int pic_width, |
325 | fixed_y_t* const dst) { |
326 | int i; |
327 | const int w = (pic_width + 1) & ~1; |
328 | for (i = 0; i < pic_width; ++i) { |
329 | const int off = i * step; |
330 | dst[i + 0 * w] = UpLift(r_ptr[off]); |
331 | dst[i + 1 * w] = UpLift(g_ptr[off]); |
332 | dst[i + 2 * w] = UpLift(b_ptr[off]); |
333 | } |
334 | if (pic_width & 1) { // replicate rightmost pixel |
335 | dst[pic_width + 0 * w] = dst[pic_width + 0 * w - 1]; |
336 | dst[pic_width + 1 * w] = dst[pic_width + 1 * w - 1]; |
337 | dst[pic_width + 2 * w] = dst[pic_width + 2 * w - 1]; |
338 | } |
339 | } |
340 | |
341 | static void InterpolateTwoRows(const fixed_y_t* const best_y, |
342 | const fixed_t* prev_uv, |
343 | const fixed_t* cur_uv, |
344 | const fixed_t* next_uv, |
345 | int w, |
346 | fixed_y_t* out1, |
347 | fixed_y_t* out2) { |
348 | const int uv_w = w >> 1; |
349 | const int len = (w - 1) >> 1; // length to filter |
350 | int k = 3; |
351 | while (k-- > 0) { // process each R/G/B segments in turn |
352 | // special boundary case for i==0 |
353 | out1[0] = Filter2(cur_uv[0], prev_uv[0], best_y[0]); |
354 | out2[0] = Filter2(cur_uv[0], next_uv[0], best_y[w]); |
355 | |
356 | WebPSharpYUVFilterRow(cur_uv, prev_uv, len, best_y + 0 + 1, out1 + 1); |
357 | WebPSharpYUVFilterRow(cur_uv, next_uv, len, best_y + w + 1, out2 + 1); |
358 | |
359 | // special boundary case for i == w - 1 when w is even |
360 | if (!(w & 1)) { |
361 | out1[w - 1] = Filter2(cur_uv[uv_w - 1], prev_uv[uv_w - 1], |
362 | best_y[w - 1 + 0]); |
363 | out2[w - 1] = Filter2(cur_uv[uv_w - 1], next_uv[uv_w - 1], |
364 | best_y[w - 1 + w]); |
365 | } |
366 | out1 += w; |
367 | out2 += w; |
368 | prev_uv += uv_w; |
369 | cur_uv += uv_w; |
370 | next_uv += uv_w; |
371 | } |
372 | } |
373 | |
374 | static WEBP_INLINE uint8_t ConvertRGBToY(int r, int g, int b) { |
375 | const int luma = 16839 * r + 33059 * g + 6420 * b + SROUNDER; |
376 | return clip_8b(16 + (luma >> (YUV_FIX + SFIX))); |
377 | } |
378 | |
379 | static WEBP_INLINE uint8_t ConvertRGBToU(int r, int g, int b) { |
380 | const int u = -9719 * r - 19081 * g + 28800 * b + SROUNDER; |
381 | return clip_8b(128 + (u >> (YUV_FIX + SFIX))); |
382 | } |
383 | |
384 | static WEBP_INLINE uint8_t ConvertRGBToV(int r, int g, int b) { |
385 | const int v = +28800 * r - 24116 * g - 4684 * b + SROUNDER; |
386 | return clip_8b(128 + (v >> (YUV_FIX + SFIX))); |
387 | } |
388 | |
389 | static int ConvertWRGBToYUV(const fixed_y_t* best_y, const fixed_t* best_uv, |
390 | WebPPicture* const picture) { |
391 | int i, j; |
392 | uint8_t* dst_y = picture->y; |
393 | uint8_t* dst_u = picture->u; |
394 | uint8_t* dst_v = picture->v; |
395 | const fixed_t* const best_uv_base = best_uv; |
396 | const int w = (picture->width + 1) & ~1; |
397 | const int h = (picture->height + 1) & ~1; |
398 | const int uv_w = w >> 1; |
399 | const int uv_h = h >> 1; |
400 | for (best_uv = best_uv_base, j = 0; j < picture->height; ++j) { |
401 | for (i = 0; i < picture->width; ++i) { |
402 | const int off = (i >> 1); |
403 | const int W = best_y[i]; |
404 | const int r = best_uv[off + 0 * uv_w] + W; |
405 | const int g = best_uv[off + 1 * uv_w] + W; |
406 | const int b = best_uv[off + 2 * uv_w] + W; |
407 | dst_y[i] = ConvertRGBToY(r, g, b); |
408 | } |
409 | best_y += w; |
410 | best_uv += (j & 1) * 3 * uv_w; |
411 | dst_y += picture->y_stride; |
412 | } |
413 | for (best_uv = best_uv_base, j = 0; j < uv_h; ++j) { |
414 | for (i = 0; i < uv_w; ++i) { |
415 | const int off = i; |
416 | const int r = best_uv[off + 0 * uv_w]; |
417 | const int g = best_uv[off + 1 * uv_w]; |
418 | const int b = best_uv[off + 2 * uv_w]; |
419 | dst_u[i] = ConvertRGBToU(r, g, b); |
420 | dst_v[i] = ConvertRGBToV(r, g, b); |
421 | } |
422 | best_uv += 3 * uv_w; |
423 | dst_u += picture->uv_stride; |
424 | dst_v += picture->uv_stride; |
425 | } |
426 | return 1; |
427 | } |
428 | |
429 | //------------------------------------------------------------------------------ |
430 | // Main function |
431 | |
432 | #define SAFE_ALLOC(W, H, T) ((T*)WebPSafeMalloc((W) * (H), sizeof(T))) |
433 | |
434 | static int PreprocessARGB(const uint8_t* r_ptr, |
435 | const uint8_t* g_ptr, |
436 | const uint8_t* b_ptr, |
437 | int step, int rgb_stride, |
438 | WebPPicture* const picture) { |
439 | // we expand the right/bottom border if needed |
440 | const int w = (picture->width + 1) & ~1; |
441 | const int h = (picture->height + 1) & ~1; |
442 | const int uv_w = w >> 1; |
443 | const int uv_h = h >> 1; |
444 | uint64_t prev_diff_y_sum = ~0; |
445 | int j, iter; |
446 | |
447 | // TODO(skal): allocate one big memory chunk. But for now, it's easier |
448 | // for valgrind debugging to have several chunks. |
449 | fixed_y_t* const tmp_buffer = SAFE_ALLOC(w * 3, 2, fixed_y_t); // scratch |
450 | fixed_y_t* const best_y_base = SAFE_ALLOC(w, h, fixed_y_t); |
451 | fixed_y_t* const target_y_base = SAFE_ALLOC(w, h, fixed_y_t); |
452 | fixed_y_t* const best_rgb_y = SAFE_ALLOC(w, 2, fixed_y_t); |
453 | fixed_t* const best_uv_base = SAFE_ALLOC(uv_w * 3, uv_h, fixed_t); |
454 | fixed_t* const target_uv_base = SAFE_ALLOC(uv_w * 3, uv_h, fixed_t); |
455 | fixed_t* const best_rgb_uv = SAFE_ALLOC(uv_w * 3, 1, fixed_t); |
456 | fixed_y_t* best_y = best_y_base; |
457 | fixed_y_t* target_y = target_y_base; |
458 | fixed_t* best_uv = best_uv_base; |
459 | fixed_t* target_uv = target_uv_base; |
460 | const uint64_t diff_y_threshold = (uint64_t)(3.0 * w * h); |
461 | int ok; |
462 | |
463 | if (best_y_base == NULL || best_uv_base == NULL || |
464 | target_y_base == NULL || target_uv_base == NULL || |
465 | best_rgb_y == NULL || best_rgb_uv == NULL || |
466 | tmp_buffer == NULL) { |
467 | ok = WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY); |
468 | goto End; |
469 | } |
470 | assert(picture->width >= kMinDimensionIterativeConversion); |
471 | assert(picture->height >= kMinDimensionIterativeConversion); |
472 | |
473 | WebPInitConvertARGBToYUV(); |
474 | |
475 | // Import RGB samples to W/RGB representation. |
476 | for (j = 0; j < picture->height; j += 2) { |
477 | const int is_last_row = (j == picture->height - 1); |
478 | fixed_y_t* const src1 = tmp_buffer + 0 * w; |
479 | fixed_y_t* const src2 = tmp_buffer + 3 * w; |
480 | |
481 | // prepare two rows of input |
482 | ImportOneRow(r_ptr, g_ptr, b_ptr, step, picture->width, src1); |
483 | if (!is_last_row) { |
484 | ImportOneRow(r_ptr + rgb_stride, g_ptr + rgb_stride, b_ptr + rgb_stride, |
485 | step, picture->width, src2); |
486 | } else { |
487 | memcpy(src2, src1, 3 * w * sizeof(*src2)); |
488 | } |
489 | StoreGray(src1, best_y + 0, w); |
490 | StoreGray(src2, best_y + w, w); |
491 | |
492 | UpdateW(src1, target_y, w); |
493 | UpdateW(src2, target_y + w, w); |
494 | UpdateChroma(src1, src2, target_uv, uv_w); |
495 | memcpy(best_uv, target_uv, 3 * uv_w * sizeof(*best_uv)); |
496 | best_y += 2 * w; |
497 | best_uv += 3 * uv_w; |
498 | target_y += 2 * w; |
499 | target_uv += 3 * uv_w; |
500 | r_ptr += 2 * rgb_stride; |
501 | g_ptr += 2 * rgb_stride; |
502 | b_ptr += 2 * rgb_stride; |
503 | } |
504 | |
505 | // Iterate and resolve clipping conflicts. |
506 | for (iter = 0; iter < kNumIterations; ++iter) { |
507 | const fixed_t* cur_uv = best_uv_base; |
508 | const fixed_t* prev_uv = best_uv_base; |
509 | uint64_t diff_y_sum = 0; |
510 | |
511 | best_y = best_y_base; |
512 | best_uv = best_uv_base; |
513 | target_y = target_y_base; |
514 | target_uv = target_uv_base; |
515 | for (j = 0; j < h; j += 2) { |
516 | fixed_y_t* const src1 = tmp_buffer + 0 * w; |
517 | fixed_y_t* const src2 = tmp_buffer + 3 * w; |
518 | { |
519 | const fixed_t* const next_uv = cur_uv + ((j < h - 2) ? 3 * uv_w : 0); |
520 | InterpolateTwoRows(best_y, prev_uv, cur_uv, next_uv, w, src1, src2); |
521 | prev_uv = cur_uv; |
522 | cur_uv = next_uv; |
523 | } |
524 | |
525 | UpdateW(src1, best_rgb_y + 0 * w, w); |
526 | UpdateW(src2, best_rgb_y + 1 * w, w); |
527 | UpdateChroma(src1, src2, best_rgb_uv, uv_w); |
528 | |
529 | // update two rows of Y and one row of RGB |
530 | diff_y_sum += WebPSharpYUVUpdateY(target_y, best_rgb_y, best_y, 2 * w); |
531 | WebPSharpYUVUpdateRGB(target_uv, best_rgb_uv, best_uv, 3 * uv_w); |
532 | |
533 | best_y += 2 * w; |
534 | best_uv += 3 * uv_w; |
535 | target_y += 2 * w; |
536 | target_uv += 3 * uv_w; |
537 | } |
538 | // test exit condition |
539 | if (iter > 0) { |
540 | if (diff_y_sum < diff_y_threshold) break; |
541 | if (diff_y_sum > prev_diff_y_sum) break; |
542 | } |
543 | prev_diff_y_sum = diff_y_sum; |
544 | } |
545 | // final reconstruction |
546 | ok = ConvertWRGBToYUV(best_y_base, best_uv_base, picture); |
547 | |
548 | End: |
549 | WebPSafeFree(best_y_base); |
550 | WebPSafeFree(best_uv_base); |
551 | WebPSafeFree(target_y_base); |
552 | WebPSafeFree(target_uv_base); |
553 | WebPSafeFree(best_rgb_y); |
554 | WebPSafeFree(best_rgb_uv); |
555 | WebPSafeFree(tmp_buffer); |
556 | return ok; |
557 | } |
558 | #undef SAFE_ALLOC |
559 | |
560 | //------------------------------------------------------------------------------ |
561 | // "Fast" regular RGB->YUV |
562 | |
563 | #define SUM4(ptr, step) LinearToGamma( \ |
564 | GammaToLinear((ptr)[0]) + \ |
565 | GammaToLinear((ptr)[(step)]) + \ |
566 | GammaToLinear((ptr)[rgb_stride]) + \ |
567 | GammaToLinear((ptr)[rgb_stride + (step)]), 0) \ |
568 | |
569 | #define SUM2(ptr) \ |
570 | LinearToGamma(GammaToLinear((ptr)[0]) + GammaToLinear((ptr)[rgb_stride]), 1) |
571 | |
572 | #define SUM2ALPHA(ptr) ((ptr)[0] + (ptr)[rgb_stride]) |
573 | #define SUM4ALPHA(ptr) (SUM2ALPHA(ptr) + SUM2ALPHA((ptr) + 4)) |
574 | |
575 | #if defined(USE_INVERSE_ALPHA_TABLE) |
576 | |
577 | static const int kAlphaFix = 19; |
578 | // Following table is (1 << kAlphaFix) / a. The (v * kInvAlpha[a]) >> kAlphaFix |
579 | // formula is then equal to v / a in most (99.6%) cases. Note that this table |
580 | // and constant are adjusted very tightly to fit 32b arithmetic. |
581 | // In particular, they use the fact that the operands for 'v / a' are actually |
582 | // derived as v = (a0.p0 + a1.p1 + a2.p2 + a3.p3) and a = a0 + a1 + a2 + a3 |
583 | // with ai in [0..255] and pi in [0..1<<kGammaFix). The constraint to avoid |
584 | // overflow is: kGammaFix + kAlphaFix <= 31. |
585 | static const uint32_t kInvAlpha[4 * 0xff + 1] = { |
586 | 0, /* alpha = 0 */ |
587 | 524288, 262144, 174762, 131072, 104857, 87381, 74898, 65536, |
588 | 58254, 52428, 47662, 43690, 40329, 37449, 34952, 32768, |
589 | 30840, 29127, 27594, 26214, 24966, 23831, 22795, 21845, |
590 | 20971, 20164, 19418, 18724, 18078, 17476, 16912, 16384, |
591 | 15887, 15420, 14979, 14563, 14169, 13797, 13443, 13107, |
592 | 12787, 12483, 12192, 11915, 11650, 11397, 11155, 10922, |
593 | 10699, 10485, 10280, 10082, 9892, 9709, 9532, 9362, |
594 | 9198, 9039, 8886, 8738, 8594, 8456, 8322, 8192, |
595 | 8065, 7943, 7825, 7710, 7598, 7489, 7384, 7281, |
596 | 7182, 7084, 6990, 6898, 6808, 6721, 6636, 6553, |
597 | 6472, 6393, 6316, 6241, 6168, 6096, 6026, 5957, |
598 | 5890, 5825, 5761, 5698, 5637, 5577, 5518, 5461, |
599 | 5405, 5349, 5295, 5242, 5190, 5140, 5090, 5041, |
600 | 4993, 4946, 4899, 4854, 4809, 4766, 4723, 4681, |
601 | 4639, 4599, 4559, 4519, 4481, 4443, 4405, 4369, |
602 | 4332, 4297, 4262, 4228, 4194, 4161, 4128, 4096, |
603 | 4064, 4032, 4002, 3971, 3942, 3912, 3883, 3855, |
604 | 3826, 3799, 3771, 3744, 3718, 3692, 3666, 3640, |
605 | 3615, 3591, 3566, 3542, 3518, 3495, 3472, 3449, |
606 | 3426, 3404, 3382, 3360, 3339, 3318, 3297, 3276, |
607 | 3256, 3236, 3216, 3196, 3177, 3158, 3139, 3120, |
608 | 3102, 3084, 3066, 3048, 3030, 3013, 2995, 2978, |
609 | 2962, 2945, 2928, 2912, 2896, 2880, 2864, 2849, |
610 | 2833, 2818, 2803, 2788, 2774, 2759, 2744, 2730, |
611 | 2716, 2702, 2688, 2674, 2661, 2647, 2634, 2621, |
612 | 2608, 2595, 2582, 2570, 2557, 2545, 2532, 2520, |
613 | 2508, 2496, 2484, 2473, 2461, 2449, 2438, 2427, |
614 | 2416, 2404, 2394, 2383, 2372, 2361, 2351, 2340, |
615 | 2330, 2319, 2309, 2299, 2289, 2279, 2269, 2259, |
616 | 2250, 2240, 2231, 2221, 2212, 2202, 2193, 2184, |
617 | 2175, 2166, 2157, 2148, 2139, 2131, 2122, 2114, |
618 | 2105, 2097, 2088, 2080, 2072, 2064, 2056, 2048, |
619 | 2040, 2032, 2024, 2016, 2008, 2001, 1993, 1985, |
620 | 1978, 1971, 1963, 1956, 1949, 1941, 1934, 1927, |
621 | 1920, 1913, 1906, 1899, 1892, 1885, 1879, 1872, |
622 | 1865, 1859, 1852, 1846, 1839, 1833, 1826, 1820, |
623 | 1814, 1807, 1801, 1795, 1789, 1783, 1777, 1771, |
624 | 1765, 1759, 1753, 1747, 1741, 1736, 1730, 1724, |
625 | 1718, 1713, 1707, 1702, 1696, 1691, 1685, 1680, |
626 | 1675, 1669, 1664, 1659, 1653, 1648, 1643, 1638, |
627 | 1633, 1628, 1623, 1618, 1613, 1608, 1603, 1598, |
628 | 1593, 1588, 1583, 1579, 1574, 1569, 1565, 1560, |
629 | 1555, 1551, 1546, 1542, 1537, 1533, 1528, 1524, |
630 | 1519, 1515, 1510, 1506, 1502, 1497, 1493, 1489, |
631 | 1485, 1481, 1476, 1472, 1468, 1464, 1460, 1456, |
632 | 1452, 1448, 1444, 1440, 1436, 1432, 1428, 1424, |
633 | 1420, 1416, 1413, 1409, 1405, 1401, 1398, 1394, |
634 | 1390, 1387, 1383, 1379, 1376, 1372, 1368, 1365, |
635 | 1361, 1358, 1354, 1351, 1347, 1344, 1340, 1337, |
636 | 1334, 1330, 1327, 1323, 1320, 1317, 1314, 1310, |
637 | 1307, 1304, 1300, 1297, 1294, 1291, 1288, 1285, |
638 | 1281, 1278, 1275, 1272, 1269, 1266, 1263, 1260, |
639 | 1257, 1254, 1251, 1248, 1245, 1242, 1239, 1236, |
640 | 1233, 1230, 1227, 1224, 1222, 1219, 1216, 1213, |
641 | 1210, 1208, 1205, 1202, 1199, 1197, 1194, 1191, |
642 | 1188, 1186, 1183, 1180, 1178, 1175, 1172, 1170, |
643 | 1167, 1165, 1162, 1159, 1157, 1154, 1152, 1149, |
644 | 1147, 1144, 1142, 1139, 1137, 1134, 1132, 1129, |
645 | 1127, 1125, 1122, 1120, 1117, 1115, 1113, 1110, |
646 | 1108, 1106, 1103, 1101, 1099, 1096, 1094, 1092, |
647 | 1089, 1087, 1085, 1083, 1081, 1078, 1076, 1074, |
648 | 1072, 1069, 1067, 1065, 1063, 1061, 1059, 1057, |
649 | 1054, 1052, 1050, 1048, 1046, 1044, 1042, 1040, |
650 | 1038, 1036, 1034, 1032, 1030, 1028, 1026, 1024, |
651 | 1022, 1020, 1018, 1016, 1014, 1012, 1010, 1008, |
652 | 1006, 1004, 1002, 1000, 998, 996, 994, 992, |
653 | 991, 989, 987, 985, 983, 981, 979, 978, |
654 | 976, 974, 972, 970, 969, 967, 965, 963, |
655 | 961, 960, 958, 956, 954, 953, 951, 949, |
656 | 948, 946, 944, 942, 941, 939, 937, 936, |
657 | 934, 932, 931, 929, 927, 926, 924, 923, |
658 | 921, 919, 918, 916, 914, 913, 911, 910, |
659 | 908, 907, 905, 903, 902, 900, 899, 897, |
660 | 896, 894, 893, 891, 890, 888, 887, 885, |
661 | 884, 882, 881, 879, 878, 876, 875, 873, |
662 | 872, 870, 869, 868, 866, 865, 863, 862, |
663 | 860, 859, 858, 856, 855, 853, 852, 851, |
664 | 849, 848, 846, 845, 844, 842, 841, 840, |
665 | 838, 837, 836, 834, 833, 832, 830, 829, |
666 | 828, 826, 825, 824, 823, 821, 820, 819, |
667 | 817, 816, 815, 814, 812, 811, 810, 809, |
668 | 807, 806, 805, 804, 802, 801, 800, 799, |
669 | 798, 796, 795, 794, 793, 791, 790, 789, |
670 | 788, 787, 786, 784, 783, 782, 781, 780, |
671 | 779, 777, 776, 775, 774, 773, 772, 771, |
672 | 769, 768, 767, 766, 765, 764, 763, 762, |
673 | 760, 759, 758, 757, 756, 755, 754, 753, |
674 | 752, 751, 750, 748, 747, 746, 745, 744, |
675 | 743, 742, 741, 740, 739, 738, 737, 736, |
676 | 735, 734, 733, 732, 731, 730, 729, 728, |
677 | 727, 726, 725, 724, 723, 722, 721, 720, |
678 | 719, 718, 717, 716, 715, 714, 713, 712, |
679 | 711, 710, 709, 708, 707, 706, 705, 704, |
680 | 703, 702, 701, 700, 699, 699, 698, 697, |
681 | 696, 695, 694, 693, 692, 691, 690, 689, |
682 | 688, 688, 687, 686, 685, 684, 683, 682, |
683 | 681, 680, 680, 679, 678, 677, 676, 675, |
684 | 674, 673, 673, 672, 671, 670, 669, 668, |
685 | 667, 667, 666, 665, 664, 663, 662, 661, |
686 | 661, 660, 659, 658, 657, 657, 656, 655, |
687 | 654, 653, 652, 652, 651, 650, 649, 648, |
688 | 648, 647, 646, 645, 644, 644, 643, 642, |
689 | 641, 640, 640, 639, 638, 637, 637, 636, |
690 | 635, 634, 633, 633, 632, 631, 630, 630, |
691 | 629, 628, 627, 627, 626, 625, 624, 624, |
692 | 623, 622, 621, 621, 620, 619, 618, 618, |
693 | 617, 616, 616, 615, 614, 613, 613, 612, |
694 | 611, 611, 610, 609, 608, 608, 607, 606, |
695 | 606, 605, 604, 604, 603, 602, 601, 601, |
696 | 600, 599, 599, 598, 597, 597, 596, 595, |
697 | 595, 594, 593, 593, 592, 591, 591, 590, |
698 | 589, 589, 588, 587, 587, 586, 585, 585, |
699 | 584, 583, 583, 582, 581, 581, 580, 579, |
700 | 579, 578, 578, 577, 576, 576, 575, 574, |
701 | 574, 573, 572, 572, 571, 571, 570, 569, |
702 | 569, 568, 568, 567, 566, 566, 565, 564, |
703 | 564, 563, 563, 562, 561, 561, 560, 560, |
704 | 559, 558, 558, 557, 557, 556, 555, 555, |
705 | 554, 554, 553, 553, 552, 551, 551, 550, |
706 | 550, 549, 548, 548, 547, 547, 546, 546, |
707 | 545, 544, 544, 543, 543, 542, 542, 541, |
708 | 541, 540, 539, 539, 538, 538, 537, 537, |
709 | 536, 536, 535, 534, 534, 533, 533, 532, |
710 | 532, 531, 531, 530, 530, 529, 529, 528, |
711 | 527, 527, 526, 526, 525, 525, 524, 524, |
712 | 523, 523, 522, 522, 521, 521, 520, 520, |
713 | 519, 519, 518, 518, 517, 517, 516, 516, |
714 | 515, 515, 514, 514 |
715 | }; |
716 | |
717 | // Note that LinearToGamma() expects the values to be premultiplied by 4, |
718 | // so we incorporate this factor 4 inside the DIVIDE_BY_ALPHA macro directly. |
719 | #define DIVIDE_BY_ALPHA(sum, a) (((sum) * kInvAlpha[(a)]) >> (kAlphaFix - 2)) |
720 | |
721 | #else |
722 | |
723 | #define DIVIDE_BY_ALPHA(sum, a) (4 * (sum) / (a)) |
724 | |
725 | #endif // USE_INVERSE_ALPHA_TABLE |
726 | |
727 | static WEBP_INLINE int LinearToGammaWeighted(const uint8_t* src, |
728 | const uint8_t* a_ptr, |
729 | uint32_t total_a, int step, |
730 | int rgb_stride) { |
731 | const uint32_t sum = |
732 | a_ptr[0] * GammaToLinear(src[0]) + |
733 | a_ptr[step] * GammaToLinear(src[step]) + |
734 | a_ptr[rgb_stride] * GammaToLinear(src[rgb_stride]) + |
735 | a_ptr[rgb_stride + step] * GammaToLinear(src[rgb_stride + step]); |
736 | assert(total_a > 0 && total_a <= 4 * 0xff); |
737 | #if defined(USE_INVERSE_ALPHA_TABLE) |
738 | assert((uint64_t)sum * kInvAlpha[total_a] < ((uint64_t)1 << 32)); |
739 | #endif |
740 | return LinearToGamma(DIVIDE_BY_ALPHA(sum, total_a), 0); |
741 | } |
742 | |
743 | static WEBP_INLINE void ConvertRowToY(const uint8_t* const r_ptr, |
744 | const uint8_t* const g_ptr, |
745 | const uint8_t* const b_ptr, |
746 | int step, |
747 | uint8_t* const dst_y, |
748 | int width, |
749 | VP8Random* const rg) { |
750 | int i, j; |
751 | for (i = 0, j = 0; i < width; i += 1, j += step) { |
752 | dst_y[i] = RGBToY(r_ptr[j], g_ptr[j], b_ptr[j], rg); |
753 | } |
754 | } |
755 | |
756 | static WEBP_INLINE void AccumulateRGBA(const uint8_t* const r_ptr, |
757 | const uint8_t* const g_ptr, |
758 | const uint8_t* const b_ptr, |
759 | const uint8_t* const a_ptr, |
760 | int rgb_stride, |
761 | uint16_t* dst, int width) { |
762 | int i, j; |
763 | // we loop over 2x2 blocks and produce one R/G/B/A value for each. |
764 | for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * 4, dst += 4) { |
765 | const uint32_t a = SUM4ALPHA(a_ptr + j); |
766 | int r, g, b; |
767 | if (a == 4 * 0xff || a == 0) { |
768 | r = SUM4(r_ptr + j, 4); |
769 | g = SUM4(g_ptr + j, 4); |
770 | b = SUM4(b_ptr + j, 4); |
771 | } else { |
772 | r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 4, rgb_stride); |
773 | g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 4, rgb_stride); |
774 | b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 4, rgb_stride); |
775 | } |
776 | dst[0] = r; |
777 | dst[1] = g; |
778 | dst[2] = b; |
779 | dst[3] = a; |
780 | } |
781 | if (width & 1) { |
782 | const uint32_t a = 2u * SUM2ALPHA(a_ptr + j); |
783 | int r, g, b; |
784 | if (a == 4 * 0xff || a == 0) { |
785 | r = SUM2(r_ptr + j); |
786 | g = SUM2(g_ptr + j); |
787 | b = SUM2(b_ptr + j); |
788 | } else { |
789 | r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 0, rgb_stride); |
790 | g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 0, rgb_stride); |
791 | b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 0, rgb_stride); |
792 | } |
793 | dst[0] = r; |
794 | dst[1] = g; |
795 | dst[2] = b; |
796 | dst[3] = a; |
797 | } |
798 | } |
799 | |
800 | static WEBP_INLINE void AccumulateRGB(const uint8_t* const r_ptr, |
801 | const uint8_t* const g_ptr, |
802 | const uint8_t* const b_ptr, |
803 | int step, int rgb_stride, |
804 | uint16_t* dst, int width) { |
805 | int i, j; |
806 | for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * step, dst += 4) { |
807 | dst[0] = SUM4(r_ptr + j, step); |
808 | dst[1] = SUM4(g_ptr + j, step); |
809 | dst[2] = SUM4(b_ptr + j, step); |
810 | } |
811 | if (width & 1) { |
812 | dst[0] = SUM2(r_ptr + j); |
813 | dst[1] = SUM2(g_ptr + j); |
814 | dst[2] = SUM2(b_ptr + j); |
815 | } |
816 | } |
817 | |
818 | static WEBP_INLINE void ConvertRowsToUV(const uint16_t* rgb, |
819 | uint8_t* const dst_u, |
820 | uint8_t* const dst_v, |
821 | int width, |
822 | VP8Random* const rg) { |
823 | int i; |
824 | for (i = 0; i < width; i += 1, rgb += 4) { |
825 | const int r = rgb[0], g = rgb[1], b = rgb[2]; |
826 | dst_u[i] = RGBToU(r, g, b, rg); |
827 | dst_v[i] = RGBToV(r, g, b, rg); |
828 | } |
829 | } |
830 | |
831 | static int ImportYUVAFromRGBA(const uint8_t* r_ptr, |
832 | const uint8_t* g_ptr, |
833 | const uint8_t* b_ptr, |
834 | const uint8_t* a_ptr, |
835 | int step, // bytes per pixel |
836 | int rgb_stride, // bytes per scanline |
837 | float dithering, |
838 | int use_iterative_conversion, |
839 | WebPPicture* const picture) { |
840 | int y; |
841 | const int width = picture->width; |
842 | const int height = picture->height; |
843 | const int has_alpha = CheckNonOpaque(a_ptr, width, height, step, rgb_stride); |
844 | const int is_rgb = (r_ptr < b_ptr); // otherwise it's bgr |
845 | |
846 | picture->colorspace = has_alpha ? WEBP_YUV420A : WEBP_YUV420; |
847 | picture->use_argb = 0; |
848 | |
849 | // disable smart conversion if source is too small (overkill). |
850 | if (width < kMinDimensionIterativeConversion || |
851 | height < kMinDimensionIterativeConversion) { |
852 | use_iterative_conversion = 0; |
853 | } |
854 | |
855 | if (!WebPPictureAllocYUVA(picture, width, height)) { |
856 | return 0; |
857 | } |
858 | if (has_alpha) { |
859 | WebPInitAlphaProcessing(); |
860 | assert(step == 4); |
861 | #if defined(USE_GAMMA_COMPRESSION) && defined(USE_INVERSE_ALPHA_TABLE) |
862 | assert(kAlphaFix + kGammaFix <= 31); |
863 | #endif |
864 | } |
865 | |
866 | if (use_iterative_conversion) { |
867 | InitGammaTablesF(); |
868 | if (!PreprocessARGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, picture)) { |
869 | return 0; |
870 | } |
871 | if (has_alpha) { |
872 | WebPExtractAlpha(a_ptr, rgb_stride, width, height, |
873 | picture->a, picture->a_stride); |
874 | } |
875 | } else { |
876 | const int uv_width = (width + 1) >> 1; |
877 | int use_dsp = (step == 3); // use special function in this case |
878 | // temporary storage for accumulated R/G/B values during conversion to U/V |
879 | uint16_t* const tmp_rgb = |
880 | (uint16_t*)WebPSafeMalloc(4 * uv_width, sizeof(*tmp_rgb)); |
881 | uint8_t* dst_y = picture->y; |
882 | uint8_t* dst_u = picture->u; |
883 | uint8_t* dst_v = picture->v; |
884 | uint8_t* dst_a = picture->a; |
885 | |
886 | VP8Random base_rg; |
887 | VP8Random* rg = NULL; |
888 | if (dithering > 0.) { |
889 | VP8InitRandom(&base_rg, dithering); |
890 | rg = &base_rg; |
891 | use_dsp = 0; // can't use dsp in this case |
892 | } |
893 | WebPInitConvertARGBToYUV(); |
894 | InitGammaTables(); |
895 | |
896 | if (tmp_rgb == NULL) return 0; // malloc error |
897 | |
898 | // Downsample Y/U/V planes, two rows at a time |
899 | for (y = 0; y < (height >> 1); ++y) { |
900 | int rows_have_alpha = has_alpha; |
901 | if (use_dsp) { |
902 | if (is_rgb) { |
903 | WebPConvertRGB24ToY(r_ptr, dst_y, width); |
904 | WebPConvertRGB24ToY(r_ptr + rgb_stride, |
905 | dst_y + picture->y_stride, width); |
906 | } else { |
907 | WebPConvertBGR24ToY(b_ptr, dst_y, width); |
908 | WebPConvertBGR24ToY(b_ptr + rgb_stride, |
909 | dst_y + picture->y_stride, width); |
910 | } |
911 | } else { |
912 | ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg); |
913 | ConvertRowToY(r_ptr + rgb_stride, |
914 | g_ptr + rgb_stride, |
915 | b_ptr + rgb_stride, step, |
916 | dst_y + picture->y_stride, width, rg); |
917 | } |
918 | dst_y += 2 * picture->y_stride; |
919 | if (has_alpha) { |
920 | rows_have_alpha &= !WebPExtractAlpha(a_ptr, rgb_stride, width, 2, |
921 | dst_a, picture->a_stride); |
922 | dst_a += 2 * picture->a_stride; |
923 | } |
924 | // Collect averaged R/G/B(/A) |
925 | if (!rows_have_alpha) { |
926 | AccumulateRGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, tmp_rgb, width); |
927 | } else { |
928 | AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, rgb_stride, tmp_rgb, width); |
929 | } |
930 | // Convert to U/V |
931 | if (rg == NULL) { |
932 | WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width); |
933 | } else { |
934 | ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg); |
935 | } |
936 | dst_u += picture->uv_stride; |
937 | dst_v += picture->uv_stride; |
938 | r_ptr += 2 * rgb_stride; |
939 | b_ptr += 2 * rgb_stride; |
940 | g_ptr += 2 * rgb_stride; |
941 | if (has_alpha) a_ptr += 2 * rgb_stride; |
942 | } |
943 | if (height & 1) { // extra last row |
944 | int row_has_alpha = has_alpha; |
945 | if (use_dsp) { |
946 | if (r_ptr < b_ptr) { |
947 | WebPConvertRGB24ToY(r_ptr, dst_y, width); |
948 | } else { |
949 | WebPConvertBGR24ToY(b_ptr, dst_y, width); |
950 | } |
951 | } else { |
952 | ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg); |
953 | } |
954 | if (row_has_alpha) { |
955 | row_has_alpha &= !WebPExtractAlpha(a_ptr, 0, width, 1, dst_a, 0); |
956 | } |
957 | // Collect averaged R/G/B(/A) |
958 | if (!row_has_alpha) { |
959 | // Collect averaged R/G/B |
960 | AccumulateRGB(r_ptr, g_ptr, b_ptr, step, /* rgb_stride = */ 0, |
961 | tmp_rgb, width); |
962 | } else { |
963 | AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, /* rgb_stride = */ 0, |
964 | tmp_rgb, width); |
965 | } |
966 | if (rg == NULL) { |
967 | WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width); |
968 | } else { |
969 | ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg); |
970 | } |
971 | } |
972 | WebPSafeFree(tmp_rgb); |
973 | } |
974 | return 1; |
975 | } |
976 | |
977 | #undef SUM4 |
978 | #undef SUM2 |
979 | #undef SUM4ALPHA |
980 | #undef SUM2ALPHA |
981 | |
982 | //------------------------------------------------------------------------------ |
983 | // call for ARGB->YUVA conversion |
984 | |
985 | static int PictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace, |
986 | float dithering, int use_iterative_conversion) { |
987 | if (picture == NULL) return 0; |
988 | if (picture->argb == NULL) { |
989 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
990 | } else if ((colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) { |
991 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION); |
992 | } else { |
993 | const uint8_t* const argb = (const uint8_t*)picture->argb; |
994 | const uint8_t* const r = ALPHA_IS_LAST ? argb + 2 : argb + 1; |
995 | const uint8_t* const g = ALPHA_IS_LAST ? argb + 1 : argb + 2; |
996 | const uint8_t* const b = ALPHA_IS_LAST ? argb + 0 : argb + 3; |
997 | const uint8_t* const a = ALPHA_IS_LAST ? argb + 3 : argb + 0; |
998 | |
999 | picture->colorspace = WEBP_YUV420; |
1000 | return ImportYUVAFromRGBA(r, g, b, a, 4, 4 * picture->argb_stride, |
1001 | dithering, use_iterative_conversion, picture); |
1002 | } |
1003 | } |
1004 | |
1005 | int WebPPictureARGBToYUVADithered(WebPPicture* picture, WebPEncCSP colorspace, |
1006 | float dithering) { |
1007 | return PictureARGBToYUVA(picture, colorspace, dithering, 0); |
1008 | } |
1009 | |
1010 | int WebPPictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace) { |
1011 | return PictureARGBToYUVA(picture, colorspace, 0.f, 0); |
1012 | } |
1013 | |
1014 | int WebPPictureSharpARGBToYUVA(WebPPicture* picture) { |
1015 | return PictureARGBToYUVA(picture, WEBP_YUV420, 0.f, 1); |
1016 | } |
1017 | // for backward compatibility |
1018 | int WebPPictureSmartARGBToYUVA(WebPPicture* picture) { |
1019 | return WebPPictureSharpARGBToYUVA(picture); |
1020 | } |
1021 | |
1022 | //------------------------------------------------------------------------------ |
1023 | // call for YUVA -> ARGB conversion |
1024 | |
1025 | int WebPPictureYUVAToARGB(WebPPicture* picture) { |
1026 | if (picture == NULL) return 0; |
1027 | if (picture->y == NULL || picture->u == NULL || picture->v == NULL) { |
1028 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
1029 | } |
1030 | if ((picture->colorspace & WEBP_CSP_ALPHA_BIT) && picture->a == NULL) { |
1031 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
1032 | } |
1033 | if ((picture->colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) { |
1034 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION); |
1035 | } |
1036 | // Allocate a new argb buffer (discarding the previous one). |
1037 | if (!WebPPictureAllocARGB(picture, picture->width, picture->height)) return 0; |
1038 | picture->use_argb = 1; |
1039 | |
1040 | // Convert |
1041 | { |
1042 | int y; |
1043 | const int width = picture->width; |
1044 | const int height = picture->height; |
1045 | const int argb_stride = 4 * picture->argb_stride; |
1046 | uint8_t* dst = (uint8_t*)picture->argb; |
1047 | const uint8_t *cur_u = picture->u, *cur_v = picture->v, *cur_y = picture->y; |
1048 | WebPUpsampleLinePairFunc upsample = WebPGetLinePairConverter(ALPHA_IS_LAST); |
1049 | |
1050 | // First row, with replicated top samples. |
1051 | upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width); |
1052 | cur_y += picture->y_stride; |
1053 | dst += argb_stride; |
1054 | // Center rows. |
1055 | for (y = 1; y + 1 < height; y += 2) { |
1056 | const uint8_t* const top_u = cur_u; |
1057 | const uint8_t* const top_v = cur_v; |
1058 | cur_u += picture->uv_stride; |
1059 | cur_v += picture->uv_stride; |
1060 | upsample(cur_y, cur_y + picture->y_stride, top_u, top_v, cur_u, cur_v, |
1061 | dst, dst + argb_stride, width); |
1062 | cur_y += 2 * picture->y_stride; |
1063 | dst += 2 * argb_stride; |
1064 | } |
1065 | // Last row (if needed), with replicated bottom samples. |
1066 | if (height > 1 && !(height & 1)) { |
1067 | upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width); |
1068 | } |
1069 | // Insert alpha values if needed, in replacement for the default 0xff ones. |
1070 | if (picture->colorspace & WEBP_CSP_ALPHA_BIT) { |
1071 | for (y = 0; y < height; ++y) { |
1072 | uint32_t* const argb_dst = picture->argb + y * picture->argb_stride; |
1073 | const uint8_t* const src = picture->a + y * picture->a_stride; |
1074 | int x; |
1075 | for (x = 0; x < width; ++x) { |
1076 | argb_dst[x] = (argb_dst[x] & 0x00ffffffu) | ((uint32_t)src[x] << 24); |
1077 | } |
1078 | } |
1079 | } |
1080 | } |
1081 | return 1; |
1082 | } |
1083 | |
1084 | //------------------------------------------------------------------------------ |
1085 | // automatic import / conversion |
1086 | |
1087 | static int Import(WebPPicture* const picture, |
1088 | const uint8_t* const rgb, int rgb_stride, |
1089 | int step, int swap_rb, int import_alpha) { |
1090 | int y; |
1091 | const uint8_t* r_ptr = rgb + (swap_rb ? 2 : 0); |
1092 | const uint8_t* g_ptr = rgb + 1; |
1093 | const uint8_t* b_ptr = rgb + (swap_rb ? 0 : 2); |
1094 | const uint8_t* a_ptr = import_alpha ? rgb + 3 : NULL; |
1095 | const int width = picture->width; |
1096 | const int height = picture->height; |
1097 | |
1098 | if (!picture->use_argb) { |
1099 | return ImportYUVAFromRGBA(r_ptr, g_ptr, b_ptr, a_ptr, step, rgb_stride, |
1100 | 0.f /* no dithering */, 0, picture); |
1101 | } |
1102 | if (!WebPPictureAlloc(picture)) return 0; |
1103 | |
1104 | VP8EncDspARGBInit(); |
1105 | |
1106 | if (import_alpha) { |
1107 | uint32_t* dst = picture->argb; |
1108 | assert(step == 4); |
1109 | for (y = 0; y < height; ++y) { |
1110 | VP8PackARGB(a_ptr, r_ptr, g_ptr, b_ptr, width, dst); |
1111 | a_ptr += rgb_stride; |
1112 | r_ptr += rgb_stride; |
1113 | g_ptr += rgb_stride; |
1114 | b_ptr += rgb_stride; |
1115 | dst += picture->argb_stride; |
1116 | } |
1117 | } else { |
1118 | uint32_t* dst = picture->argb; |
1119 | assert(step >= 3); |
1120 | for (y = 0; y < height; ++y) { |
1121 | VP8PackRGB(r_ptr, g_ptr, b_ptr, width, step, dst); |
1122 | r_ptr += rgb_stride; |
1123 | g_ptr += rgb_stride; |
1124 | b_ptr += rgb_stride; |
1125 | dst += picture->argb_stride; |
1126 | } |
1127 | } |
1128 | return 1; |
1129 | } |
1130 | |
1131 | // Public API |
1132 | |
1133 | int WebPPictureImportRGB(WebPPicture* picture, |
1134 | const uint8_t* rgb, int rgb_stride) { |
1135 | return (picture != NULL && rgb != NULL) |
1136 | ? Import(picture, rgb, rgb_stride, 3, 0, 0) |
1137 | : 0; |
1138 | } |
1139 | |
1140 | int WebPPictureImportBGR(WebPPicture* picture, |
1141 | const uint8_t* rgb, int rgb_stride) { |
1142 | return (picture != NULL && rgb != NULL) |
1143 | ? Import(picture, rgb, rgb_stride, 3, 1, 0) |
1144 | : 0; |
1145 | } |
1146 | |
1147 | int WebPPictureImportRGBA(WebPPicture* picture, |
1148 | const uint8_t* rgba, int rgba_stride) { |
1149 | return (picture != NULL && rgba != NULL) |
1150 | ? Import(picture, rgba, rgba_stride, 4, 0, 1) |
1151 | : 0; |
1152 | } |
1153 | |
1154 | int WebPPictureImportBGRA(WebPPicture* picture, |
1155 | const uint8_t* rgba, int rgba_stride) { |
1156 | return (picture != NULL && rgba != NULL) |
1157 | ? Import(picture, rgba, rgba_stride, 4, 1, 1) |
1158 | : 0; |
1159 | } |
1160 | |
1161 | int WebPPictureImportRGBX(WebPPicture* picture, |
1162 | const uint8_t* rgba, int rgba_stride) { |
1163 | return (picture != NULL && rgba != NULL) |
1164 | ? Import(picture, rgba, rgba_stride, 4, 0, 0) |
1165 | : 0; |
1166 | } |
1167 | |
1168 | int WebPPictureImportBGRX(WebPPicture* picture, |
1169 | const uint8_t* rgba, int rgba_stride) { |
1170 | return (picture != NULL && rgba != NULL) |
1171 | ? Import(picture, rgba, rgba_stride, 4, 1, 0) |
1172 | : 0; |
1173 | } |
1174 | |
1175 | //------------------------------------------------------------------------------ |
1176 | |