| 1 | // Copyright 2014 Google Inc. All Rights Reserved. |
| 2 | // |
| 3 | // Use of this source code is governed by a BSD-style license |
| 4 | // that can be found in the COPYING file in the root of the source |
| 5 | // tree. An additional intellectual property rights grant can be found |
| 6 | // in the file PATENTS. All contributing project authors may |
| 7 | // be found in the AUTHORS file in the root of the source tree. |
| 8 | // ----------------------------------------------------------------------------- |
| 9 | // |
| 10 | // WebPPicture utils for colorspace conversion |
| 11 | // |
| 12 | // Author: Skal (pascal.massimino@gmail.com) |
| 13 | |
| 14 | #include <assert.h> |
| 15 | #include <stdlib.h> |
| 16 | #include <math.h> |
| 17 | |
| 18 | #include "./vp8i_enc.h" |
| 19 | #include "../utils/random_utils.h" |
| 20 | #include "../utils/utils.h" |
| 21 | #include "../dsp/yuv.h" |
| 22 | |
// Gamma-compression during RGB->U/V averaging is enabled while this macro is
// defined. Comment the line out to disable it (the '#else' variants of
// InitGammaTables() / GammaToLinear() / LinearToGamma() are then compiled).
#define USE_GAMMA_COMPRESSION

// If defined, use table to compute x / alpha (see kInvAlpha[] and
// DIVIDE_BY_ALPHA); otherwise a plain integer division is used.
#define USE_INVERSE_ALPHA_TABLE
| 28 | |
// Endianness probe: the 32-bit word 0xff000000 is stored through 'argb' and
// inspected byte-by-byte through 'bytes'.
static const union {
  uint32_t argb;
  uint8_t bytes[4];
} test_endian = { 0xff000000u };
// Non-zero when the most significant byte of a uint32_t (the 0xff written
// above) is the last of its four bytes in memory.
#define ALPHA_IS_LAST (test_endian.bytes[3] == 0xff)
| 34 | |
| 35 | //------------------------------------------------------------------------------ |
| 36 | // Detection of non-trivial transparency |
| 37 | |
// Scans 'height' rows of 'width' alpha samples and returns 1 as soon as a
// sample different from 0xff is met, 0 otherwise (also when alpha is NULL).
// Consecutive samples of a row are 'x_step' bytes apart, consecutive rows are
// 'y_step' bytes apart.
static int CheckNonOpaque(const uint8_t* alpha, int width, int height,
                          int x_step, int y_step) {
  int row;
  if (alpha == NULL) return 0;
  for (row = 0; row < height; ++row, alpha += y_step) {
    const int row_end = width * x_step;
    int pos;
    // TODO(skal): check 4/8 bytes at a time.
    for (pos = 0; pos < row_end; pos += x_step) {
      if (alpha[pos] != 0xff) return 1;
    }
  }
  return 0;
}
| 51 | |
| 52 | // Checking for the presence of non-opaque alpha. |
| 53 | int WebPPictureHasTransparency(const WebPPicture* picture) { |
| 54 | if (picture == NULL) return 0; |
| 55 | if (!picture->use_argb) { |
| 56 | return CheckNonOpaque(picture->a, picture->width, picture->height, |
| 57 | 1, picture->a_stride); |
| 58 | } else { |
| 59 | int x, y; |
| 60 | const uint32_t* argb = picture->argb; |
| 61 | if (argb == NULL) return 0; |
| 62 | for (y = 0; y < picture->height; ++y) { |
| 63 | for (x = 0; x < picture->width; ++x) { |
| 64 | if (argb[x] < 0xff000000u) return 1; // test any alpha values != 0xff |
| 65 | } |
| 66 | argb += picture->argb_stride; |
| 67 | } |
| 68 | } |
| 69 | return 0; |
| 70 | } |
| 71 | |
| 72 | //------------------------------------------------------------------------------ |
| 73 | // Code for gamma correction |
| 74 | |
| 75 | #if defined(USE_GAMMA_COMPRESSION) |
| 76 | |
// gamma-compensates loss of resolution during chroma subsampling
#define kGamma 0.80 // for now we use a different gamma value than kGammaF
#define kGammaFix 12 // fixed-point precision for linear values
#define kGammaScale ((1 << kGammaFix) - 1)  // largest linear value
#define kGammaTabFix 7 // fixed-point fractional bits precision
#define kGammaTabScale (1 << kGammaTabFix)
#define kGammaTabRounder (kGammaTabScale >> 1)  // half of kGammaTabScale
#define kGammaTabSize (1 << (kGammaFix - kGammaTabFix))

// Linear -> gamma table. It has one extra entry because Interpolate() reads
// both kLinearToGammaTab[tab_pos] and kLinearToGammaTab[tab_pos + 1].
static int kLinearToGammaTab[kGammaTabSize + 1];
// Gamma -> linear table, indexed by an 8-bit sample.
static uint16_t kGammaToLinearTab[256];
// Set to 1 by InitGammaTables() once both tables above are filled.
static volatile int kGammaTablesOk = 0;
| 89 | |
| 90 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) { |
| 91 | if (!kGammaTablesOk) { |
| 92 | int v; |
| 93 | const double scale = (double)(1 << kGammaTabFix) / kGammaScale; |
| 94 | const double norm = 1. / 255.; |
| 95 | for (v = 0; v <= 255; ++v) { |
| 96 | kGammaToLinearTab[v] = |
| 97 | (uint16_t)(pow(norm * v, kGamma) * kGammaScale + .5); |
| 98 | } |
| 99 | for (v = 0; v <= kGammaTabSize; ++v) { |
| 100 | kLinearToGammaTab[v] = (int)(255. * pow(scale * v, 1. / kGamma) + .5); |
| 101 | } |
| 102 | kGammaTablesOk = 1; |
| 103 | } |
| 104 | } |
| 105 | |
| 106 | static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { |
| 107 | return kGammaToLinearTab[v]; |
| 108 | } |
| 109 | |
| 110 | static WEBP_INLINE int Interpolate(int v) { |
| 111 | const int tab_pos = v >> (kGammaTabFix + 2); // integer part |
| 112 | const int x = v & ((kGammaTabScale << 2) - 1); // fractional part |
| 113 | const int v0 = kLinearToGammaTab[tab_pos]; |
| 114 | const int v1 = kLinearToGammaTab[tab_pos + 1]; |
| 115 | const int y = v1 * x + v0 * ((kGammaTabScale << 2) - x); // interpolate |
| 116 | assert(tab_pos + 1 < kGammaTabSize + 1); |
| 117 | return y; |
| 118 | } |
| 119 | |
| 120 | // Convert a linear value 'v' to YUV_FIX+2 fixed-point precision |
| 121 | // U/V value, suitable for RGBToU/V calls. |
| 122 | static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) { |
| 123 | const int y = Interpolate(base_value << shift); // final uplifted value |
| 124 | return (y + kGammaTabRounder) >> kGammaTabFix; // descale |
| 125 | } |
| 126 | |
| 127 | #else |
| 128 | |
| 129 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTables(void) {} |
| 130 | static WEBP_INLINE uint32_t GammaToLinear(uint8_t v) { return v; } |
| 131 | static WEBP_INLINE int LinearToGamma(uint32_t base_value, int shift) { |
| 132 | return (int)(base_value << shift); |
| 133 | } |
| 134 | |
| 135 | #endif // USE_GAMMA_COMPRESSION |
| 136 | |
| 137 | //------------------------------------------------------------------------------ |
| 138 | // RGB -> YUV conversion |
| 139 | |
| 140 | static int RGBToY(int r, int g, int b, VP8Random* const rg) { |
| 141 | return (rg == NULL) ? VP8RGBToY(r, g, b, YUV_HALF) |
| 142 | : VP8RGBToY(r, g, b, VP8RandomBits(rg, YUV_FIX)); |
| 143 | } |
| 144 | |
| 145 | static int RGBToU(int r, int g, int b, VP8Random* const rg) { |
| 146 | return (rg == NULL) ? VP8RGBToU(r, g, b, YUV_HALF << 2) |
| 147 | : VP8RGBToU(r, g, b, VP8RandomBits(rg, YUV_FIX + 2)); |
| 148 | } |
| 149 | |
| 150 | static int RGBToV(int r, int g, int b, VP8Random* const rg) { |
| 151 | return (rg == NULL) ? VP8RGBToV(r, g, b, YUV_HALF << 2) |
| 152 | : VP8RGBToV(r, g, b, VP8RandomBits(rg, YUV_FIX + 2)); |
| 153 | } |
| 154 | |
| 155 | //------------------------------------------------------------------------------ |
| 156 | // Sharp RGB->YUV conversion |
| 157 | |
// Upper bound on the number of refinement passes run by PreprocessARGB().
static const int kNumIterations = 4;
// PreprocessARGB() asserts that the picture width and height are at least
// this large.
static const int kMinDimensionIterativeConversion = 4;

// We could use SFIX=0 and only uint8_t for fixed_y_t, but it produces some
// banding sometimes. Better use extra precision.
#define SFIX 2 // fixed-point precision of RGB and Y/W
typedef int16_t fixed_t; // signed type with extra SFIX precision for UV
typedef uint16_t fixed_y_t; // unsigned type with extra SFIX precision for W

// Half of one SFIX unit; UpLift() ORs it into the up-shifted 8-bit value.
#define SHALF (1 << SFIX >> 1)
// Largest value representable with 8 + SFIX bits; upper clipping bound used
// by clip_y() and size of the float gamma table.
#define MAX_Y_T ((256 << SFIX) - 1)
// Rounding constant added before shifting right by (YUV_FIX + SFIX).
#define SROUNDER (1 << (YUV_FIX + SFIX - 1))
| 170 | |
| 171 | #if defined(USE_GAMMA_COMPRESSION) |
| 172 | |
// float variant of gamma-correction
// We use tables of different size and precision for the Rec709
// transfer function.
#define kGammaF (1./0.45)
// Gamma -> linear table, one entry per value in [0, MAX_Y_T].
static float kGammaToLinearTabF[MAX_Y_T + 1]; // size scales with SFIX
// Linear -> gamma table. Entry kGammaTabSize + 1 duplicates the previous one
// (see InitGammaTablesF()) so that interpolation may read one past the end.
static float kLinearToGammaTabF[kGammaTabSize + 2];
// Set to 1 by InitGammaTablesF() once both tables above are filled.
static volatile int kGammaTablesFOk = 0;
| 180 | |
| 181 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) { |
| 182 | if (!kGammaTablesFOk) { |
| 183 | int v; |
| 184 | const double norm = 1. / MAX_Y_T; |
| 185 | const double scale = 1. / kGammaTabSize; |
| 186 | const double a = 0.099; |
| 187 | const double thresh = 0.018; |
| 188 | for (v = 0; v <= MAX_Y_T; ++v) { |
| 189 | const double g = norm * v; |
| 190 | if (g <= thresh * 4.5) { |
| 191 | kGammaToLinearTabF[v] = (float)(g / 4.5); |
| 192 | } else { |
| 193 | const double a_rec = 1. / (1. + a); |
| 194 | kGammaToLinearTabF[v] = (float)pow(a_rec * (g + a), kGammaF); |
| 195 | } |
| 196 | } |
| 197 | for (v = 0; v <= kGammaTabSize; ++v) { |
| 198 | const double g = scale * v; |
| 199 | double value; |
| 200 | if (g <= thresh) { |
| 201 | value = 4.5 * g; |
| 202 | } else { |
| 203 | value = (1. + a) * pow(g, 1. / kGammaF) - a; |
| 204 | } |
| 205 | kLinearToGammaTabF[v] = (float)(MAX_Y_T * value); |
| 206 | } |
| 207 | // to prevent small rounding errors to cause read-overflow: |
| 208 | kLinearToGammaTabF[kGammaTabSize + 1] = kLinearToGammaTabF[kGammaTabSize]; |
| 209 | kGammaTablesFOk = 1; |
| 210 | } |
| 211 | } |
| 212 | |
| 213 | static WEBP_INLINE float GammaToLinearF(int v) { |
| 214 | return kGammaToLinearTabF[v]; |
| 215 | } |
| 216 | |
| 217 | static WEBP_INLINE int LinearToGammaF(float value) { |
| 218 | const float v = value * kGammaTabSize; |
| 219 | const int tab_pos = (int)v; |
| 220 | const float x = v - (float)tab_pos; // fractional part |
| 221 | const float v0 = kLinearToGammaTabF[tab_pos + 0]; |
| 222 | const float v1 = kLinearToGammaTabF[tab_pos + 1]; |
| 223 | const float y = v1 * x + v0 * (1.f - x); // interpolate |
| 224 | return (int)(y + .5); |
| 225 | } |
| 226 | |
| 227 | #else |
| 228 | |
| 229 | static WEBP_TSAN_IGNORE_FUNCTION void InitGammaTablesF(void) {} |
| 230 | static WEBP_INLINE float GammaToLinearF(int v) { |
| 231 | const float norm = 1.f / MAX_Y_T; |
| 232 | return norm * v; |
| 233 | } |
| 234 | static WEBP_INLINE int LinearToGammaF(float value) { |
| 235 | return (int)(MAX_Y_T * value + .5); |
| 236 | } |
| 237 | |
| 238 | #endif // USE_GAMMA_COMPRESSION |
| 239 | |
| 240 | //------------------------------------------------------------------------------ |
| 241 | |
| 242 | static uint8_t clip_8b(fixed_t v) { |
| 243 | return (!(v & ~0xff)) ? (uint8_t)v : (v < 0) ? 0u : 255u; |
| 244 | } |
| 245 | |
| 246 | static fixed_y_t clip_y(int y) { |
| 247 | return (!(y & ~MAX_Y_T)) ? (fixed_y_t)y : (y < 0) ? 0 : MAX_Y_T; |
| 248 | } |
| 249 | |
| 250 | //------------------------------------------------------------------------------ |
| 251 | |
| 252 | static int RGBToGray(int r, int g, int b) { |
| 253 | const int luma = 13933 * r + 46871 * g + 4732 * b + YUV_HALF; |
| 254 | return (luma >> YUV_FIX); |
| 255 | } |
| 256 | |
// Floating-point weighted sum of r/g/b with weights 0.2126 / 0.7152 / 0.0722,
// evaluated in double precision and returned as float.
static float RGBToGrayF(float r, float g, float b) {
  static const double kWeightR = 0.2126;
  static const double kWeightG = 0.7152;
  static const double kWeightB = 0.0722;
  return (float)(kWeightR * r + kWeightG * g + kWeightB * b);
}
| 260 | |
// Averages four gamma-space samples in linear space and returns the average
// converted back to gamma space.
static int ScaleDown(int a, int b, int c, int d) {
  const float lin_a = GammaToLinearF(a);
  const float lin_b = GammaToLinearF(b);
  const float lin_c = GammaToLinearF(c);
  const float lin_d = GammaToLinearF(d);
  const float mean = 0.25f * (lin_a + lin_b + lin_c + lin_d);
  return LinearToGammaF(mean);
}
| 268 | |
| 269 | static WEBP_INLINE void UpdateW(const fixed_y_t* src, fixed_y_t* dst, int w) { |
| 270 | int i; |
| 271 | for (i = 0; i < w; ++i) { |
| 272 | const float R = GammaToLinearF(src[0 * w + i]); |
| 273 | const float G = GammaToLinearF(src[1 * w + i]); |
| 274 | const float B = GammaToLinearF(src[2 * w + i]); |
| 275 | const float Y = RGBToGrayF(R, G, B); |
| 276 | dst[i] = (fixed_y_t)LinearToGammaF(Y); |
| 277 | } |
| 278 | } |
| 279 | |
| 280 | static void UpdateChroma(const fixed_y_t* src1, const fixed_y_t* src2, |
| 281 | fixed_t* dst, int uv_w) { |
| 282 | int i; |
| 283 | for (i = 0; i < uv_w; ++i) { |
| 284 | const int r = ScaleDown(src1[0 * uv_w + 0], src1[0 * uv_w + 1], |
| 285 | src2[0 * uv_w + 0], src2[0 * uv_w + 1]); |
| 286 | const int g = ScaleDown(src1[2 * uv_w + 0], src1[2 * uv_w + 1], |
| 287 | src2[2 * uv_w + 0], src2[2 * uv_w + 1]); |
| 288 | const int b = ScaleDown(src1[4 * uv_w + 0], src1[4 * uv_w + 1], |
| 289 | src2[4 * uv_w + 0], src2[4 * uv_w + 1]); |
| 290 | const int W = RGBToGray(r, g, b); |
| 291 | dst[0 * uv_w] = (fixed_t)(r - W); |
| 292 | dst[1 * uv_w] = (fixed_t)(g - W); |
| 293 | dst[2 * uv_w] = (fixed_t)(b - W); |
| 294 | dst += 1; |
| 295 | src1 += 2; |
| 296 | src2 += 2; |
| 297 | } |
| 298 | } |
| 299 | |
| 300 | static void StoreGray(const fixed_y_t* rgb, fixed_y_t* y, int w) { |
| 301 | int i; |
| 302 | for (i = 0; i < w; ++i) { |
| 303 | y[i] = RGBToGray(rgb[0 * w + i], rgb[1 * w + i], rgb[2 * w + i]); |
| 304 | } |
| 305 | } |
| 306 | |
| 307 | //------------------------------------------------------------------------------ |
| 308 | |
| 309 | static WEBP_INLINE fixed_y_t Filter2(int A, int B, int W0) { |
| 310 | const int v0 = (A * 3 + B + 2) >> 2; |
| 311 | return clip_y(v0 + W0); |
| 312 | } |
| 313 | |
| 314 | //------------------------------------------------------------------------------ |
| 315 | |
| 316 | static WEBP_INLINE fixed_y_t UpLift(uint8_t a) { // 8bit -> SFIX |
| 317 | return ((fixed_y_t)a << SFIX) | SHALF; |
| 318 | } |
| 319 | |
| 320 | static void ImportOneRow(const uint8_t* const r_ptr, |
| 321 | const uint8_t* const g_ptr, |
| 322 | const uint8_t* const b_ptr, |
| 323 | int step, |
| 324 | int pic_width, |
| 325 | fixed_y_t* const dst) { |
| 326 | int i; |
| 327 | const int w = (pic_width + 1) & ~1; |
| 328 | for (i = 0; i < pic_width; ++i) { |
| 329 | const int off = i * step; |
| 330 | dst[i + 0 * w] = UpLift(r_ptr[off]); |
| 331 | dst[i + 1 * w] = UpLift(g_ptr[off]); |
| 332 | dst[i + 2 * w] = UpLift(b_ptr[off]); |
| 333 | } |
| 334 | if (pic_width & 1) { // replicate rightmost pixel |
| 335 | dst[pic_width + 0 * w] = dst[pic_width + 0 * w - 1]; |
| 336 | dst[pic_width + 1 * w] = dst[pic_width + 1 * w - 1]; |
| 337 | dst[pic_width + 2 * w] = dst[pic_width + 2 * w - 1]; |
| 338 | } |
| 339 | } |
| 340 | |
| 341 | static void InterpolateTwoRows(const fixed_y_t* const best_y, |
| 342 | const fixed_t* prev_uv, |
| 343 | const fixed_t* cur_uv, |
| 344 | const fixed_t* next_uv, |
| 345 | int w, |
| 346 | fixed_y_t* out1, |
| 347 | fixed_y_t* out2) { |
| 348 | const int uv_w = w >> 1; |
| 349 | const int len = (w - 1) >> 1; // length to filter |
| 350 | int k = 3; |
| 351 | while (k-- > 0) { // process each R/G/B segments in turn |
| 352 | // special boundary case for i==0 |
| 353 | out1[0] = Filter2(cur_uv[0], prev_uv[0], best_y[0]); |
| 354 | out2[0] = Filter2(cur_uv[0], next_uv[0], best_y[w]); |
| 355 | |
| 356 | WebPSharpYUVFilterRow(cur_uv, prev_uv, len, best_y + 0 + 1, out1 + 1); |
| 357 | WebPSharpYUVFilterRow(cur_uv, next_uv, len, best_y + w + 1, out2 + 1); |
| 358 | |
| 359 | // special boundary case for i == w - 1 when w is even |
| 360 | if (!(w & 1)) { |
| 361 | out1[w - 1] = Filter2(cur_uv[uv_w - 1], prev_uv[uv_w - 1], |
| 362 | best_y[w - 1 + 0]); |
| 363 | out2[w - 1] = Filter2(cur_uv[uv_w - 1], next_uv[uv_w - 1], |
| 364 | best_y[w - 1 + w]); |
| 365 | } |
| 366 | out1 += w; |
| 367 | out2 += w; |
| 368 | prev_uv += uv_w; |
| 369 | cur_uv += uv_w; |
| 370 | next_uv += uv_w; |
| 371 | } |
| 372 | } |
| 373 | |
| 374 | static WEBP_INLINE uint8_t ConvertRGBToY(int r, int g, int b) { |
| 375 | const int luma = 16839 * r + 33059 * g + 6420 * b + SROUNDER; |
| 376 | return clip_8b(16 + (luma >> (YUV_FIX + SFIX))); |
| 377 | } |
| 378 | |
| 379 | static WEBP_INLINE uint8_t ConvertRGBToU(int r, int g, int b) { |
| 380 | const int u = -9719 * r - 19081 * g + 28800 * b + SROUNDER; |
| 381 | return clip_8b(128 + (u >> (YUV_FIX + SFIX))); |
| 382 | } |
| 383 | |
| 384 | static WEBP_INLINE uint8_t ConvertRGBToV(int r, int g, int b) { |
| 385 | const int v = +28800 * r - 24116 * g - 4684 * b + SROUNDER; |
| 386 | return clip_8b(128 + (v >> (YUV_FIX + SFIX))); |
| 387 | } |
| 388 | |
| 389 | static int ConvertWRGBToYUV(const fixed_y_t* best_y, const fixed_t* best_uv, |
| 390 | WebPPicture* const picture) { |
| 391 | int i, j; |
| 392 | uint8_t* dst_y = picture->y; |
| 393 | uint8_t* dst_u = picture->u; |
| 394 | uint8_t* dst_v = picture->v; |
| 395 | const fixed_t* const best_uv_base = best_uv; |
| 396 | const int w = (picture->width + 1) & ~1; |
| 397 | const int h = (picture->height + 1) & ~1; |
| 398 | const int uv_w = w >> 1; |
| 399 | const int uv_h = h >> 1; |
| 400 | for (best_uv = best_uv_base, j = 0; j < picture->height; ++j) { |
| 401 | for (i = 0; i < picture->width; ++i) { |
| 402 | const int off = (i >> 1); |
| 403 | const int W = best_y[i]; |
| 404 | const int r = best_uv[off + 0 * uv_w] + W; |
| 405 | const int g = best_uv[off + 1 * uv_w] + W; |
| 406 | const int b = best_uv[off + 2 * uv_w] + W; |
| 407 | dst_y[i] = ConvertRGBToY(r, g, b); |
| 408 | } |
| 409 | best_y += w; |
| 410 | best_uv += (j & 1) * 3 * uv_w; |
| 411 | dst_y += picture->y_stride; |
| 412 | } |
| 413 | for (best_uv = best_uv_base, j = 0; j < uv_h; ++j) { |
| 414 | for (i = 0; i < uv_w; ++i) { |
| 415 | const int off = i; |
| 416 | const int r = best_uv[off + 0 * uv_w]; |
| 417 | const int g = best_uv[off + 1 * uv_w]; |
| 418 | const int b = best_uv[off + 2 * uv_w]; |
| 419 | dst_u[i] = ConvertRGBToU(r, g, b); |
| 420 | dst_v[i] = ConvertRGBToV(r, g, b); |
| 421 | } |
| 422 | best_uv += 3 * uv_w; |
| 423 | dst_u += picture->uv_stride; |
| 424 | dst_v += picture->uv_stride; |
| 425 | } |
| 426 | return 1; |
| 427 | } |
| 428 | |
| 429 | //------------------------------------------------------------------------------ |
| 430 | // Main function |
| 431 | |
| 432 | #define SAFE_ALLOC(W, H, T) ((T*)WebPSafeMalloc((W) * (H), sizeof(T))) |
| 433 | |
| 434 | static int PreprocessARGB(const uint8_t* r_ptr, |
| 435 | const uint8_t* g_ptr, |
| 436 | const uint8_t* b_ptr, |
| 437 | int step, int rgb_stride, |
| 438 | WebPPicture* const picture) { |
| 439 | // we expand the right/bottom border if needed |
| 440 | const int w = (picture->width + 1) & ~1; |
| 441 | const int h = (picture->height + 1) & ~1; |
| 442 | const int uv_w = w >> 1; |
| 443 | const int uv_h = h >> 1; |
| 444 | uint64_t prev_diff_y_sum = ~0; |
| 445 | int j, iter; |
| 446 | |
| 447 | // TODO(skal): allocate one big memory chunk. But for now, it's easier |
| 448 | // for valgrind debugging to have several chunks. |
| 449 | fixed_y_t* const tmp_buffer = SAFE_ALLOC(w * 3, 2, fixed_y_t); // scratch |
| 450 | fixed_y_t* const best_y_base = SAFE_ALLOC(w, h, fixed_y_t); |
| 451 | fixed_y_t* const target_y_base = SAFE_ALLOC(w, h, fixed_y_t); |
| 452 | fixed_y_t* const best_rgb_y = SAFE_ALLOC(w, 2, fixed_y_t); |
| 453 | fixed_t* const best_uv_base = SAFE_ALLOC(uv_w * 3, uv_h, fixed_t); |
| 454 | fixed_t* const target_uv_base = SAFE_ALLOC(uv_w * 3, uv_h, fixed_t); |
| 455 | fixed_t* const best_rgb_uv = SAFE_ALLOC(uv_w * 3, 1, fixed_t); |
| 456 | fixed_y_t* best_y = best_y_base; |
| 457 | fixed_y_t* target_y = target_y_base; |
| 458 | fixed_t* best_uv = best_uv_base; |
| 459 | fixed_t* target_uv = target_uv_base; |
| 460 | const uint64_t diff_y_threshold = (uint64_t)(3.0 * w * h); |
| 461 | int ok; |
| 462 | |
| 463 | if (best_y_base == NULL || best_uv_base == NULL || |
| 464 | target_y_base == NULL || target_uv_base == NULL || |
| 465 | best_rgb_y == NULL || best_rgb_uv == NULL || |
| 466 | tmp_buffer == NULL) { |
| 467 | ok = WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY); |
| 468 | goto End; |
| 469 | } |
| 470 | assert(picture->width >= kMinDimensionIterativeConversion); |
| 471 | assert(picture->height >= kMinDimensionIterativeConversion); |
| 472 | |
| 473 | WebPInitConvertARGBToYUV(); |
| 474 | |
| 475 | // Import RGB samples to W/RGB representation. |
| 476 | for (j = 0; j < picture->height; j += 2) { |
| 477 | const int is_last_row = (j == picture->height - 1); |
| 478 | fixed_y_t* const src1 = tmp_buffer + 0 * w; |
| 479 | fixed_y_t* const src2 = tmp_buffer + 3 * w; |
| 480 | |
| 481 | // prepare two rows of input |
| 482 | ImportOneRow(r_ptr, g_ptr, b_ptr, step, picture->width, src1); |
| 483 | if (!is_last_row) { |
| 484 | ImportOneRow(r_ptr + rgb_stride, g_ptr + rgb_stride, b_ptr + rgb_stride, |
| 485 | step, picture->width, src2); |
| 486 | } else { |
| 487 | memcpy(src2, src1, 3 * w * sizeof(*src2)); |
| 488 | } |
| 489 | StoreGray(src1, best_y + 0, w); |
| 490 | StoreGray(src2, best_y + w, w); |
| 491 | |
| 492 | UpdateW(src1, target_y, w); |
| 493 | UpdateW(src2, target_y + w, w); |
| 494 | UpdateChroma(src1, src2, target_uv, uv_w); |
| 495 | memcpy(best_uv, target_uv, 3 * uv_w * sizeof(*best_uv)); |
| 496 | best_y += 2 * w; |
| 497 | best_uv += 3 * uv_w; |
| 498 | target_y += 2 * w; |
| 499 | target_uv += 3 * uv_w; |
| 500 | r_ptr += 2 * rgb_stride; |
| 501 | g_ptr += 2 * rgb_stride; |
| 502 | b_ptr += 2 * rgb_stride; |
| 503 | } |
| 504 | |
| 505 | // Iterate and resolve clipping conflicts. |
| 506 | for (iter = 0; iter < kNumIterations; ++iter) { |
| 507 | const fixed_t* cur_uv = best_uv_base; |
| 508 | const fixed_t* prev_uv = best_uv_base; |
| 509 | uint64_t diff_y_sum = 0; |
| 510 | |
| 511 | best_y = best_y_base; |
| 512 | best_uv = best_uv_base; |
| 513 | target_y = target_y_base; |
| 514 | target_uv = target_uv_base; |
| 515 | for (j = 0; j < h; j += 2) { |
| 516 | fixed_y_t* const src1 = tmp_buffer + 0 * w; |
| 517 | fixed_y_t* const src2 = tmp_buffer + 3 * w; |
| 518 | { |
| 519 | const fixed_t* const next_uv = cur_uv + ((j < h - 2) ? 3 * uv_w : 0); |
| 520 | InterpolateTwoRows(best_y, prev_uv, cur_uv, next_uv, w, src1, src2); |
| 521 | prev_uv = cur_uv; |
| 522 | cur_uv = next_uv; |
| 523 | } |
| 524 | |
| 525 | UpdateW(src1, best_rgb_y + 0 * w, w); |
| 526 | UpdateW(src2, best_rgb_y + 1 * w, w); |
| 527 | UpdateChroma(src1, src2, best_rgb_uv, uv_w); |
| 528 | |
| 529 | // update two rows of Y and one row of RGB |
| 530 | diff_y_sum += WebPSharpYUVUpdateY(target_y, best_rgb_y, best_y, 2 * w); |
| 531 | WebPSharpYUVUpdateRGB(target_uv, best_rgb_uv, best_uv, 3 * uv_w); |
| 532 | |
| 533 | best_y += 2 * w; |
| 534 | best_uv += 3 * uv_w; |
| 535 | target_y += 2 * w; |
| 536 | target_uv += 3 * uv_w; |
| 537 | } |
| 538 | // test exit condition |
| 539 | if (iter > 0) { |
| 540 | if (diff_y_sum < diff_y_threshold) break; |
| 541 | if (diff_y_sum > prev_diff_y_sum) break; |
| 542 | } |
| 543 | prev_diff_y_sum = diff_y_sum; |
| 544 | } |
| 545 | // final reconstruction |
| 546 | ok = ConvertWRGBToYUV(best_y_base, best_uv_base, picture); |
| 547 | |
| 548 | End: |
| 549 | WebPSafeFree(best_y_base); |
| 550 | WebPSafeFree(best_uv_base); |
| 551 | WebPSafeFree(target_y_base); |
| 552 | WebPSafeFree(target_uv_base); |
| 553 | WebPSafeFree(best_rgb_y); |
| 554 | WebPSafeFree(best_rgb_uv); |
| 555 | WebPSafeFree(tmp_buffer); |
| 556 | return ok; |
| 557 | } |
| 558 | #undef SAFE_ALLOC |
| 559 | |
| 560 | //------------------------------------------------------------------------------ |
| 561 | // "Fast" regular RGB->YUV |
| 562 | |
// NOTE: SUM4, SUM2, SUM2ALPHA and SUM4ALPHA all reference a variable named
// 'rgb_stride' that must be in scope where the macro is expanded.

// Sum, in linear space, of the four samples of a 2x2 block (ptr[0], its right
// neighbour 'step' bytes away, and the two samples one row below), converted
// back with LinearToGamma(..., 0).
#define SUM4(ptr, step) LinearToGamma( \
    GammaToLinear((ptr)[0]) + \
    GammaToLinear((ptr)[(step)]) + \
    GammaToLinear((ptr)[rgb_stride]) + \
    GammaToLinear((ptr)[rgb_stride + (step)]), 0) \

// Same for a single column of two vertically adjacent samples; the sum is
// shifted left by 1 inside LinearToGamma().
#define SUM2(ptr) \
    LinearToGamma(GammaToLinear((ptr)[0]) + GammaToLinear((ptr)[rgb_stride]), 1)

// Plain sum of two vertically adjacent alpha samples.
#define SUM2ALPHA(ptr) ((ptr)[0] + (ptr)[rgb_stride])
// Plain sum of the alpha samples of a 2x2 block; the horizontal distance
// between samples is hard-coded to 4 bytes.
#define SUM4ALPHA(ptr) (SUM2ALPHA(ptr) + SUM2ALPHA((ptr) + 4))
| 574 | |
| 575 | #if defined(USE_INVERSE_ALPHA_TABLE) |
| 576 | |
// Number of fractional bits of the kInvAlpha[] entries.
static const int kAlphaFix = 19;
// Following table is (1 << kAlphaFix) / a. The (v * kInvAlpha[a]) >> kAlphaFix
// formula is then equal to v / a in most (99.6%) cases. Note that this table
// and constant are adjusted very tightly to fit 32b arithmetic.
// In particular, they use the fact that the operands for 'v / a' are actually
// derived as v = (a0.p0 + a1.p1 + a2.p2 + a3.p3) and a = a0 + a1 + a2 + a3
// with ai in [0..255] and pi in [0..1<<kGammaFix). The constraint to avoid
// overflow is: kGammaFix + kAlphaFix <= 31.
// The table is indexed by the alpha sum 'a', in [0, 4 * 0xff]; entry 0 is a
// placeholder.
static const uint32_t kInvAlpha[4 * 0xff + 1] = {
  0,  /* alpha = 0 */
  524288, 262144, 174762, 131072, 104857, 87381, 74898, 65536,
  58254, 52428, 47662, 43690, 40329, 37449, 34952, 32768,
  30840, 29127, 27594, 26214, 24966, 23831, 22795, 21845,
  20971, 20164, 19418, 18724, 18078, 17476, 16912, 16384,
  15887, 15420, 14979, 14563, 14169, 13797, 13443, 13107,
  12787, 12483, 12192, 11915, 11650, 11397, 11155, 10922,
  10699, 10485, 10280, 10082, 9892, 9709, 9532, 9362,
  9198, 9039, 8886, 8738, 8594, 8456, 8322, 8192,
  8065, 7943, 7825, 7710, 7598, 7489, 7384, 7281,
  7182, 7084, 6990, 6898, 6808, 6721, 6636, 6553,
  6472, 6393, 6316, 6241, 6168, 6096, 6026, 5957,
  5890, 5825, 5761, 5698, 5637, 5577, 5518, 5461,
  5405, 5349, 5295, 5242, 5190, 5140, 5090, 5041,
  4993, 4946, 4899, 4854, 4809, 4766, 4723, 4681,
  4639, 4599, 4559, 4519, 4481, 4443, 4405, 4369,
  4332, 4297, 4262, 4228, 4194, 4161, 4128, 4096,
  4064, 4032, 4002, 3971, 3942, 3912, 3883, 3855,
  3826, 3799, 3771, 3744, 3718, 3692, 3666, 3640,
  3615, 3591, 3566, 3542, 3518, 3495, 3472, 3449,
  3426, 3404, 3382, 3360, 3339, 3318, 3297, 3276,
  3256, 3236, 3216, 3196, 3177, 3158, 3139, 3120,
  3102, 3084, 3066, 3048, 3030, 3013, 2995, 2978,
  2962, 2945, 2928, 2912, 2896, 2880, 2864, 2849,
  2833, 2818, 2803, 2788, 2774, 2759, 2744, 2730,
  2716, 2702, 2688, 2674, 2661, 2647, 2634, 2621,
  2608, 2595, 2582, 2570, 2557, 2545, 2532, 2520,
  2508, 2496, 2484, 2473, 2461, 2449, 2438, 2427,
  2416, 2404, 2394, 2383, 2372, 2361, 2351, 2340,
  2330, 2319, 2309, 2299, 2289, 2279, 2269, 2259,
  2250, 2240, 2231, 2221, 2212, 2202, 2193, 2184,
  2175, 2166, 2157, 2148, 2139, 2131, 2122, 2114,
  2105, 2097, 2088, 2080, 2072, 2064, 2056, 2048,
  2040, 2032, 2024, 2016, 2008, 2001, 1993, 1985,
  1978, 1971, 1963, 1956, 1949, 1941, 1934, 1927,
  1920, 1913, 1906, 1899, 1892, 1885, 1879, 1872,
  1865, 1859, 1852, 1846, 1839, 1833, 1826, 1820,
  1814, 1807, 1801, 1795, 1789, 1783, 1777, 1771,
  1765, 1759, 1753, 1747, 1741, 1736, 1730, 1724,
  1718, 1713, 1707, 1702, 1696, 1691, 1685, 1680,
  1675, 1669, 1664, 1659, 1653, 1648, 1643, 1638,
  1633, 1628, 1623, 1618, 1613, 1608, 1603, 1598,
  1593, 1588, 1583, 1579, 1574, 1569, 1565, 1560,
  1555, 1551, 1546, 1542, 1537, 1533, 1528, 1524,
  1519, 1515, 1510, 1506, 1502, 1497, 1493, 1489,
  1485, 1481, 1476, 1472, 1468, 1464, 1460, 1456,
  1452, 1448, 1444, 1440, 1436, 1432, 1428, 1424,
  1420, 1416, 1413, 1409, 1405, 1401, 1398, 1394,
  1390, 1387, 1383, 1379, 1376, 1372, 1368, 1365,
  1361, 1358, 1354, 1351, 1347, 1344, 1340, 1337,
  1334, 1330, 1327, 1323, 1320, 1317, 1314, 1310,
  1307, 1304, 1300, 1297, 1294, 1291, 1288, 1285,
  1281, 1278, 1275, 1272, 1269, 1266, 1263, 1260,
  1257, 1254, 1251, 1248, 1245, 1242, 1239, 1236,
  1233, 1230, 1227, 1224, 1222, 1219, 1216, 1213,
  1210, 1208, 1205, 1202, 1199, 1197, 1194, 1191,
  1188, 1186, 1183, 1180, 1178, 1175, 1172, 1170,
  1167, 1165, 1162, 1159, 1157, 1154, 1152, 1149,
  1147, 1144, 1142, 1139, 1137, 1134, 1132, 1129,
  1127, 1125, 1122, 1120, 1117, 1115, 1113, 1110,
  1108, 1106, 1103, 1101, 1099, 1096, 1094, 1092,
  1089, 1087, 1085, 1083, 1081, 1078, 1076, 1074,
  1072, 1069, 1067, 1065, 1063, 1061, 1059, 1057,
  1054, 1052, 1050, 1048, 1046, 1044, 1042, 1040,
  1038, 1036, 1034, 1032, 1030, 1028, 1026, 1024,
  1022, 1020, 1018, 1016, 1014, 1012, 1010, 1008,
  1006, 1004, 1002, 1000, 998, 996, 994, 992,
  991, 989, 987, 985, 983, 981, 979, 978,
  976, 974, 972, 970, 969, 967, 965, 963,
  961, 960, 958, 956, 954, 953, 951, 949,
  948, 946, 944, 942, 941, 939, 937, 936,
  934, 932, 931, 929, 927, 926, 924, 923,
  921, 919, 918, 916, 914, 913, 911, 910,
  908, 907, 905, 903, 902, 900, 899, 897,
  896, 894, 893, 891, 890, 888, 887, 885,
  884, 882, 881, 879, 878, 876, 875, 873,
  872, 870, 869, 868, 866, 865, 863, 862,
  860, 859, 858, 856, 855, 853, 852, 851,
  849, 848, 846, 845, 844, 842, 841, 840,
  838, 837, 836, 834, 833, 832, 830, 829,
  828, 826, 825, 824, 823, 821, 820, 819,
  817, 816, 815, 814, 812, 811, 810, 809,
  807, 806, 805, 804, 802, 801, 800, 799,
  798, 796, 795, 794, 793, 791, 790, 789,
  788, 787, 786, 784, 783, 782, 781, 780,
  779, 777, 776, 775, 774, 773, 772, 771,
  769, 768, 767, 766, 765, 764, 763, 762,
  760, 759, 758, 757, 756, 755, 754, 753,
  752, 751, 750, 748, 747, 746, 745, 744,
  743, 742, 741, 740, 739, 738, 737, 736,
  735, 734, 733, 732, 731, 730, 729, 728,
  727, 726, 725, 724, 723, 722, 721, 720,
  719, 718, 717, 716, 715, 714, 713, 712,
  711, 710, 709, 708, 707, 706, 705, 704,
  703, 702, 701, 700, 699, 699, 698, 697,
  696, 695, 694, 693, 692, 691, 690, 689,
  688, 688, 687, 686, 685, 684, 683, 682,
  681, 680, 680, 679, 678, 677, 676, 675,
  674, 673, 673, 672, 671, 670, 669, 668,
  667, 667, 666, 665, 664, 663, 662, 661,
  661, 660, 659, 658, 657, 657, 656, 655,
  654, 653, 652, 652, 651, 650, 649, 648,
  648, 647, 646, 645, 644, 644, 643, 642,
  641, 640, 640, 639, 638, 637, 637, 636,
  635, 634, 633, 633, 632, 631, 630, 630,
  629, 628, 627, 627, 626, 625, 624, 624,
  623, 622, 621, 621, 620, 619, 618, 618,
  617, 616, 616, 615, 614, 613, 613, 612,
  611, 611, 610, 609, 608, 608, 607, 606,
  606, 605, 604, 604, 603, 602, 601, 601,
  600, 599, 599, 598, 597, 597, 596, 595,
  595, 594, 593, 593, 592, 591, 591, 590,
  589, 589, 588, 587, 587, 586, 585, 585,
  584, 583, 583, 582, 581, 581, 580, 579,
  579, 578, 578, 577, 576, 576, 575, 574,
  574, 573, 572, 572, 571, 571, 570, 569,
  569, 568, 568, 567, 566, 566, 565, 564,
  564, 563, 563, 562, 561, 561, 560, 560,
  559, 558, 558, 557, 557, 556, 555, 555,
  554, 554, 553, 553, 552, 551, 551, 550,
  550, 549, 548, 548, 547, 547, 546, 546,
  545, 544, 544, 543, 543, 542, 542, 541,
  541, 540, 539, 539, 538, 538, 537, 537,
  536, 536, 535, 534, 534, 533, 533, 532,
  532, 531, 531, 530, 530, 529, 529, 528,
  527, 527, 526, 526, 525, 525, 524, 524,
  523, 523, 522, 522, 521, 521, 520, 520,
  519, 519, 518, 518, 517, 517, 516, 516,
  515, 515, 514, 514
};
| 716 | |
// Note that LinearToGamma() expects the values to be premultiplied by 4,
// so we incorporate this factor 4 inside the DIVIDE_BY_ALPHA macro directly.
// Shifting right by (kAlphaFix - 2) instead of kAlphaFix is what provides
// that factor: the result approximates 4 * sum / a.
#define DIVIDE_BY_ALPHA(sum, a) (((sum) * kInvAlpha[(a)]) >> (kAlphaFix - 2))
| 720 | |
| 721 | #else |
| 722 | |
// Variant without the inverse table: plain integer division, with the same
// factor 4 applied to 'sum'.
#define DIVIDE_BY_ALPHA(sum, a) (4 * (sum) / (a))
| 724 | |
| 725 | #endif // USE_INVERSE_ALPHA_TABLE |
| 726 | |
| 727 | static WEBP_INLINE int LinearToGammaWeighted(const uint8_t* src, |
| 728 | const uint8_t* a_ptr, |
| 729 | uint32_t total_a, int step, |
| 730 | int rgb_stride) { |
| 731 | const uint32_t sum = |
| 732 | a_ptr[0] * GammaToLinear(src[0]) + |
| 733 | a_ptr[step] * GammaToLinear(src[step]) + |
| 734 | a_ptr[rgb_stride] * GammaToLinear(src[rgb_stride]) + |
| 735 | a_ptr[rgb_stride + step] * GammaToLinear(src[rgb_stride + step]); |
| 736 | assert(total_a > 0 && total_a <= 4 * 0xff); |
| 737 | #if defined(USE_INVERSE_ALPHA_TABLE) |
| 738 | assert((uint64_t)sum * kInvAlpha[total_a] < ((uint64_t)1 << 32)); |
| 739 | #endif |
| 740 | return LinearToGamma(DIVIDE_BY_ALPHA(sum, total_a), 0); |
| 741 | } |
| 742 | |
| 743 | static WEBP_INLINE void ConvertRowToY(const uint8_t* const r_ptr, |
| 744 | const uint8_t* const g_ptr, |
| 745 | const uint8_t* const b_ptr, |
| 746 | int step, |
| 747 | uint8_t* const dst_y, |
| 748 | int width, |
| 749 | VP8Random* const rg) { |
| 750 | int i, j; |
| 751 | for (i = 0, j = 0; i < width; i += 1, j += step) { |
| 752 | dst_y[i] = RGBToY(r_ptr[j], g_ptr[j], b_ptr[j], rg); |
| 753 | } |
| 754 | } |
| 755 | |
| 756 | static WEBP_INLINE void AccumulateRGBA(const uint8_t* const r_ptr, |
| 757 | const uint8_t* const g_ptr, |
| 758 | const uint8_t* const b_ptr, |
| 759 | const uint8_t* const a_ptr, |
| 760 | int rgb_stride, |
| 761 | uint16_t* dst, int width) { |
| 762 | int i, j; |
| 763 | // we loop over 2x2 blocks and produce one R/G/B/A value for each. |
| 764 | for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * 4, dst += 4) { |
| 765 | const uint32_t a = SUM4ALPHA(a_ptr + j); |
| 766 | int r, g, b; |
| 767 | if (a == 4 * 0xff || a == 0) { |
| 768 | r = SUM4(r_ptr + j, 4); |
| 769 | g = SUM4(g_ptr + j, 4); |
| 770 | b = SUM4(b_ptr + j, 4); |
| 771 | } else { |
| 772 | r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 4, rgb_stride); |
| 773 | g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 4, rgb_stride); |
| 774 | b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 4, rgb_stride); |
| 775 | } |
| 776 | dst[0] = r; |
| 777 | dst[1] = g; |
| 778 | dst[2] = b; |
| 779 | dst[3] = a; |
| 780 | } |
| 781 | if (width & 1) { |
| 782 | const uint32_t a = 2u * SUM2ALPHA(a_ptr + j); |
| 783 | int r, g, b; |
| 784 | if (a == 4 * 0xff || a == 0) { |
| 785 | r = SUM2(r_ptr + j); |
| 786 | g = SUM2(g_ptr + j); |
| 787 | b = SUM2(b_ptr + j); |
| 788 | } else { |
| 789 | r = LinearToGammaWeighted(r_ptr + j, a_ptr + j, a, 0, rgb_stride); |
| 790 | g = LinearToGammaWeighted(g_ptr + j, a_ptr + j, a, 0, rgb_stride); |
| 791 | b = LinearToGammaWeighted(b_ptr + j, a_ptr + j, a, 0, rgb_stride); |
| 792 | } |
| 793 | dst[0] = r; |
| 794 | dst[1] = g; |
| 795 | dst[2] = b; |
| 796 | dst[3] = a; |
| 797 | } |
| 798 | } |
| 799 | |
| 800 | static WEBP_INLINE void AccumulateRGB(const uint8_t* const r_ptr, |
| 801 | const uint8_t* const g_ptr, |
| 802 | const uint8_t* const b_ptr, |
| 803 | int step, int rgb_stride, |
| 804 | uint16_t* dst, int width) { |
| 805 | int i, j; |
| 806 | for (i = 0, j = 0; i < (width >> 1); i += 1, j += 2 * step, dst += 4) { |
| 807 | dst[0] = SUM4(r_ptr + j, step); |
| 808 | dst[1] = SUM4(g_ptr + j, step); |
| 809 | dst[2] = SUM4(b_ptr + j, step); |
| 810 | } |
| 811 | if (width & 1) { |
| 812 | dst[0] = SUM2(r_ptr + j); |
| 813 | dst[1] = SUM2(g_ptr + j); |
| 814 | dst[2] = SUM2(b_ptr + j); |
| 815 | } |
| 816 | } |
| 817 | |
| 818 | static WEBP_INLINE void ConvertRowsToUV(const uint16_t* rgb, |
| 819 | uint8_t* const dst_u, |
| 820 | uint8_t* const dst_v, |
| 821 | int width, |
| 822 | VP8Random* const rg) { |
| 823 | int i; |
| 824 | for (i = 0; i < width; i += 1, rgb += 4) { |
| 825 | const int r = rgb[0], g = rgb[1], b = rgb[2]; |
| 826 | dst_u[i] = RGBToU(r, g, b, rg); |
| 827 | dst_v[i] = RGBToV(r, g, b, rg); |
| 828 | } |
| 829 | } |
| 830 | |
| 831 | static int ImportYUVAFromRGBA(const uint8_t* r_ptr, |
| 832 | const uint8_t* g_ptr, |
| 833 | const uint8_t* b_ptr, |
| 834 | const uint8_t* a_ptr, |
| 835 | int step, // bytes per pixel |
| 836 | int rgb_stride, // bytes per scanline |
| 837 | float dithering, |
| 838 | int use_iterative_conversion, |
| 839 | WebPPicture* const picture) { |
| 840 | int y; |
| 841 | const int width = picture->width; |
| 842 | const int height = picture->height; |
| 843 | const int has_alpha = CheckNonOpaque(a_ptr, width, height, step, rgb_stride); |
| 844 | const int is_rgb = (r_ptr < b_ptr); // otherwise it's bgr |
| 845 | |
| 846 | picture->colorspace = has_alpha ? WEBP_YUV420A : WEBP_YUV420; |
| 847 | picture->use_argb = 0; |
| 848 | |
| 849 | // disable smart conversion if source is too small (overkill). |
| 850 | if (width < kMinDimensionIterativeConversion || |
| 851 | height < kMinDimensionIterativeConversion) { |
| 852 | use_iterative_conversion = 0; |
| 853 | } |
| 854 | |
| 855 | if (!WebPPictureAllocYUVA(picture, width, height)) { |
| 856 | return 0; |
| 857 | } |
| 858 | if (has_alpha) { |
| 859 | WebPInitAlphaProcessing(); |
| 860 | assert(step == 4); |
| 861 | #if defined(USE_GAMMA_COMPRESSION) && defined(USE_INVERSE_ALPHA_TABLE) |
| 862 | assert(kAlphaFix + kGammaFix <= 31); |
| 863 | #endif |
| 864 | } |
| 865 | |
| 866 | if (use_iterative_conversion) { |
| 867 | InitGammaTablesF(); |
| 868 | if (!PreprocessARGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, picture)) { |
| 869 | return 0; |
| 870 | } |
| 871 | if (has_alpha) { |
| 872 | WebPExtractAlpha(a_ptr, rgb_stride, width, height, |
| 873 | picture->a, picture->a_stride); |
| 874 | } |
| 875 | } else { |
| 876 | const int uv_width = (width + 1) >> 1; |
| 877 | int use_dsp = (step == 3); // use special function in this case |
| 878 | // temporary storage for accumulated R/G/B values during conversion to U/V |
| 879 | uint16_t* const tmp_rgb = |
| 880 | (uint16_t*)WebPSafeMalloc(4 * uv_width, sizeof(*tmp_rgb)); |
| 881 | uint8_t* dst_y = picture->y; |
| 882 | uint8_t* dst_u = picture->u; |
| 883 | uint8_t* dst_v = picture->v; |
| 884 | uint8_t* dst_a = picture->a; |
| 885 | |
| 886 | VP8Random base_rg; |
| 887 | VP8Random* rg = NULL; |
| 888 | if (dithering > 0.) { |
| 889 | VP8InitRandom(&base_rg, dithering); |
| 890 | rg = &base_rg; |
| 891 | use_dsp = 0; // can't use dsp in this case |
| 892 | } |
| 893 | WebPInitConvertARGBToYUV(); |
| 894 | InitGammaTables(); |
| 895 | |
| 896 | if (tmp_rgb == NULL) return 0; // malloc error |
| 897 | |
| 898 | // Downsample Y/U/V planes, two rows at a time |
| 899 | for (y = 0; y < (height >> 1); ++y) { |
| 900 | int rows_have_alpha = has_alpha; |
| 901 | if (use_dsp) { |
| 902 | if (is_rgb) { |
| 903 | WebPConvertRGB24ToY(r_ptr, dst_y, width); |
| 904 | WebPConvertRGB24ToY(r_ptr + rgb_stride, |
| 905 | dst_y + picture->y_stride, width); |
| 906 | } else { |
| 907 | WebPConvertBGR24ToY(b_ptr, dst_y, width); |
| 908 | WebPConvertBGR24ToY(b_ptr + rgb_stride, |
| 909 | dst_y + picture->y_stride, width); |
| 910 | } |
| 911 | } else { |
| 912 | ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg); |
| 913 | ConvertRowToY(r_ptr + rgb_stride, |
| 914 | g_ptr + rgb_stride, |
| 915 | b_ptr + rgb_stride, step, |
| 916 | dst_y + picture->y_stride, width, rg); |
| 917 | } |
| 918 | dst_y += 2 * picture->y_stride; |
| 919 | if (has_alpha) { |
| 920 | rows_have_alpha &= !WebPExtractAlpha(a_ptr, rgb_stride, width, 2, |
| 921 | dst_a, picture->a_stride); |
| 922 | dst_a += 2 * picture->a_stride; |
| 923 | } |
| 924 | // Collect averaged R/G/B(/A) |
| 925 | if (!rows_have_alpha) { |
| 926 | AccumulateRGB(r_ptr, g_ptr, b_ptr, step, rgb_stride, tmp_rgb, width); |
| 927 | } else { |
| 928 | AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, rgb_stride, tmp_rgb, width); |
| 929 | } |
| 930 | // Convert to U/V |
| 931 | if (rg == NULL) { |
| 932 | WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width); |
| 933 | } else { |
| 934 | ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg); |
| 935 | } |
| 936 | dst_u += picture->uv_stride; |
| 937 | dst_v += picture->uv_stride; |
| 938 | r_ptr += 2 * rgb_stride; |
| 939 | b_ptr += 2 * rgb_stride; |
| 940 | g_ptr += 2 * rgb_stride; |
| 941 | if (has_alpha) a_ptr += 2 * rgb_stride; |
| 942 | } |
| 943 | if (height & 1) { // extra last row |
| 944 | int row_has_alpha = has_alpha; |
| 945 | if (use_dsp) { |
| 946 | if (r_ptr < b_ptr) { |
| 947 | WebPConvertRGB24ToY(r_ptr, dst_y, width); |
| 948 | } else { |
| 949 | WebPConvertBGR24ToY(b_ptr, dst_y, width); |
| 950 | } |
| 951 | } else { |
| 952 | ConvertRowToY(r_ptr, g_ptr, b_ptr, step, dst_y, width, rg); |
| 953 | } |
| 954 | if (row_has_alpha) { |
| 955 | row_has_alpha &= !WebPExtractAlpha(a_ptr, 0, width, 1, dst_a, 0); |
| 956 | } |
| 957 | // Collect averaged R/G/B(/A) |
| 958 | if (!row_has_alpha) { |
| 959 | // Collect averaged R/G/B |
| 960 | AccumulateRGB(r_ptr, g_ptr, b_ptr, step, /* rgb_stride = */ 0, |
| 961 | tmp_rgb, width); |
| 962 | } else { |
| 963 | AccumulateRGBA(r_ptr, g_ptr, b_ptr, a_ptr, /* rgb_stride = */ 0, |
| 964 | tmp_rgb, width); |
| 965 | } |
| 966 | if (rg == NULL) { |
| 967 | WebPConvertRGBA32ToUV(tmp_rgb, dst_u, dst_v, uv_width); |
| 968 | } else { |
| 969 | ConvertRowsToUV(tmp_rgb, dst_u, dst_v, uv_width, rg); |
| 970 | } |
| 971 | } |
| 972 | WebPSafeFree(tmp_rgb); |
| 973 | } |
| 974 | return 1; |
| 975 | } |
| 976 | |
| 977 | #undef SUM4 |
| 978 | #undef SUM2 |
| 979 | #undef SUM4ALPHA |
| 980 | #undef SUM2ALPHA |
| 981 | |
| 982 | //------------------------------------------------------------------------------ |
| 983 | // call for ARGB->YUVA conversion |
| 984 | |
| 985 | static int PictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace, |
| 986 | float dithering, int use_iterative_conversion) { |
| 987 | if (picture == NULL) return 0; |
| 988 | if (picture->argb == NULL) { |
| 989 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
| 990 | } else if ((colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) { |
| 991 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION); |
| 992 | } else { |
| 993 | const uint8_t* const argb = (const uint8_t*)picture->argb; |
| 994 | const uint8_t* const r = ALPHA_IS_LAST ? argb + 2 : argb + 1; |
| 995 | const uint8_t* const g = ALPHA_IS_LAST ? argb + 1 : argb + 2; |
| 996 | const uint8_t* const b = ALPHA_IS_LAST ? argb + 0 : argb + 3; |
| 997 | const uint8_t* const a = ALPHA_IS_LAST ? argb + 3 : argb + 0; |
| 998 | |
| 999 | picture->colorspace = WEBP_YUV420; |
| 1000 | return ImportYUVAFromRGBA(r, g, b, a, 4, 4 * picture->argb_stride, |
| 1001 | dithering, use_iterative_conversion, picture); |
| 1002 | } |
| 1003 | } |
| 1004 | |
| 1005 | int WebPPictureARGBToYUVADithered(WebPPicture* picture, WebPEncCSP colorspace, |
| 1006 | float dithering) { |
| 1007 | return PictureARGBToYUVA(picture, colorspace, dithering, 0); |
| 1008 | } |
| 1009 | |
| 1010 | int WebPPictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace) { |
| 1011 | return PictureARGBToYUVA(picture, colorspace, 0.f, 0); |
| 1012 | } |
| 1013 | |
| 1014 | int WebPPictureSharpARGBToYUVA(WebPPicture* picture) { |
| 1015 | return PictureARGBToYUVA(picture, WEBP_YUV420, 0.f, 1); |
| 1016 | } |
| 1017 | // for backward compatibility |
| 1018 | int WebPPictureSmartARGBToYUVA(WebPPicture* picture) { |
| 1019 | return WebPPictureSharpARGBToYUVA(picture); |
| 1020 | } |
| 1021 | |
| 1022 | //------------------------------------------------------------------------------ |
| 1023 | // call for YUVA -> ARGB conversion |
| 1024 | |
| 1025 | int WebPPictureYUVAToARGB(WebPPicture* picture) { |
| 1026 | if (picture == NULL) return 0; |
| 1027 | if (picture->y == NULL || picture->u == NULL || picture->v == NULL) { |
| 1028 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
| 1029 | } |
| 1030 | if ((picture->colorspace & WEBP_CSP_ALPHA_BIT) && picture->a == NULL) { |
| 1031 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER); |
| 1032 | } |
| 1033 | if ((picture->colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) { |
| 1034 | return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION); |
| 1035 | } |
| 1036 | // Allocate a new argb buffer (discarding the previous one). |
| 1037 | if (!WebPPictureAllocARGB(picture, picture->width, picture->height)) return 0; |
| 1038 | picture->use_argb = 1; |
| 1039 | |
| 1040 | // Convert |
| 1041 | { |
| 1042 | int y; |
| 1043 | const int width = picture->width; |
| 1044 | const int height = picture->height; |
| 1045 | const int argb_stride = 4 * picture->argb_stride; |
| 1046 | uint8_t* dst = (uint8_t*)picture->argb; |
| 1047 | const uint8_t *cur_u = picture->u, *cur_v = picture->v, *cur_y = picture->y; |
| 1048 | WebPUpsampleLinePairFunc upsample = WebPGetLinePairConverter(ALPHA_IS_LAST); |
| 1049 | |
| 1050 | // First row, with replicated top samples. |
| 1051 | upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width); |
| 1052 | cur_y += picture->y_stride; |
| 1053 | dst += argb_stride; |
| 1054 | // Center rows. |
| 1055 | for (y = 1; y + 1 < height; y += 2) { |
| 1056 | const uint8_t* const top_u = cur_u; |
| 1057 | const uint8_t* const top_v = cur_v; |
| 1058 | cur_u += picture->uv_stride; |
| 1059 | cur_v += picture->uv_stride; |
| 1060 | upsample(cur_y, cur_y + picture->y_stride, top_u, top_v, cur_u, cur_v, |
| 1061 | dst, dst + argb_stride, width); |
| 1062 | cur_y += 2 * picture->y_stride; |
| 1063 | dst += 2 * argb_stride; |
| 1064 | } |
| 1065 | // Last row (if needed), with replicated bottom samples. |
| 1066 | if (height > 1 && !(height & 1)) { |
| 1067 | upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width); |
| 1068 | } |
| 1069 | // Insert alpha values if needed, in replacement for the default 0xff ones. |
| 1070 | if (picture->colorspace & WEBP_CSP_ALPHA_BIT) { |
| 1071 | for (y = 0; y < height; ++y) { |
| 1072 | uint32_t* const argb_dst = picture->argb + y * picture->argb_stride; |
| 1073 | const uint8_t* const src = picture->a + y * picture->a_stride; |
| 1074 | int x; |
| 1075 | for (x = 0; x < width; ++x) { |
| 1076 | argb_dst[x] = (argb_dst[x] & 0x00ffffffu) | ((uint32_t)src[x] << 24); |
| 1077 | } |
| 1078 | } |
| 1079 | } |
| 1080 | } |
| 1081 | return 1; |
| 1082 | } |
| 1083 | |
| 1084 | //------------------------------------------------------------------------------ |
| 1085 | // automatic import / conversion |
| 1086 | |
| 1087 | static int Import(WebPPicture* const picture, |
| 1088 | const uint8_t* const rgb, int rgb_stride, |
| 1089 | int step, int swap_rb, int import_alpha) { |
| 1090 | int y; |
| 1091 | const uint8_t* r_ptr = rgb + (swap_rb ? 2 : 0); |
| 1092 | const uint8_t* g_ptr = rgb + 1; |
| 1093 | const uint8_t* b_ptr = rgb + (swap_rb ? 0 : 2); |
| 1094 | const uint8_t* a_ptr = import_alpha ? rgb + 3 : NULL; |
| 1095 | const int width = picture->width; |
| 1096 | const int height = picture->height; |
| 1097 | |
| 1098 | if (!picture->use_argb) { |
| 1099 | return ImportYUVAFromRGBA(r_ptr, g_ptr, b_ptr, a_ptr, step, rgb_stride, |
| 1100 | 0.f /* no dithering */, 0, picture); |
| 1101 | } |
| 1102 | if (!WebPPictureAlloc(picture)) return 0; |
| 1103 | |
| 1104 | VP8EncDspARGBInit(); |
| 1105 | |
| 1106 | if (import_alpha) { |
| 1107 | uint32_t* dst = picture->argb; |
| 1108 | assert(step == 4); |
| 1109 | for (y = 0; y < height; ++y) { |
| 1110 | VP8PackARGB(a_ptr, r_ptr, g_ptr, b_ptr, width, dst); |
| 1111 | a_ptr += rgb_stride; |
| 1112 | r_ptr += rgb_stride; |
| 1113 | g_ptr += rgb_stride; |
| 1114 | b_ptr += rgb_stride; |
| 1115 | dst += picture->argb_stride; |
| 1116 | } |
| 1117 | } else { |
| 1118 | uint32_t* dst = picture->argb; |
| 1119 | assert(step >= 3); |
| 1120 | for (y = 0; y < height; ++y) { |
| 1121 | VP8PackRGB(r_ptr, g_ptr, b_ptr, width, step, dst); |
| 1122 | r_ptr += rgb_stride; |
| 1123 | g_ptr += rgb_stride; |
| 1124 | b_ptr += rgb_stride; |
| 1125 | dst += picture->argb_stride; |
| 1126 | } |
| 1127 | } |
| 1128 | return 1; |
| 1129 | } |
| 1130 | |
| 1131 | // Public API |
| 1132 | |
| 1133 | int WebPPictureImportRGB(WebPPicture* picture, |
| 1134 | const uint8_t* rgb, int rgb_stride) { |
| 1135 | return (picture != NULL && rgb != NULL) |
| 1136 | ? Import(picture, rgb, rgb_stride, 3, 0, 0) |
| 1137 | : 0; |
| 1138 | } |
| 1139 | |
| 1140 | int WebPPictureImportBGR(WebPPicture* picture, |
| 1141 | const uint8_t* rgb, int rgb_stride) { |
| 1142 | return (picture != NULL && rgb != NULL) |
| 1143 | ? Import(picture, rgb, rgb_stride, 3, 1, 0) |
| 1144 | : 0; |
| 1145 | } |
| 1146 | |
| 1147 | int WebPPictureImportRGBA(WebPPicture* picture, |
| 1148 | const uint8_t* rgba, int rgba_stride) { |
| 1149 | return (picture != NULL && rgba != NULL) |
| 1150 | ? Import(picture, rgba, rgba_stride, 4, 0, 1) |
| 1151 | : 0; |
| 1152 | } |
| 1153 | |
| 1154 | int WebPPictureImportBGRA(WebPPicture* picture, |
| 1155 | const uint8_t* rgba, int rgba_stride) { |
| 1156 | return (picture != NULL && rgba != NULL) |
| 1157 | ? Import(picture, rgba, rgba_stride, 4, 1, 1) |
| 1158 | : 0; |
| 1159 | } |
| 1160 | |
| 1161 | int WebPPictureImportRGBX(WebPPicture* picture, |
| 1162 | const uint8_t* rgba, int rgba_stride) { |
| 1163 | return (picture != NULL && rgba != NULL) |
| 1164 | ? Import(picture, rgba, rgba_stride, 4, 0, 0) |
| 1165 | : 0; |
| 1166 | } |
| 1167 | |
| 1168 | int WebPPictureImportBGRX(WebPPicture* picture, |
| 1169 | const uint8_t* rgba, int rgba_stride) { |
| 1170 | return (picture != NULL && rgba != NULL) |
| 1171 | ? Import(picture, rgba, rgba_stride, 4, 1, 0) |
| 1172 | : 0; |
| 1173 | } |
| 1174 | |
| 1175 | //------------------------------------------------------------------------------ |
| 1176 | |