1 | // Copyright 2014 Google Inc. All Rights Reserved. |
2 | // |
3 | // Use of this source code is governed by a BSD-style license |
4 | // that can be found in the COPYING file in the root of the source |
5 | // tree. An additional intellectual property rights grant can be found |
6 | // in the file PATENTS. All contributing project authors may |
7 | // be found in the AUTHORS file in the root of the source tree. |
8 | // ----------------------------------------------------------------------------- |
9 | // |
10 | // Rescaling functions |
11 | // |
12 | // Author: Skal (pascal.massimino@gmail.com) |
13 | |
14 | #include <assert.h> |
15 | |
16 | #include "./dsp.h" |
17 | #include "../utils/rescaler_utils.h" |
18 | |
19 | //------------------------------------------------------------------------------ |
20 | // Implementations of critical functions ImportRow / ExportRow |
21 | |
22 | #define ROUNDER (WEBP_RESCALER_ONE >> 1) |
23 | #define MULT_FIX(x, y) (((uint64_t)(x) * (y) + ROUNDER) >> WEBP_RESCALER_RFIX) |
24 | |
25 | //------------------------------------------------------------------------------ |
26 | // Row import |
27 | |
28 | void WebPRescalerImportRowExpandC(WebPRescaler* const wrk, const uint8_t* src) { |
29 | const int x_stride = wrk->num_channels; |
30 | const int x_out_max = wrk->dst_width * wrk->num_channels; |
31 | int channel; |
32 | assert(!WebPRescalerInputDone(wrk)); |
33 | assert(wrk->x_expand); |
34 | for (channel = 0; channel < x_stride; ++channel) { |
35 | int x_in = channel; |
36 | int x_out = channel; |
37 | // simple bilinear interpolation |
38 | int accum = wrk->x_add; |
39 | int left = src[x_in]; |
40 | int right = (wrk->src_width > 1) ? src[x_in + x_stride] : left; |
41 | x_in += x_stride; |
42 | while (1) { |
43 | wrk->frow[x_out] = right * wrk->x_add + (left - right) * accum; |
44 | x_out += x_stride; |
45 | if (x_out >= x_out_max) break; |
46 | accum -= wrk->x_sub; |
47 | if (accum < 0) { |
48 | left = right; |
49 | x_in += x_stride; |
50 | assert(x_in < wrk->src_width * x_stride); |
51 | right = src[x_in]; |
52 | accum += wrk->x_add; |
53 | } |
54 | } |
55 | assert(wrk->x_sub == 0 /* <- special case for src_width=1 */ || accum == 0); |
56 | } |
57 | } |
58 | |
59 | void WebPRescalerImportRowShrinkC(WebPRescaler* const wrk, const uint8_t* src) { |
60 | const int x_stride = wrk->num_channels; |
61 | const int x_out_max = wrk->dst_width * wrk->num_channels; |
62 | int channel; |
63 | assert(!WebPRescalerInputDone(wrk)); |
64 | assert(!wrk->x_expand); |
65 | for (channel = 0; channel < x_stride; ++channel) { |
66 | int x_in = channel; |
67 | int x_out = channel; |
68 | uint32_t sum = 0; |
69 | int accum = 0; |
70 | while (x_out < x_out_max) { |
71 | uint32_t base = 0; |
72 | accum += wrk->x_add; |
73 | while (accum > 0) { |
74 | accum -= wrk->x_sub; |
75 | assert(x_in < wrk->src_width * x_stride); |
76 | base = src[x_in]; |
77 | sum += base; |
78 | x_in += x_stride; |
79 | } |
80 | { // Emit next horizontal pixel. |
81 | const rescaler_t frac = base * (-accum); |
82 | wrk->frow[x_out] = sum * wrk->x_sub - frac; |
83 | // fresh fractional start for next pixel |
84 | sum = (int)MULT_FIX(frac, wrk->fx_scale); |
85 | } |
86 | x_out += x_stride; |
87 | } |
88 | assert(accum == 0); |
89 | } |
90 | } |
91 | |
92 | //------------------------------------------------------------------------------ |
93 | // Row export |
94 | |
95 | void WebPRescalerExportRowExpandC(WebPRescaler* const wrk) { |
96 | int x_out; |
97 | uint8_t* const dst = wrk->dst; |
98 | rescaler_t* const irow = wrk->irow; |
99 | const int x_out_max = wrk->dst_width * wrk->num_channels; |
100 | const rescaler_t* const frow = wrk->frow; |
101 | assert(!WebPRescalerOutputDone(wrk)); |
102 | assert(wrk->y_accum <= 0); |
103 | assert(wrk->y_expand); |
104 | assert(wrk->y_sub != 0); |
105 | if (wrk->y_accum == 0) { |
106 | for (x_out = 0; x_out < x_out_max; ++x_out) { |
107 | const uint32_t J = frow[x_out]; |
108 | const int v = (int)MULT_FIX(J, wrk->fy_scale); |
109 | assert(v >= 0 && v <= 255); |
110 | dst[x_out] = v; |
111 | } |
112 | } else { |
113 | const uint32_t B = WEBP_RESCALER_FRAC(-wrk->y_accum, wrk->y_sub); |
114 | const uint32_t A = (uint32_t)(WEBP_RESCALER_ONE - B); |
115 | for (x_out = 0; x_out < x_out_max; ++x_out) { |
116 | const uint64_t I = (uint64_t)A * frow[x_out] |
117 | + (uint64_t)B * irow[x_out]; |
118 | const uint32_t J = (uint32_t)((I + ROUNDER) >> WEBP_RESCALER_RFIX); |
119 | const int v = (int)MULT_FIX(J, wrk->fy_scale); |
120 | assert(v >= 0 && v <= 255); |
121 | dst[x_out] = v; |
122 | } |
123 | } |
124 | } |
125 | |
126 | void WebPRescalerExportRowShrinkC(WebPRescaler* const wrk) { |
127 | int x_out; |
128 | uint8_t* const dst = wrk->dst; |
129 | rescaler_t* const irow = wrk->irow; |
130 | const int x_out_max = wrk->dst_width * wrk->num_channels; |
131 | const rescaler_t* const frow = wrk->frow; |
132 | const uint32_t yscale = wrk->fy_scale * (-wrk->y_accum); |
133 | assert(!WebPRescalerOutputDone(wrk)); |
134 | assert(wrk->y_accum <= 0); |
135 | assert(!wrk->y_expand); |
136 | if (yscale) { |
137 | for (x_out = 0; x_out < x_out_max; ++x_out) { |
138 | const uint32_t frac = (uint32_t)MULT_FIX(frow[x_out], yscale); |
139 | const int v = (int)MULT_FIX(irow[x_out] - frac, wrk->fxy_scale); |
140 | assert(v >= 0 && v <= 255); |
141 | dst[x_out] = v; |
142 | irow[x_out] = frac; // new fractional start |
143 | } |
144 | } else { |
145 | for (x_out = 0; x_out < x_out_max; ++x_out) { |
146 | const int v = (int)MULT_FIX(irow[x_out], wrk->fxy_scale); |
147 | assert(v >= 0 && v <= 255); |
148 | dst[x_out] = v; |
149 | irow[x_out] = 0; |
150 | } |
151 | } |
152 | } |
153 | |
154 | #undef MULT_FIX |
155 | #undef ROUNDER |
156 | |
157 | //------------------------------------------------------------------------------ |
158 | // Main entry calls |
159 | |
160 | void WebPRescalerImportRow(WebPRescaler* const wrk, const uint8_t* src) { |
161 | assert(!WebPRescalerInputDone(wrk)); |
162 | if (!wrk->x_expand) { |
163 | WebPRescalerImportRowShrink(wrk, src); |
164 | } else { |
165 | WebPRescalerImportRowExpand(wrk, src); |
166 | } |
167 | } |
168 | |
169 | void WebPRescalerExportRow(WebPRescaler* const wrk) { |
170 | if (wrk->y_accum <= 0) { |
171 | assert(!WebPRescalerOutputDone(wrk)); |
172 | if (wrk->y_expand) { |
173 | WebPRescalerExportRowExpand(wrk); |
174 | } else if (wrk->fxy_scale) { |
175 | WebPRescalerExportRowShrink(wrk); |
176 | } else { // special case |
177 | int i; |
178 | assert(wrk->src_height == wrk->dst_height && wrk->x_add == 1); |
179 | assert(wrk->src_width == 1 && wrk->dst_width <= 2); |
180 | for (i = 0; i < wrk->num_channels * wrk->dst_width; ++i) { |
181 | wrk->dst[i] = wrk->irow[i]; |
182 | wrk->irow[i] = 0; |
183 | } |
184 | } |
185 | wrk->y_accum += wrk->y_add; |
186 | wrk->dst += wrk->dst_stride; |
187 | ++wrk->dst_y; |
188 | } |
189 | } |
190 | |
191 | //------------------------------------------------------------------------------ |
192 | |
193 | WebPRescalerImportRowFunc WebPRescalerImportRowExpand; |
194 | WebPRescalerImportRowFunc WebPRescalerImportRowShrink; |
195 | |
196 | WebPRescalerExportRowFunc WebPRescalerExportRowExpand; |
197 | WebPRescalerExportRowFunc WebPRescalerExportRowShrink; |
198 | |
199 | extern void WebPRescalerDspInitSSE2(void); |
200 | extern void WebPRescalerDspInitMIPS32(void); |
201 | extern void WebPRescalerDspInitMIPSdspR2(void); |
202 | extern void WebPRescalerDspInitMSA(void); |
203 | extern void WebPRescalerDspInitNEON(void); |
204 | |
205 | static volatile VP8CPUInfo rescaler_last_cpuinfo_used = |
206 | (VP8CPUInfo)&rescaler_last_cpuinfo_used; |
207 | |
208 | WEBP_TSAN_IGNORE_FUNCTION void WebPRescalerDspInit(void) { |
209 | if (rescaler_last_cpuinfo_used == VP8GetCPUInfo) return; |
210 | |
211 | WebPRescalerImportRowExpand = WebPRescalerImportRowExpandC; |
212 | WebPRescalerImportRowShrink = WebPRescalerImportRowShrinkC; |
213 | WebPRescalerExportRowExpand = WebPRescalerExportRowExpandC; |
214 | WebPRescalerExportRowShrink = WebPRescalerExportRowShrinkC; |
215 | |
216 | if (VP8GetCPUInfo != NULL) { |
217 | #if defined(WEBP_USE_SSE2) |
218 | if (VP8GetCPUInfo(kSSE2)) { |
219 | WebPRescalerDspInitSSE2(); |
220 | } |
221 | #endif |
222 | #if defined(WEBP_USE_NEON) |
223 | if (VP8GetCPUInfo(kNEON)) { |
224 | WebPRescalerDspInitNEON(); |
225 | } |
226 | #endif |
227 | #if defined(WEBP_USE_MIPS32) |
228 | if (VP8GetCPUInfo(kMIPS32)) { |
229 | WebPRescalerDspInitMIPS32(); |
230 | } |
231 | #endif |
232 | #if defined(WEBP_USE_MIPS_DSP_R2) |
233 | if (VP8GetCPUInfo(kMIPSdspR2)) { |
234 | WebPRescalerDspInitMIPSdspR2(); |
235 | } |
236 | #endif |
237 | #if defined(WEBP_USE_MSA) |
238 | if (VP8GetCPUInfo(kMSA)) { |
239 | WebPRescalerDspInitMSA(); |
240 | } |
241 | #endif |
242 | } |
243 | rescaler_last_cpuinfo_used = VP8GetCPUInfo; |
244 | } |
245 | |