1 | /* |
2 | * Copyright 2018 Google Inc. |
3 | * |
4 | * Use of this source code is governed by a BSD-style license that can be |
5 | * found in the LICENSE file. |
6 | */ |
7 | |
8 | #include "src/gpu/effects/GrYUVtoRGBEffect.h" |
9 | |
10 | #include "src/core/SkYUVMath.h" |
11 | #include "src/gpu/GrTexture.h" |
12 | #include "src/gpu/effects/GrMatrixEffect.h" |
13 | #include "src/gpu/glsl/GrGLSLFragmentProcessor.h" |
14 | #include "src/gpu/glsl/GrGLSLFragmentShaderBuilder.h" |
15 | #include "src/gpu/glsl/GrGLSLProgramBuilder.h" |
16 | #include "src/sksl/SkSLCPP.h" |
17 | #include "src/sksl/SkSLUtil.h" |
18 | |
19 | static void border_colors(SkYUVColorSpace cs, |
20 | const SkYUVAIndex yuvaIndices[4], |
21 | float planeBorders[4][4]) { |
22 | float m[20]; |
23 | SkColorMatrix_RGB2YUV(cs, m); |
24 | for (int i = 0; i < 4; ++i) { |
25 | if (yuvaIndices[i].fIndex == -1) { |
26 | return; |
27 | } |
28 | auto c = static_cast<int>(yuvaIndices[i].fChannel); |
29 | planeBorders[yuvaIndices[i].fIndex][c] = m[i*5 + 4]; |
30 | } |
31 | } |
32 | |
33 | std::unique_ptr<GrFragmentProcessor> GrYUVtoRGBEffect::Make(GrSurfaceProxyView views[], |
34 | const SkYUVAIndex yuvaIndices[4], |
35 | SkYUVColorSpace yuvColorSpace, |
36 | GrSamplerState samplerState, |
37 | const GrCaps& caps, |
38 | const SkMatrix& localMatrix, |
39 | const SkRect* subset, |
40 | const SkRect* domain) { |
41 | int numPlanes; |
42 | SkAssertResult(SkYUVAIndex::AreValidIndices(yuvaIndices, &numPlanes)); |
43 | |
44 | const SkISize yDimensions = |
45 | views[yuvaIndices[SkYUVAIndex::kY_Index].fIndex].proxy()->dimensions(); |
46 | |
47 | bool usesBorder = samplerState.wrapModeX() == GrSamplerState::WrapMode::kClampToBorder || |
48 | samplerState.wrapModeY() == GrSamplerState::WrapMode::kClampToBorder; |
49 | float planeBorders[4][4] = {}; |
50 | if (usesBorder) { |
51 | border_colors(yuvColorSpace, yuvaIndices, planeBorders); |
52 | } |
53 | |
54 | bool snap[2] = {false, false}; |
55 | std::unique_ptr<GrFragmentProcessor> planeFPs[4]; |
56 | for (int i = 0; i < numPlanes; ++i) { |
57 | SkISize dimensions = views[i].proxy()->dimensions(); |
58 | SkTCopyOnFirstWrite<SkMatrix> planeMatrix(&SkMatrix::I()); |
59 | SkRect planeSubset; |
60 | SkRect planeDomain; |
61 | bool makeLinearWithSnap = false; |
62 | float sx = 1.f, |
63 | sy = 1.f; |
64 | if (dimensions != yDimensions) { |
65 | // JPEG chroma subsampling of odd dimensions produces U and V planes with the ceiling of |
66 | // the image size divided by the subsampling factor (2). Our API for creating YUVA |
67 | // doesn't capture the intended subsampling (and we should fix that). This fixes up 2x |
68 | // subsampling for images with odd widths/heights (e.g. JPEG 420 or 422). |
69 | sx = (float)dimensions.width() / yDimensions.width(); |
70 | sy = (float)dimensions.height() / yDimensions.height(); |
71 | if ((yDimensions.width() & 0b1) && dimensions.width() == yDimensions.width() / 2 + 1) { |
72 | sx = 0.5f; |
73 | } |
74 | if ((yDimensions.height() & 0b1) && |
75 | dimensions.height() == yDimensions.height() / 2 + 1) { |
76 | sy = 0.5f; |
77 | } |
78 | *planeMatrix.writable() = SkMatrix::Scale(sx, sy); |
79 | if (subset) { |
80 | planeSubset = {subset->fLeft * sx, |
81 | subset->fTop * sy, |
82 | subset->fRight * sx, |
83 | subset->fBottom * sy}; |
84 | } |
85 | if (domain) { |
86 | planeDomain = {domain->fLeft * sx, |
87 | domain->fTop * sy, |
88 | domain->fRight * sx, |
89 | domain->fBottom * sy}; |
90 | } |
91 | // This promotion of nearest to linear filtering for UV planes exists to mimic |
92 | // libjpeg[-turbo]'s do_fancy_upsampling option. We will filter the subsampled plane, |
93 | // however we want to filter at a fixed point for each logical image pixel to simulate |
94 | // nearest neighbor. |
95 | if (samplerState.filter() == GrSamplerState::Filter::kNearest) { |
96 | bool snapX = (sx != 1.f), |
97 | snapY = (sy != 1.f); |
98 | makeLinearWithSnap = snapX || snapY; |
99 | snap[0] |= snapX; |
100 | snap[1] |= snapY; |
101 | if (domain) { |
102 | // The outer YUVToRGB effect will ensure sampling happens at pixel centers |
103 | // within this plane. |
104 | planeDomain = {std::floor(planeDomain.fLeft) + 0.5f, |
105 | std::floor(planeDomain.fTop) + 0.5f, |
106 | std::floor(planeDomain.fRight) + 0.5f, |
107 | std::floor(planeDomain.fBottom) + 0.5f}; |
108 | } |
109 | } |
110 | } else { |
111 | if (subset) { |
112 | planeSubset = *subset; |
113 | } |
114 | if (domain) { |
115 | planeDomain = *domain; |
116 | } |
117 | } |
118 | if (subset) { |
119 | SkASSERT(samplerState.mipmapped() == GrMipmapped::kNo); |
120 | if (makeLinearWithSnap) { |
121 | // The plane is subsampled and we have an overall subset on the image. We're |
122 | // emulating do_fancy_upsampling using linear filtering but snapping look ups to the |
123 | // y-plane pixel centers. Consider a logical image pixel at the edge of the subset. |
124 | // When computing the logical pixel color value we should use a 50/50 blend of two |
125 | // values from the subsampled plane. Depending on where the subset edge falls in |
126 | // actual subsampled plane, one of those values may come from outside the subset. |
127 | // Hence, we use this custom inset factory which applies the wrap mode to |
128 | // planeSubset but allows linear filtering to read pixels from the plane that are |
129 | // just outside planeSubset. |
130 | SkRect* domainRect = domain ? &planeDomain : nullptr; |
131 | planeFPs[i] = GrTextureEffect::MakeCustomLinearFilterInset( |
132 | views[i], kUnknown_SkAlphaType, *planeMatrix, samplerState.wrapModeX(), |
133 | samplerState.wrapModeY(), planeSubset, domainRect, {sx / 2.f, sy / 2.f}, |
134 | caps, planeBorders[i]); |
135 | } else if (domain) { |
136 | planeFPs[i] = GrTextureEffect::MakeSubset(views[i], kUnknown_SkAlphaType, |
137 | *planeMatrix, samplerState, planeSubset, |
138 | planeDomain, caps, planeBorders[i]); |
139 | } else { |
140 | planeFPs[i] = GrTextureEffect::MakeSubset(views[i], kUnknown_SkAlphaType, |
141 | *planeMatrix, samplerState, planeSubset, |
142 | caps, planeBorders[i]); |
143 | } |
144 | } else { |
145 | GrSamplerState planeSampler = samplerState; |
146 | if (makeLinearWithSnap) { |
147 | planeSampler.setFilterMode(GrSamplerState::Filter::kLinear); |
148 | } |
149 | planeFPs[i] = GrTextureEffect::Make(views[i], kUnknown_SkAlphaType, *planeMatrix, |
150 | planeSampler, caps, planeBorders[i]); |
151 | } |
152 | } |
153 | auto fp = std::unique_ptr<GrFragmentProcessor>( |
154 | new GrYUVtoRGBEffect(planeFPs, numPlanes, yuvaIndices, snap, yuvColorSpace)); |
155 | return GrMatrixEffect::Make(localMatrix, std::move(fp)); |
156 | } |
157 | |
158 | static SkAlphaType alpha_type(const SkYUVAIndex yuvaIndices[4]) { |
159 | return yuvaIndices[3].fIndex >= 0 ? kPremul_SkAlphaType : kOpaque_SkAlphaType; |
160 | } |
161 | |
162 | GrYUVtoRGBEffect::GrYUVtoRGBEffect(std::unique_ptr<GrFragmentProcessor> planeFPs[4], |
163 | int numPlanes, |
164 | const SkYUVAIndex yuvaIndices[4], |
165 | const bool snap[2], |
166 | SkYUVColorSpace yuvColorSpace) |
167 | : GrFragmentProcessor(kGrYUVtoRGBEffect_ClassID, |
168 | ModulateForClampedSamplerOptFlags(alpha_type(yuvaIndices))) |
169 | , fYUVColorSpace(yuvColorSpace) { |
170 | std::copy_n(yuvaIndices, 4, fYUVAIndices); |
171 | std::copy_n(snap, 2, fSnap); |
172 | |
173 | if (fSnap[0] || fSnap[1]) { |
174 | // Need this so that we can access coords in SKSL to perform snapping. |
175 | this->setUsesSampleCoordsDirectly(); |
176 | for (int i = 0; i < numPlanes; ++i) { |
177 | this->registerChild(std::move(planeFPs[i]), SkSL::SampleUsage::Explicit()); |
178 | } |
179 | } else { |
180 | for (int i = 0; i < numPlanes; ++i) { |
181 | this->registerChild(std::move(planeFPs[i])); |
182 | } |
183 | } |
184 | } |
185 | |
186 | #if GR_TEST_UTILS |
187 | SkString GrYUVtoRGBEffect::onDumpInfo() const { |
188 | SkString str("(" ); |
189 | for (int i = 0; i < 4; ++i) { |
190 | str.appendf("YUVAIndices[%d]=%d %d, " , |
191 | i, fYUVAIndices[i].fIndex, static_cast<int>(fYUVAIndices[i].fChannel)); |
192 | } |
193 | str.appendf("YUVColorSpace=%d, snap=(%d, %d))" , |
194 | static_cast<int>(fYUVColorSpace), fSnap[0], fSnap[1]); |
195 | return str; |
196 | } |
197 | #endif |
198 | |
199 | GrGLSLFragmentProcessor* GrYUVtoRGBEffect::onCreateGLSLInstance() const { |
200 | class GrGLSLYUVtoRGBEffect : public GrGLSLFragmentProcessor { |
201 | public: |
202 | GrGLSLYUVtoRGBEffect() {} |
203 | |
204 | void emitCode(EmitArgs& args) override { |
205 | GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder; |
206 | const GrYUVtoRGBEffect& yuvEffect = args.fFp.cast<GrYUVtoRGBEffect>(); |
207 | |
208 | int numPlanes = yuvEffect.numChildProcessors(); |
209 | |
210 | const char* sampleCoords = "" ; |
211 | if (yuvEffect.fSnap[0] || yuvEffect.fSnap[1]) { |
212 | fragBuilder->codeAppendf("float2 snappedCoords = %s;" , args.fSampleCoord); |
213 | if (yuvEffect.fSnap[0]) { |
214 | fragBuilder->codeAppend("snappedCoords.x = floor(snappedCoords.x) + 0.5;" ); |
215 | } |
216 | if (yuvEffect.fSnap[1]) { |
217 | fragBuilder->codeAppend("snappedCoords.y = floor(snappedCoords.y) + 0.5;" ); |
218 | } |
219 | sampleCoords = "snappedCoords" ; |
220 | } |
221 | |
222 | fragBuilder->codeAppendf("half4 planes[%d];" , numPlanes); |
223 | for (int i = 0; i < numPlanes; ++i) { |
224 | SkString tempVar = this->invokeChild(i, args, sampleCoords); |
225 | fragBuilder->codeAppendf("planes[%d] = %s;" , i, tempVar.c_str()); |
226 | } |
227 | |
228 | bool hasAlpha = yuvEffect.fYUVAIndices[3].fIndex >= 0; |
229 | SkString rgba[4]; |
230 | rgba[3] = "1" ; |
231 | for (int i = 0; i < (hasAlpha ? 4 : 3); ++i) { |
232 | auto info = yuvEffect.fYUVAIndices[i]; |
233 | auto letter = "rgba" [static_cast<int>(info.fChannel)]; |
234 | rgba[i].printf("planes[%d].%c" , info.fIndex, letter); |
235 | } |
236 | |
237 | fragBuilder->codeAppendf("half4 color = half4(%s, %s, %s, %s);" , |
238 | rgba[0].c_str(), rgba[1].c_str(), rgba[2].c_str(), rgba[3].c_str()); |
239 | |
240 | if (kIdentity_SkYUVColorSpace != yuvEffect.fYUVColorSpace) { |
241 | fColorSpaceMatrixVar = args.fUniformHandler->addUniform(&yuvEffect, |
242 | kFragment_GrShaderFlag, kHalf3x3_GrSLType, "colorSpaceMatrix" ); |
243 | fColorSpaceTranslateVar = args.fUniformHandler->addUniform(&yuvEffect, |
244 | kFragment_GrShaderFlag, kHalf3_GrSLType, "colorSpaceTranslate" ); |
245 | fragBuilder->codeAppendf( |
246 | "color.rgb = saturate(color.rgb * %s + %s);" , |
247 | args.fUniformHandler->getUniformCStr(fColorSpaceMatrixVar), |
248 | args.fUniformHandler->getUniformCStr(fColorSpaceTranslateVar)); |
249 | } |
250 | |
251 | if (hasAlpha) { |
252 | // premultiply alpha |
253 | fragBuilder->codeAppendf("color.rgb *= color.a;" ); |
254 | } |
255 | fragBuilder->codeAppendf("%s = color;" , args.fOutputColor); |
256 | } |
257 | |
258 | private: |
259 | void onSetData(const GrGLSLProgramDataManager& pdman, |
260 | const GrFragmentProcessor& proc) override { |
261 | const GrYUVtoRGBEffect& yuvEffect = proc.cast<GrYUVtoRGBEffect>(); |
262 | |
263 | if (yuvEffect.fYUVColorSpace != kIdentity_SkYUVColorSpace) { |
264 | SkASSERT(fColorSpaceMatrixVar.isValid()); |
265 | float yuvM[20]; |
266 | SkColorMatrix_YUV2RGB(yuvEffect.fYUVColorSpace, yuvM); |
267 | // We drop the fourth column entirely since the transformation |
268 | // should not depend on alpha. The fifth column is sent as a separate |
269 | // vector. The fourth row is also dropped entirely because alpha should |
270 | // never be modified. |
271 | SkASSERT(yuvM[3] == 0 && yuvM[8] == 0 && yuvM[13] == 0 && yuvM[18] == 1); |
272 | SkASSERT(yuvM[15] == 0 && yuvM[16] == 0 && yuvM[17] == 0 && yuvM[19] == 0); |
273 | float mtx[9] = { |
274 | yuvM[ 0], yuvM[ 1], yuvM[ 2], |
275 | yuvM[ 5], yuvM[ 6], yuvM[ 7], |
276 | yuvM[10], yuvM[11], yuvM[12], |
277 | }; |
278 | float v[3] = {yuvM[4], yuvM[9], yuvM[14]}; |
279 | pdman.setMatrix3f(fColorSpaceMatrixVar, mtx); |
280 | pdman.set3fv(fColorSpaceTranslateVar, 1, v); |
281 | } |
282 | } |
283 | |
284 | UniformHandle fColorSpaceMatrixVar; |
285 | UniformHandle fColorSpaceTranslateVar; |
286 | }; |
287 | |
288 | return new GrGLSLYUVtoRGBEffect; |
289 | } |
290 | void GrYUVtoRGBEffect::onGetGLSLProcessorKey(const GrShaderCaps& caps, |
291 | GrProcessorKeyBuilder* b) const { |
292 | uint32_t packed = 0; |
293 | for (int i = 0; i < 4; ++i) { |
294 | if (fYUVAIndices[i].fIndex < 0) { |
295 | continue; |
296 | } |
297 | |
298 | uint8_t index = fYUVAIndices[i].fIndex; |
299 | uint8_t chann = static_cast<int>(fYUVAIndices[i].fChannel); |
300 | |
301 | SkASSERT(index < 4 && chann < 4); |
302 | |
303 | packed |= (index | (chann << 2)) << (i * 4); |
304 | } |
305 | if (fYUVColorSpace == kIdentity_SkYUVColorSpace) { |
306 | packed |= 1 << 16; |
307 | } |
308 | if (fSnap[0]) { |
309 | packed |= 1 << 17; |
310 | } |
311 | if (fSnap[1]) { |
312 | packed |= 1 << 18; |
313 | } |
314 | b->add32(packed); |
315 | } |
316 | |
317 | bool GrYUVtoRGBEffect::onIsEqual(const GrFragmentProcessor& other) const { |
318 | const GrYUVtoRGBEffect& that = other.cast<GrYUVtoRGBEffect>(); |
319 | |
320 | return std::equal(fYUVAIndices, fYUVAIndices + 4, that.fYUVAIndices) && |
321 | std::equal(fSnap, fSnap + 2, that.fSnap) && |
322 | fYUVColorSpace == that.fYUVColorSpace; |
323 | } |
324 | |
325 | GrYUVtoRGBEffect::GrYUVtoRGBEffect(const GrYUVtoRGBEffect& src) |
326 | : GrFragmentProcessor(kGrYUVtoRGBEffect_ClassID, src.optimizationFlags()) |
327 | , fYUVColorSpace(src.fYUVColorSpace) { |
328 | this->cloneAndRegisterAllChildProcessors(src); |
329 | if (src.fSnap[0] || src.fSnap[1]) { |
330 | this->setUsesSampleCoordsDirectly(); |
331 | } |
332 | std::copy_n(src.fYUVAIndices, this->numChildProcessors(), fYUVAIndices); |
333 | std::copy_n(src.fSnap, 2, fSnap); |
334 | } |
335 | |
336 | std::unique_ptr<GrFragmentProcessor> GrYUVtoRGBEffect::clone() const { |
337 | return std::unique_ptr<GrFragmentProcessor>(new GrYUVtoRGBEffect(*this)); |
338 | } |
339 | |