1/****************************************************************************
2**
3** Copyright (C) 2016 The Qt Company Ltd.
4** Contact: https://www.qt.io/licensing/
5**
6** This file is part of the QtGui module of the Qt Toolkit.
7**
8** $QT_BEGIN_LICENSE:LGPL$
9** Commercial License Usage
10** Licensees holding valid commercial Qt licenses may use this file in
11** accordance with the commercial license agreement provided with the
12** Software or, alternatively, in accordance with the terms contained in
13** a written agreement between you and The Qt Company. For licensing terms
14** and conditions see https://www.qt.io/terms-conditions. For further
15** information use the contact form at https://www.qt.io/contact-us.
16**
17** GNU Lesser General Public License Usage
18** Alternatively, this file may be used under the terms of the GNU Lesser
19** General Public License version 3 as published by the Free Software
20** Foundation and appearing in the file LICENSE.LGPL3 included in the
21** packaging of this file. Please review the following information to
22** ensure the GNU Lesser General Public License version 3 requirements
23** will be met: https://www.gnu.org/licenses/lgpl-3.0.html.
24**
25** GNU General Public License Usage
26** Alternatively, this file may be used under the terms of the GNU
27** General Public License version 2.0 or (at your option) the GNU General
28** Public license version 3 or any later version approved by the KDE Free
29** Qt Foundation. The licenses are as published by the Free Software
30** Foundation and appearing in the file LICENSE.GPL2 and LICENSE.GPL3
31** included in the packaging of this file. Please review the following
32** information to ensure the GNU General Public License requirements will
33** be met: https://www.gnu.org/licenses/gpl-2.0.html and
34** https://www.gnu.org/licenses/gpl-3.0.html.
35**
36** $QT_END_LICENSE$
37**
38****************************************************************************/
39
40#include <private/qdrawhelper_p.h>
41#include <private/qdrawingprimitive_sse2_p.h>
42#include <private/qpaintengine_raster_p.h>
43#include <private/qpixellayout_p.h>
44
45#if defined(QT_COMPILER_SUPPORTS_SSE4_1)
46
47QT_BEGIN_NAMESPACE
48
49#ifndef __AVX2__
50template<bool RGBA>
51static void convertARGBToARGB32PM_sse4(uint *buffer, const uint *src, int count)
52{
53 int i = 0;
54 const __m128i alphaMask = _mm_set1_epi32(0xff000000);
55 const __m128i rgbaMask = _mm_setr_epi8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
56 const __m128i shuffleMask = _mm_setr_epi8(6, 7, 6, 7, 6, 7, 6, 7, 14, 15, 14, 15, 14, 15, 14, 15);
57 const __m128i half = _mm_set1_epi16(0x0080);
58 const __m128i zero = _mm_setzero_si128();
59
60 for (; i < count - 3; i += 4) {
61 __m128i srcVector = _mm_loadu_si128((const __m128i *)&src[i]);
62 if (!_mm_testz_si128(srcVector, alphaMask)) {
63 if (!_mm_testc_si128(srcVector, alphaMask)) {
64 if (RGBA)
65 srcVector = _mm_shuffle_epi8(srcVector, rgbaMask);
66 __m128i src1 = _mm_unpacklo_epi8(srcVector, zero);
67 __m128i src2 = _mm_unpackhi_epi8(srcVector, zero);
68 __m128i alpha1 = _mm_shuffle_epi8(src1, shuffleMask);
69 __m128i alpha2 = _mm_shuffle_epi8(src2, shuffleMask);
70 src1 = _mm_mullo_epi16(src1, alpha1);
71 src2 = _mm_mullo_epi16(src2, alpha2);
72 src1 = _mm_add_epi16(src1, _mm_srli_epi16(src1, 8));
73 src2 = _mm_add_epi16(src2, _mm_srli_epi16(src2, 8));
74 src1 = _mm_add_epi16(src1, half);
75 src2 = _mm_add_epi16(src2, half);
76 src1 = _mm_srli_epi16(src1, 8);
77 src2 = _mm_srli_epi16(src2, 8);
78 src1 = _mm_blend_epi16(src1, alpha1, 0x88);
79 src2 = _mm_blend_epi16(src2, alpha2, 0x88);
80 srcVector = _mm_packus_epi16(src1, src2);
81 _mm_storeu_si128((__m128i *)&buffer[i], srcVector);
82 } else {
83 if (RGBA)
84 _mm_storeu_si128((__m128i *)&buffer[i], _mm_shuffle_epi8(srcVector, rgbaMask));
85 else if (buffer != src)
86 _mm_storeu_si128((__m128i *)&buffer[i], srcVector);
87 }
88 } else {
89 _mm_storeu_si128((__m128i *)&buffer[i], zero);
90 }
91 }
92
93 SIMD_EPILOGUE(i, count, 3) {
94 uint v = qPremultiply(src[i]);
95 buffer[i] = RGBA ? RGBA2ARGB(v) : v;
96 }
97}
98
99template<bool RGBA>
100static void convertARGBToRGBA64PM_sse4(QRgba64 *buffer, const uint *src, int count)
101{
102 int i = 0;
103 const __m128i alphaMask = _mm_set1_epi32(0xff000000);
104 const __m128i rgbaMask = _mm_setr_epi8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
105 const __m128i shuffleMask = _mm_setr_epi8(6, 7, 6, 7, 6, 7, 6, 7, 14, 15, 14, 15, 14, 15, 14, 15);
106 const __m128i zero = _mm_setzero_si128();
107
108 for (; i < count - 3; i += 4) {
109 __m128i srcVector = _mm_loadu_si128((const __m128i *)&src[i]);
110 if (!_mm_testz_si128(srcVector, alphaMask)) {
111 bool cf = _mm_testc_si128(srcVector, alphaMask);
112
113 if (!RGBA)
114 srcVector = _mm_shuffle_epi8(srcVector, rgbaMask);
115 const __m128i src1 = _mm_unpacklo_epi8(srcVector, srcVector);
116 const __m128i src2 = _mm_unpackhi_epi8(srcVector, srcVector);
117 if (!cf) {
118 __m128i alpha1 = _mm_shuffle_epi8(src1, shuffleMask);
119 __m128i alpha2 = _mm_shuffle_epi8(src2, shuffleMask);
120 __m128i dst1 = _mm_mulhi_epu16(src1, alpha1);
121 __m128i dst2 = _mm_mulhi_epu16(src2, alpha2);
122 // Map 0->0xfffe to 0->0xffff
123 dst1 = _mm_add_epi16(dst1, _mm_srli_epi16(dst1, 15));
124 dst2 = _mm_add_epi16(dst2, _mm_srli_epi16(dst2, 15));
125 // correct alpha value:
126 dst1 = _mm_blend_epi16(dst1, src1, 0x88);
127 dst2 = _mm_blend_epi16(dst2, src2, 0x88);
128 _mm_storeu_si128((__m128i *)&buffer[i], dst1);
129 _mm_storeu_si128((__m128i *)&buffer[i + 2], dst2);
130 } else {
131 _mm_storeu_si128((__m128i *)&buffer[i], src1);
132 _mm_storeu_si128((__m128i *)&buffer[i + 2], src2);
133 }
134 } else {
135 _mm_storeu_si128((__m128i *)&buffer[i], zero);
136 _mm_storeu_si128((__m128i *)&buffer[i + 2], zero);
137 }
138 }
139
140 SIMD_EPILOGUE(i, count, 3) {
141 const uint s = RGBA ? RGBA2ARGB(src[i]) : src[i];
142 buffer[i] = QRgba64::fromArgb32(s).premultiplied();
143 }
144}
145#endif // __AVX2__
146
147static inline __m128 Q_DECL_VECTORCALL reciprocal_mul_ps(__m128 a, float mul)
148{
149 __m128 ia = _mm_rcp_ps(a); // Approximate 1/a
150 // Improve precision of ia using Newton-Raphson
151 ia = _mm_sub_ps(_mm_add_ps(ia, ia), _mm_mul_ps(ia, _mm_mul_ps(ia, a)));
152 ia = _mm_mul_ps(ia, _mm_set1_ps(mul));
153 return ia;
154}
155
156template<bool RGBA, bool RGBx>
157static inline void convertARGBFromARGB32PM_sse4(uint *buffer, const uint *src, int count)
158{
159 int i = 0;
160 if ((_MM_GET_EXCEPTION_MASK() & _MM_MASK_INVALID) == 0) {
161 for (; i < count; ++i) {
162 uint v = qUnpremultiply(src[i]);
163 if (RGBx)
164 v = 0xff000000 | v;
165 if (RGBA)
166 v = ARGB2RGBA(v);
167 buffer[i] = v;
168 }
169 return;
170 }
171 const __m128i alphaMask = _mm_set1_epi32(0xff000000);
172 const __m128i rgbaMask = _mm_setr_epi8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
173 const __m128i zero = _mm_setzero_si128();
174
175 for (; i < count - 3; i += 4) {
176 __m128i srcVector = _mm_loadu_si128((const __m128i *)&src[i]);
177 if (!_mm_testz_si128(srcVector, alphaMask)) {
178 if (!_mm_testc_si128(srcVector, alphaMask)) {
179 __m128i srcVectorAlpha = _mm_srli_epi32(srcVector, 24);
180 if (RGBA)
181 srcVector = _mm_shuffle_epi8(srcVector, rgbaMask);
182 const __m128 a = _mm_cvtepi32_ps(srcVectorAlpha);
183 const __m128 ia = reciprocal_mul_ps(a, 255.0f);
184 __m128i src1 = _mm_unpacklo_epi8(srcVector, zero);
185 __m128i src3 = _mm_unpackhi_epi8(srcVector, zero);
186 __m128i src2 = _mm_unpackhi_epi16(src1, zero);
187 __m128i src4 = _mm_unpackhi_epi16(src3, zero);
188 src1 = _mm_unpacklo_epi16(src1, zero);
189 src3 = _mm_unpacklo_epi16(src3, zero);
190 __m128 ia1 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(0, 0, 0, 0));
191 __m128 ia2 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(1, 1, 1, 1));
192 __m128 ia3 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(2, 2, 2, 2));
193 __m128 ia4 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(3, 3, 3, 3));
194 src1 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src1), ia1));
195 src2 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src2), ia2));
196 src3 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src3), ia3));
197 src4 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src4), ia4));
198 src1 = _mm_packus_epi32(src1, src2);
199 src3 = _mm_packus_epi32(src3, src4);
200 src1 = _mm_packus_epi16(src1, src3);
201 // Handle potential alpha == 0 values:
202 __m128i srcVectorAlphaMask = _mm_cmpeq_epi32(srcVectorAlpha, zero);
203 src1 = _mm_andnot_si128(srcVectorAlphaMask, src1);
204 // Fixup alpha values:
205 if (RGBx)
206 srcVector = _mm_or_si128(src1, alphaMask);
207 else
208 srcVector = _mm_blendv_epi8(src1, srcVector, alphaMask);
209 _mm_storeu_si128((__m128i *)&buffer[i], srcVector);
210 } else {
211 if (RGBA)
212 _mm_storeu_si128((__m128i *)&buffer[i], _mm_shuffle_epi8(srcVector, rgbaMask));
213 else if (buffer != src)
214 _mm_storeu_si128((__m128i *)&buffer[i], srcVector);
215 }
216 } else {
217 if (RGBx)
218 _mm_storeu_si128((__m128i *)&buffer[i], alphaMask);
219 else
220 _mm_storeu_si128((__m128i *)&buffer[i], zero);
221 }
222 }
223
224 SIMD_EPILOGUE(i, count, 3) {
225 uint v = qUnpremultiply_sse4(src[i]);
226 if (RGBx)
227 v = 0xff000000 | v;
228 if (RGBA)
229 v = ARGB2RGBA(v);
230 buffer[i] = v;
231 }
232}
233
234template<bool RGBA>
235static inline void convertARGBFromRGBA64PM_sse4(uint *buffer, const QRgba64 *src, int count)
236{
237 int i = 0;
238 if ((_MM_GET_EXCEPTION_MASK() & _MM_MASK_INVALID) == 0) {
239 for (; i < count; ++i) {
240 const QRgba64 v = src[i].unpremultiplied();
241 buffer[i] = RGBA ? toRgba8888(v) : toArgb32(v);
242 }
243 return;
244 }
245 const __m128i alphaMask = _mm_set1_epi64x(qint64(Q_UINT64_C(0xffff) << 48));
246 const __m128i alphaMask32 = _mm_set1_epi32(0xff000000);
247 const __m128i rgbaMask = _mm_setr_epi8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
248 const __m128i zero = _mm_setzero_si128();
249
250 for (; i < count - 3; i += 4) {
251 __m128i srcVector1 = _mm_loadu_si128((const __m128i *)&src[i]);
252 __m128i srcVector2 = _mm_loadu_si128((const __m128i *)&src[i + 2]);
253 bool transparent1 = _mm_testz_si128(srcVector1, alphaMask);
254 bool opaque1 = _mm_testc_si128(srcVector1, alphaMask);
255 bool transparent2 = _mm_testz_si128(srcVector2, alphaMask);
256 bool opaque2 = _mm_testc_si128(srcVector2, alphaMask);
257
258 if (!(transparent1 && transparent2)) {
259 if (!(opaque1 && opaque2)) {
260 __m128i srcVector1Alpha = _mm_srli_epi64(srcVector1, 48);
261 __m128i srcVector2Alpha = _mm_srli_epi64(srcVector2, 48);
262 __m128i srcVectorAlpha = _mm_packus_epi32(srcVector1Alpha, srcVector2Alpha);
263 const __m128 a = _mm_cvtepi32_ps(srcVectorAlpha);
264 // Convert srcVectorAlpha to final 8-bit alpha channel
265 srcVectorAlpha = _mm_add_epi32(srcVectorAlpha, _mm_set1_epi32(128));
266 srcVectorAlpha = _mm_sub_epi32(srcVectorAlpha, _mm_srli_epi32(srcVectorAlpha, 8));
267 srcVectorAlpha = _mm_srli_epi32(srcVectorAlpha, 8);
268 srcVectorAlpha = _mm_slli_epi32(srcVectorAlpha, 24);
269 const __m128 ia = reciprocal_mul_ps(a, 255.0f);
270 __m128i src1 = _mm_unpacklo_epi16(srcVector1, zero);
271 __m128i src2 = _mm_unpackhi_epi16(srcVector1, zero);
272 __m128i src3 = _mm_unpacklo_epi16(srcVector2, zero);
273 __m128i src4 = _mm_unpackhi_epi16(srcVector2, zero);
274 __m128 ia1 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(0, 0, 0, 0));
275 __m128 ia2 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(1, 1, 1, 1));
276 __m128 ia3 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(2, 2, 2, 2));
277 __m128 ia4 = _mm_shuffle_ps(ia, ia, _MM_SHUFFLE(3, 3, 3, 3));
278 src1 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src1), ia1));
279 src2 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src2), ia2));
280 src3 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src3), ia3));
281 src4 = _mm_cvtps_epi32(_mm_mul_ps(_mm_cvtepi32_ps(src4), ia4));
282 src1 = _mm_packus_epi32(src1, src2);
283 src3 = _mm_packus_epi32(src3, src4);
284 // Handle potential alpha == 0 values:
285 __m128i srcVector1AlphaMask = _mm_cmpeq_epi64(srcVector1Alpha, zero);
286 __m128i srcVector2AlphaMask = _mm_cmpeq_epi64(srcVector2Alpha, zero);
287 src1 = _mm_andnot_si128(srcVector1AlphaMask, src1);
288 src3 = _mm_andnot_si128(srcVector2AlphaMask, src3);
289 src1 = _mm_packus_epi16(src1, src3);
290 // Fixup alpha values:
291 src1 = _mm_blendv_epi8(src1, srcVectorAlpha, alphaMask32);
292 // Fix RGB order
293 if (!RGBA)
294 src1 = _mm_shuffle_epi8(src1, rgbaMask);
295 _mm_storeu_si128((__m128i *)&buffer[i], src1);
296 } else {
297 __m128i src1 = _mm_unpacklo_epi16(srcVector1, zero);
298 __m128i src2 = _mm_unpackhi_epi16(srcVector1, zero);
299 __m128i src3 = _mm_unpacklo_epi16(srcVector2, zero);
300 __m128i src4 = _mm_unpackhi_epi16(srcVector2, zero);
301 src1 = _mm_add_epi32(src1, _mm_set1_epi32(128));
302 src2 = _mm_add_epi32(src2, _mm_set1_epi32(128));
303 src3 = _mm_add_epi32(src3, _mm_set1_epi32(128));
304 src4 = _mm_add_epi32(src4, _mm_set1_epi32(128));
305 src1 = _mm_sub_epi32(src1, _mm_srli_epi32(src1, 8));
306 src2 = _mm_sub_epi32(src2, _mm_srli_epi32(src2, 8));
307 src3 = _mm_sub_epi32(src3, _mm_srli_epi32(src3, 8));
308 src4 = _mm_sub_epi32(src4, _mm_srli_epi32(src4, 8));
309 src1 = _mm_srli_epi32(src1, 8);
310 src2 = _mm_srli_epi32(src2, 8);
311 src3 = _mm_srli_epi32(src3, 8);
312 src4 = _mm_srli_epi32(src4, 8);
313 src1 = _mm_packus_epi32(src1, src2);
314 src3 = _mm_packus_epi32(src3, src4);
315 src1 = _mm_packus_epi16(src1, src3);
316 if (!RGBA)
317 src1 = _mm_shuffle_epi8(src1, rgbaMask);
318 _mm_storeu_si128((__m128i *)&buffer[i], src1);
319 }
320 } else {
321 _mm_storeu_si128((__m128i *)&buffer[i], zero);
322 }
323 }
324
325 SIMD_EPILOGUE(i, count, 3) {
326 buffer[i] = qConvertRgba64ToRgb32_sse4<RGBA ? PixelOrderRGB : PixelOrderBGR>(src[i]);
327 }
328}
329
330#ifndef __AVX2__
331void QT_FASTCALL convertARGB32ToARGB32PM_sse4(uint *buffer, int count, const QList<QRgb> *)
332{
333 convertARGBToARGB32PM_sse4<false>(buffer, buffer, count);
334}
335
336void QT_FASTCALL convertRGBA8888ToARGB32PM_sse4(uint *buffer, int count, const QList<QRgb> *)
337{
338 convertARGBToARGB32PM_sse4<true>(buffer, buffer, count);
339}
340
341const QRgba64 * QT_FASTCALL convertARGB32ToRGBA64PM_sse4(QRgba64 *buffer, const uint *src, int count,
342 const QList<QRgb> *, QDitherInfo *)
343{
344 convertARGBToRGBA64PM_sse4<false>(buffer, src, count);
345 return buffer;
346}
347
348const QRgba64 * QT_FASTCALL convertRGBA8888ToRGBA64PM_sse4(QRgba64 *buffer, const uint *src, int count,
349 const QList<QRgb> *, QDitherInfo *)
350{
351 convertARGBToRGBA64PM_sse4<true>(buffer, src, count);
352 return buffer;
353}
354
355const uint *QT_FASTCALL fetchARGB32ToARGB32PM_sse4(uint *buffer, const uchar *src, int index, int count,
356 const QList<QRgb> *, QDitherInfo *)
357{
358 convertARGBToARGB32PM_sse4<false>(buffer, reinterpret_cast<const uint *>(src) + index, count);
359 return buffer;
360}
361
362const uint *QT_FASTCALL fetchRGBA8888ToARGB32PM_sse4(uint *buffer, const uchar *src, int index, int count,
363 const QList<QRgb> *, QDitherInfo *)
364{
365 convertARGBToARGB32PM_sse4<true>(buffer, reinterpret_cast<const uint *>(src) + index, count);
366 return buffer;
367}
368
369const QRgba64 *QT_FASTCALL fetchARGB32ToRGBA64PM_sse4(QRgba64 *buffer, const uchar *src, int index, int count,
370 const QList<QRgb> *, QDitherInfo *)
371{
372 convertARGBToRGBA64PM_sse4<false>(buffer, reinterpret_cast<const uint *>(src) + index, count);
373 return buffer;
374}
375
376const QRgba64 *QT_FASTCALL fetchRGBA8888ToRGBA64PM_sse4(QRgba64 *buffer, const uchar *src, int index, int count,
377 const QList<QRgb> *, QDitherInfo *)
378{
379 convertARGBToRGBA64PM_sse4<true>(buffer, reinterpret_cast<const uint *>(src) + index, count);
380 return buffer;
381}
382#endif // __AVX2__
383
384void QT_FASTCALL storeRGB32FromARGB32PM_sse4(uchar *dest, const uint *src, int index, int count,
385 const QList<QRgb> *, QDitherInfo *)
386{
387 uint *d = reinterpret_cast<uint *>(dest) + index;
388 convertARGBFromARGB32PM_sse4<false,true>(d, src, count);
389}
390
391void QT_FASTCALL storeARGB32FromARGB32PM_sse4(uchar *dest, const uint *src, int index, int count,
392 const QList<QRgb> *, QDitherInfo *)
393{
394 uint *d = reinterpret_cast<uint *>(dest) + index;
395 convertARGBFromARGB32PM_sse4<false,false>(d, src, count);
396}
397
398void QT_FASTCALL storeRGBA8888FromARGB32PM_sse4(uchar *dest, const uint *src, int index, int count,
399 const QList<QRgb> *, QDitherInfo *)
400{
401 uint *d = reinterpret_cast<uint *>(dest) + index;
402 convertARGBFromARGB32PM_sse4<true,false>(d, src, count);
403}
404
405void QT_FASTCALL storeRGBXFromARGB32PM_sse4(uchar *dest, const uint *src, int index, int count,
406 const QList<QRgb> *, QDitherInfo *)
407{
408 uint *d = reinterpret_cast<uint *>(dest) + index;
409 convertARGBFromARGB32PM_sse4<true,true>(d, src, count);
410}
411
412template<QtPixelOrder PixelOrder>
413void QT_FASTCALL storeA2RGB30PMFromARGB32PM_sse4(uchar *dest, const uint *src, int index, int count,
414 const QList<QRgb> *, QDitherInfo *)
415{
416 uint *d = reinterpret_cast<uint *>(dest) + index;
417 for (int i = 0; i < count; ++i)
418 d[i] = qConvertArgb32ToA2rgb30_sse4<PixelOrder>(src[i]);
419}
420
421#if QT_CONFIG(raster_64bit)
422void QT_FASTCALL destStore64ARGB32_sse4(QRasterBuffer *rasterBuffer, int x, int y, const QRgba64 *buffer, int length)
423{
424 uint *dest = (uint*)rasterBuffer->scanLine(y) + x;
425 convertARGBFromRGBA64PM_sse4<false>(dest, buffer, length);
426}
427
428void QT_FASTCALL destStore64RGBA8888_sse4(QRasterBuffer *rasterBuffer, int x, int y, const QRgba64 *buffer, int length)
429{
430 uint *dest = (uint*)rasterBuffer->scanLine(y) + x;
431 convertARGBFromRGBA64PM_sse4<true>(dest, buffer, length);
432}
433#endif
434
435void QT_FASTCALL storeARGB32FromRGBA64PM_sse4(uchar *dest, const QRgba64 *src, int index, int count,
436 const QList<QRgb> *, QDitherInfo *)
437{
438 uint *d = (uint*)dest + index;
439 convertARGBFromRGBA64PM_sse4<false>(d, src, count);
440}
441
442void QT_FASTCALL storeRGBA8888FromRGBA64PM_sse4(uchar *dest, const QRgba64 *src, int index, int count,
443 const QList<QRgb> *, QDitherInfo *)
444{
445 uint *d = (uint*)dest + index;
446 convertARGBFromRGBA64PM_sse4<true>(d, src, count);
447}
448
449template
450void QT_FASTCALL storeA2RGB30PMFromARGB32PM_sse4<PixelOrderBGR>(uchar *dest, const uint *src, int index, int count,
451 const QList<QRgb> *, QDitherInfo *);
452template
453void QT_FASTCALL storeA2RGB30PMFromARGB32PM_sse4<PixelOrderRGB>(uchar *dest, const uint *src, int index, int count,
454 const QList<QRgb> *, QDitherInfo *);
455
456QT_END_NAMESPACE
457
458#endif
459