Line | Source | Count |
1 | | - |
2 | | - |
3 | | - |
4 | | - |
5 | | - |
6 | | - |
7 | | - |
8 | | - |
9 | | - |
10 | | - |
11 | | - |
12 | | - |
13 | | - |
14 | | - |
15 | | - |
16 | | - |
17 | | - |
18 | | - |
19 | | - |
20 | | - |
21 | | - |
22 | | - |
23 | | - |
24 | | - |
25 | | - |
26 | | - |
27 | | - |
28 | | - |
29 | | - |
30 | | - |
31 | | - |
32 | | - |
33 | | - |
34 | #include <qimage.h> | - |
35 | #include <private/qimage_p.h> | - |
36 | #include <private/qsimd_p.h> | - |
37 | | - |
38 | #ifdef QT_COMPILER_SUPPORTS_SSSE3 | - |
39 | | - |
40 | QT_BEGIN_NAMESPACE | - |
41 | | - |
42 | | - |
43 | | - |
44 | | - |
45 | Q_GUI_EXPORT void QT_FASTCALL qt_convert_rgb888_to_rgb32_ssse3(quint32 *dst, const uchar *src, int len) | - |
46 | { | - |
47 | quint32 *const end = dst + len; | - |
48 | | - |
49 | | - |
50 | | - |
51 | const int offsetToAlignOn16Bytes = (4 - ((reinterpret_cast<quintptr>(dst) >> 2) & 0x3)) & 0x3; | - |
52 | const int prologLength = qMin(len, offsetToAlignOn16Bytes); | - |
53 | | - |
54 | for (int i = 0; i < prologLength; ++i) {TRUE | never evaluated | FALSE | never evaluated |
| 0 |
55 | *dst++ = qRgb(src[0], src[1], src[2]); | - |
56 | src += 3; | - |
57 | } never executed: end of block | 0 |
58 | | - |
59 | | - |
60 | const __m128i shuffleMask = _mm_set_epi8(char(0xff), 9, 10, 11, char(0xff), 6, 7, 8, char(0xff), 3, 4, 5, char(0xff), 0, 1, 2); | - |
61 | | - |
62 | | - |
63 | const __m128i shuffleMaskEnd = _mm_set_epi8(char(0xff), 13, 14, 15, char(0xff), 10, 11, 12, char(0xff), 7, 8, 9, char(0xff), 4, 5, 6); | - |
64 | | - |
65 | | - |
66 | const __m128i alphaMask = _mm_set1_epi32(0xff000000); | - |
67 | | - |
68 | const __m128i *inVectorPtr = (const __m128i *)src; | - |
69 | __m128i *dstVectorPtr = (__m128i *)dst; | - |
70 | | - |
71 | const int simdRoundCount = (len - prologLength) / 16; | - |
72 | for (int i = 0; i < simdRoundCount; ++i) {TRUE | never evaluated | FALSE | never evaluated |
| 0 |
73 | | - |
74 | | - |
75 | | - |
76 | | - |
77 | | - |
78 | | - |
79 | | - |
80 | | - |
81 | | - |
82 | | - |
83 | __m128i firstSrcVector = _mm_lddqu_si128(inVectorPtr); | - |
84 | __m128i outputVector = _mm_shuffle_epi8(firstSrcVector, shuffleMask); | - |
85 | _mm_store_si128(dstVectorPtr, _mm_or_si128(outputVector, alphaMask)); | - |
86 | ++inVectorPtr; | - |
87 | ++dstVectorPtr; | - |
88 | | - |
89 | | - |
90 | | - |
91 | __m128i secondSrcVector = _mm_lddqu_si128(inVectorPtr); | - |
92 | __m128i srcVector = _mm_alignr_epi8(secondSrcVector, firstSrcVector, 12); | - |
93 | outputVector = _mm_shuffle_epi8(srcVector, shuffleMask); | - |
94 | _mm_store_si128(dstVectorPtr, _mm_or_si128(outputVector, alphaMask)); | - |
95 | ++inVectorPtr; | - |
96 | ++dstVectorPtr; | - |
97 | firstSrcVector = secondSrcVector; | - |
98 | | - |
99 | | - |
100 | secondSrcVector = _mm_lddqu_si128(inVectorPtr); | - |
101 | srcVector = _mm_alignr_epi8(secondSrcVector, firstSrcVector, 8); | - |
102 | outputVector = _mm_shuffle_epi8(srcVector, shuffleMask); | - |
103 | _mm_store_si128(dstVectorPtr, _mm_or_si128(outputVector, alphaMask)); | - |
104 | ++inVectorPtr; | - |
105 | ++dstVectorPtr; | - |
106 | | - |
107 | | - |
108 | | - |
109 | outputVector = _mm_shuffle_epi8(secondSrcVector, shuffleMaskEnd); | - |
110 | _mm_store_si128(dstVectorPtr, _mm_or_si128(outputVector, alphaMask)); | - |
111 | ++dstVectorPtr; | - |
112 | } never executed: end of block | 0 |
113 | src = (const uchar *)inVectorPtr; | - |
114 | dst = (quint32 *)dstVectorPtr; | - |
115 | | - |
116 | while (dst != end) {TRUE | never evaluated | FALSE | never evaluated |
| 0 |
117 | *dst++ = qRgb(src[0], src[1], src[2]); | - |
118 | src += 3; | - |
119 | } never executed: end of block | 0 |
120 | } never executed: end of block | 0 |
121 | | - |
122 | void convert_RGB888_to_RGB32_ssse3(QImageData *dest, const QImageData *src, Qt::ImageConversionFlags) | - |
123 | { | - |
124 | Q_ASSERT(src->format == QImage::Format_RGB888); | - |
125 | Q_ASSERT(dest->format == QImage::Format_RGB32 || dest->format == QImage::Format_ARGB32 || dest->format == QImage::Format_ARGB32_Premultiplied); | - |
126 | Q_ASSERT(src->width == dest->width); | - |
127 | Q_ASSERT(src->height == dest->height); | - |
128 | | - |
129 | const uchar *src_data = (uchar *) src->data; | - |
130 | quint32 *dest_data = (quint32 *) dest->data; | - |
131 | | - |
132 | for (int i = 0; i < src->height; ++i) {TRUE | never evaluated | FALSE | never evaluated |
| 0 |
133 | qt_convert_rgb888_to_rgb32_ssse3(dest_data, src_data, src->width); | - |
134 | src_data += src->bytes_per_line; | - |
135 | dest_data = (quint32 *)((uchar*)dest_data + dest->bytes_per_line); | - |
136 | } never executed: end of block | 0 |
137 | } never executed: end of block | 0 |
138 | | - |
139 | QT_END_NAMESPACE | - |
140 | | - |
141 | #endif // QT_COMPILER_SUPPORTS_SSSE3 | - |
| | |