Mercurial > hg > dmlib
annotate dmblitfunc.h @ 14:a40c266a71a2
Bitshift less in dmScaledBlitSurface32to32TransparentX()
author | Matti Hamalainen <ccr@tnsp.org> |
---|---|
date | Fri, 28 Sep 2012 10:48:57 +0300 |
parents | 07bace8425d9 |
children | a60fe802636a |
rev | line source |
---|---|
/*
 * DMLib
 * -- Sprite / surface blitting functions
 * Programmed and designed by Matti 'ccr' Hamalainen
 * (C) Copyright 2011-2012 Tecnic Software productions (TNSP)
 */
7 | |
// =======================================================================
// DMD_NONE
// =======================================================================
11 | |
12 #define DM_SCALED_NAME dmScaledBlitSurface8to8 | |
13 #define DM_SCALED_SRC_BYTES 1 | |
14 #define DM_SCALED_DST_BYTES 1 | |
15 #define DM_SCALED_SRC_TYPE Uint8 | |
16 #define DM_SCALED_DST_TYPE Uint8 | |
17 | |
18 #define DM_SCALED_INNER *dp++ = sp[FP_GETH(xv)]; | |
19 | |
20 #include "dmscaledblit.h" | |
21 | |
// -----------------------------------------------------------------------
23 | |
24 #define DM_SCALED_NAME dmScaledBlitSurface8to32 | |
25 #define DM_SCALED_SRC_BYTES 1 | |
26 #define DM_SCALED_DST_BYTES 4 | |
27 #define DM_SCALED_SRC_TYPE Uint8 | |
28 #define DM_SCALED_DST_TYPE Uint32 | |
29 | |
30 #define DM_SCALED_VARS const Uint32 *pal; | |
31 #define DM_SCALED_INIT \ | |
32 if (src->format->palette == NULL || src->format->palette->ncolors < 256) return -2; \ | |
33 pal = (Uint32 *) src->format->palette->colors; | |
34 | |
35 #define DM_SCALED_INNER *dp++ = pal[sp[FP_GETH(xv)]]; | |
36 | |
37 #include "dmscaledblit.h" | |
38 | |
// -----------------------------------------------------------------------
40 | |
41 #define DM_SCALED_NAME dmScaledBlitSurface32to32 | |
42 #define DM_SCALED_SRC_BYTES 4 | |
43 #define DM_SCALED_DST_BYTES 4 | |
44 #define DM_SCALED_SRC_TYPE Uint32 | |
45 #define DM_SCALED_DST_TYPE Uint32 | |
46 #define DM_SCALED_INIT | |
47 | |
48 #define DM_SCALED_INNER *dp++ = sp[FP_GETH(xv)]; | |
49 | |
50 #include "dmscaledblit.h" | |
51 | |
52 | |
// =======================================================================
// DMD_TRANSPARENT
// =======================================================================
56 | |
57 #define DM_SCALED_NAME dmScaledBlitSurface8to8Transparent | |
58 #define DM_SCALED_SRC_BYTES 1 | |
59 #define DM_SCALED_DST_BYTES 1 | |
60 #define DM_SCALED_SRC_TYPE Uint8 | |
61 #define DM_SCALED_DST_TYPE Uint8 | |
62 | |
63 #define DM_SCALED_INNER \ | |
64 *dp = sp[FP_GETH(xv)] ? sp[FP_GETH(xv)] : *dp; dp++; | |
65 | |
66 #include "dmscaledblit.h" | |
67 | |
// -----------------------------------------------------------------------
69 | |
70 #define DM_SCALED_NAME dmScaledBlitSurface8to32Transparent | |
71 #define DM_SCALED_SRC_BYTES 1 | |
72 #define DM_SCALED_DST_BYTES 4 | |
73 #define DM_SCALED_SRC_TYPE Uint8 | |
74 #define DM_SCALED_DST_TYPE DMRGBA32 | |
75 #define DM_SCALED_VARS const DMRGBA32 *pal; | |
76 #define DM_SCALED_INIT \ | |
77 if (src->format->palette == NULL || src->format->palette->ncolors < 256) return -2; \ | |
78 pal = (DMRGBA32 *) src->format->palette->colors; | |
79 | |
80 #define DM_SCALED_INNER \ | |
81 const DMRGBA32 q = pal[sp[FP_GETH(xv)]]; \ | |
82 dp->r += ((q.r - dp->r) * q.a) >> 8; \ | |
83 dp->g += ((q.g - dp->g) * q.a) >> 8; \ | |
84 dp->b += ((q.b - dp->b) * q.a) >> 8; \ | |
85 dp->a = q.a; \ | |
86 dp++; | |
87 | |
88 #include "dmscaledblit.h" | |
89 | |
90 | |
// -----------------------------------------------------------------------
92 | |
93 #define DM_SCALED_NAME dmScaledBlitSurface32to32Transparent | |
94 #define DM_SCALED_SRC_BYTES 4 | |
95 #define DM_SCALED_DST_BYTES 4 | |
96 #define DM_SCALED_INIT | |
97 | |
98 #ifdef DM_USE_SIMD | |
99 #define DM_SCALED_INNER_INIT \ | |
12
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
100 const Uint32 qpdmask = 0xff000000; \ |
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
101 const Uint64 qpdrm = 0xff00ff00ff00ffULL; |
0 | 102 |
103 #define DM_SCALED_SRC_TYPE Uint32 | |
104 #define DM_SCALED_DST_TYPE Uint32 | |
105 #define DM_SCALED_INNER \ | |
106 asm( \ | |
107 "movd %2, %%mm1\n" \ | |
12
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
108 \ |
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
109 "movd %3, %%mm2\n" \ |
13
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
110 "movq %%mm1, %%mm5\n" \ |
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
111 "pand %%mm2, %%mm5\n" \ |
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
112 "psrlw $8, %%mm5\n" \ |
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
113 "punpcklwd %%mm5, %%mm5\n" \ |
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
114 "punpckhwd %%mm5, %%mm5\n" \ |
0 | 115 \ |
13
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
116 "pxor %%mm2, %%mm2\n" \ |
0 | 117 "movd %1, %%mm3\n" \ |
118 "punpcklbw %%mm2, %%mm1\n" \ | |
13
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
119 "punpcklbw %%mm2, %%mm3\n" \ |
12
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
120 \ |
0 | 121 "psubw %%mm3, %%mm1\n" \ |
12
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
122 "pmullw %%mm5, %%mm1\n" \ |
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
123 "psraw $8, %%mm1\n" \ |
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
124 "paddw %%mm3, %%mm1\n" \ |
13
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
125 "pand %4, %%mm1\n" \ |
0 | 126 "packuswb %%mm2, %%mm1\n" \ |
127 "movd %%mm1, %0\n" \ | |
128 : "=m" (*dp) \ | |
12
35b0c83af3ca
MMX-version of scaled 32-bit RGBA alpha blending blit works now.
Matti Hamalainen <ccr@tnsp.org>
parents:
10
diff
changeset
|
129 : "m" (*dp), "m" (sp[FP_GETH(xv)]), "m" (qpdmask), "m" (qpdrm) \ |
0 | 130 : "memory" ); dp++; |
131 | |
132 #define DM_SCALED_FINISH asm("emms\n"); | |
13
07bace8425d9
Optimize the scaled RGBA alpha blit MMX version further.
Matti Hamalainen <ccr@tnsp.org>
parents:
12
diff
changeset
|
133 |
0 | 134 #else |
135 #define DM_SCALED_SRC_TYPE DMRGBA32 | |
136 #define DM_SCALED_DST_TYPE DMRGBA32 | |
137 #define DM_SCALED_INNER \ | |
138 const DMRGBA32 q = sp[FP_GETH(xv)]; \ | |
139 dp->r += ((q.r - dp->r) * q.a) >> 8; \ | |
140 dp->g += ((q.g - dp->g) * q.a) >> 8; \ | |
141 dp->b += ((q.b - dp->b) * q.a) >> 8; \ | |
142 dp->a = q.a; \ | |
143 dp++; | |
144 #endif | |
145 | |
146 #include "dmscaledblit.h" | |
147 | |
// -----------------------------------------------------------------------
149 | |
150 #define DM_SCALED_NAME dmScaledBlitSurface32to32TransparentX | |
151 #define DM_SCALED_SRC_BYTES 4 | |
152 #define DM_SCALED_DST_BYTES 4 | |
153 #define DM_SCALED_SRC_TYPE DMRGBA32 | |
154 #define DM_SCALED_DST_TYPE DMRGBA32 | |
155 #define DM_SCALED_INIT | |
156 | |
157 #define DM_SCALED_INNER \ | |
158 const DMRGBA32 q = sp[FP_GETH(xv)]; \ | |
14
a40c266a71a2
Bitshift less in dmScaledBlitSurface32to32TransparentX()
Matti Hamalainen <ccr@tnsp.org>
parents:
13
diff
changeset
|
159 dp->r = (q.r * q.a + dp->r * dp->a) >> 8; \ |
a40c266a71a2
Bitshift less in dmScaledBlitSurface32to32TransparentX()
Matti Hamalainen <ccr@tnsp.org>
parents:
13
diff
changeset
|
160 dp->g = (q.g * q.a + dp->g * dp->a) >> 8; \ |
a40c266a71a2
Bitshift less in dmScaledBlitSurface32to32TransparentX()
Matti Hamalainen <ccr@tnsp.org>
parents:
13
diff
changeset
|
161 dp->b = (q.b * q.a + dp->b * dp->a) >> 8; \ |
0 | 162 dp->a = q.a ? q.a : dp->a; \ |
163 dp++; | |
164 | |
165 #include "dmscaledblit.h" | |
166 | |
167 | |
// =======================================================================
// DMD_SATURATE
// =======================================================================
171 | |
172 #define DM_SCALED_NAME dmScaledBlitSurface8to8Saturate | |
173 #define DM_SCALED_SRC_BYTES 1 | |
174 #define DM_SCALED_DST_BYTES 1 | |
175 #define DM_SCALED_SRC_TYPE Uint8 | |
176 #define DM_SCALED_DST_TYPE Uint8 | |
177 #define DM_SCALED_INNER *(dp++) += sp[FP_GETH(xv)]; | |
178 #include "dmscaledblit.h" | |
179 | |
// -----------------------------------------------------------------------
181 | |
182 #define DM_SCALED_NAME dmScaledBlitSurface8to32Saturate | |
183 #define DM_SCALED_SRC_BYTES 1 | |
184 #define DM_SCALED_DST_BYTES 4 | |
185 #define DM_SCALED_SRC_TYPE Uint8 | |
186 #define DM_SCALED_DST_TYPE DMRGBA32 | |
187 #define DM_SCALED_VARS const DMRGBA32 *pal; | |
188 #define DM_SCALED_INIT \ | |
189 if (src->format->palette == NULL || src->format->palette->ncolors < 256) return -2; \ | |
190 pal = (DMRGBA32 *) src->format->palette->colors; | |
191 | |
192 #ifdef DM_USE_SIMD | |
193 #define DM_SCALED_INNER \ | |
194 asm("movd %2, %%mm1\n" \ | |
195 "movd %1, %%mm2\n" \ | |
196 "paddusb %%mm2, %%mm1\n" \ | |
197 "movd %%mm1, %0\n" \ | |
198 : "=m" (*dp) \ | |
199 : "m" (*dp), "m" (pal[sp[FP_GETH(xv)]]) \ | |
200 : "memory" ); dp++; | |
201 | |
202 #define DM_SCALED_FINISH asm("emms\n"); | |
203 #else | |
204 #define DM_SCALED_INNER \ | |
205 const DMRGBA32 q = pal[sp[FP_GETH(xv)]]; \ | |
206 const int qr = dp->r + q.r, qg = dp->g + q.g, qb = dp->b + q.b; \ | |
207 dp->r = qr < 256 ? qr : 255; \ | |
208 dp->g = qg < 256 ? qg : 255; \ | |
209 dp->b = qb < 256 ? qb : 255; \ | |
210 dp->a = q.a; \ | |
211 dp++; | |
212 #endif | |
213 | |
214 #include "dmscaledblit.h" | |
215 | |
// -----------------------------------------------------------------------
217 | |
218 #define DM_SCALED_NAME dmScaledBlitSurface32to32Saturate | |
219 #define DM_SCALED_SRC_BYTES 4 | |
220 #define DM_SCALED_DST_BYTES 4 | |
221 #define DM_SCALED_INIT | |
222 | |
223 #ifdef DM_USE_SIMD | |
224 #define DM_SCALED_SRC_TYPE Uint32 | |
225 #define DM_SCALED_DST_TYPE Uint32 | |
226 #define DM_SCALED_INNER \ | |
227 asm("movd %2, %%mm1\n" \ | |
228 "movd %1, %%mm2\n" \ | |
229 "paddusb %%mm2, %%mm1\n" \ | |
230 "movd %%mm1, %0\n" \ | |
231 : "=m" (*dp) \ | |
232 : "m" (*dp), "m" (sp[FP_GETH(xv)]) \ | |
233 : "memory" ); dp++; | |
234 | |
235 #define DM_SCALED_FINISH asm("emms\n"); | |
236 #else | |
237 #define DM_SCALED_SRC_TYPE DMRGBA32 | |
238 #define DM_SCALED_DST_TYPE DMRGBA32 | |
239 #define DM_SCALED_INNER \ | |
240 const DMRGBA32 q = sp[FP_GETH(xv)]; \ | |
241 const int qr = dp->r + q.r, qg = dp->g + q.g, qb = dp->b + q.b; \ | |
242 dp->r = qr < 256 ? qr : 255; \ | |
243 dp->g = qg < 256 ? qg : 255; \ | |
244 dp->b = qb < 256 ? qb : 255; \ | |
245 dp->a = q.a; \ | |
246 dp++; | |
247 #endif | |
248 | |
249 #include "dmscaledblit.h" | |
250 | |
251 | |
// =======================================================================
// =======================================================================