OpenTTD Source  1.11.0-beta2
32bpp_anim_sse4.cpp
Go to the documentation of this file.
1 /*
2  * This file is part of OpenTTD.
3  * OpenTTD is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, version 2.
4  * OpenTTD is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
5  * See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with OpenTTD. If not, see <http://www.gnu.org/licenses/>.
6  */
7 
10 #ifdef WITH_SSE
11 
12 #include "../stdafx.h"
13 #include "../video/video_driver.hpp"
14 #include "../table/sprites.h"
15 #include "32bpp_anim_sse4.hpp"
16 #include "32bpp_sse_func.hpp"
17 
18 #include "../safeguards.h"
19 
21 static FBlitter_32bppSSE4_Anim iFBlitter_32bppSSE4_Anim;
22 
30 IGNORE_UNINITIALIZED_WARNING_START
31 template <BlitterMode mode, Blitter_32bppSSE2::ReadMode read_mode, Blitter_32bppSSE2::BlockType bt_last, bool translucent, bool animated>
32 inline void Blitter_32bppSSE4_Anim::Draw(const Blitter::BlitterParams *bp, ZoomLevel zoom)
33 {
34  const byte * const remap = bp->remap;
35  Colour *dst_line = (Colour *) bp->dst + bp->top * bp->pitch + bp->left;
36  uint16 *anim_line = this->anim_buf + this->ScreenToAnimOffset((uint32 *)bp->dst) + bp->top * this->anim_buf_pitch + bp->left;
37  int effective_width = bp->width;
38 
39  /* Find where to start reading in the source sprite. */
40  const Blitter_32bppSSE_Base::SpriteData * const sd = (const Blitter_32bppSSE_Base::SpriteData *) bp->sprite;
41  const SpriteInfo * const si = &sd->infos[zoom];
42  const MapValue *src_mv_line = (const MapValue *) &sd->data[si->mv_offset] + bp->skip_top * si->sprite_width;
43  const Colour *src_rgba_line = (const Colour *) ((const byte *) &sd->data[si->sprite_offset] + bp->skip_top * si->sprite_line_size);
44 
45  if (read_mode != RM_WITH_MARGIN) {
46  src_rgba_line += bp->skip_left;
47  src_mv_line += bp->skip_left;
48  }
49  const MapValue *src_mv = src_mv_line;
50 
51  /* Load these variables into register before loop. */
52  const __m128i a_cm = ALPHA_CONTROL_MASK;
53  const __m128i pack_low_cm = PACK_LOW_CONTROL_MASK;
54  const __m128i tr_nom_base = TRANSPARENT_NOM_BASE;
55 
56  for (int y = bp->height; y != 0; y--) {
57  Colour *dst = dst_line;
58  const Colour *src = src_rgba_line + META_LENGTH;
59  if (mode != BM_TRANSPARENT) src_mv = src_mv_line;
60  uint16 *anim = anim_line;
61 
62  if (read_mode == RM_WITH_MARGIN) {
63  assert(bt_last == BT_NONE); // or you must ensure block type is preserved
64  anim += src_rgba_line[0].data;
65  src += src_rgba_line[0].data;
66  dst += src_rgba_line[0].data;
67  if (mode != BM_TRANSPARENT) src_mv += src_rgba_line[0].data;
68  const int width_diff = si->sprite_width - bp->width;
69  effective_width = bp->width - (int) src_rgba_line[0].data;
70  const int delta_diff = (int) src_rgba_line[1].data - width_diff;
71  const int new_width = effective_width - delta_diff;
72  effective_width = delta_diff > 0 ? new_width : effective_width;
73  if (effective_width <= 0) goto next_line;
74  }
75 
76  switch (mode) {
77  default:
78  if (!translucent) {
79  for (uint x = (uint) effective_width; x > 0; x--) {
80  if (src->a) {
81  if (animated) {
82  *anim = *(const uint16*) src_mv;
83  *dst = (src_mv->m >= PALETTE_ANIM_START) ? AdjustBrightneSSE(this->LookupColourInPalette(src_mv->m), src_mv->v) : src->data;
84  } else {
85  *anim = 0;
86  *dst = *src;
87  }
88  }
89  if (animated) src_mv++;
90  anim++;
91  src++;
92  dst++;
93  }
94  break;
95  }
96 
97  for (uint x = (uint) effective_width/2; x != 0; x--) {
98  uint32 mvX2 = *((uint32 *) const_cast<MapValue *>(src_mv));
99  __m128i srcABCD = _mm_loadl_epi64((const __m128i*) src);
100  __m128i dstABCD = _mm_loadl_epi64((__m128i*) dst);
101 
102  if (animated) {
103  /* Remap colours. */
104  const byte m0 = mvX2;
105  if (m0 >= PALETTE_ANIM_START) {
106  const Colour c0 = (this->LookupColourInPalette(m0).data & 0x00FFFFFF) | (src[0].data & 0xFF000000);
107  InsertFirstUint32(AdjustBrightneSSE(c0, (byte) (mvX2 >> 8)).data, srcABCD);
108  }
109  const byte m1 = mvX2 >> 16;
110  if (m1 >= PALETTE_ANIM_START) {
111  const Colour c1 = (this->LookupColourInPalette(m1).data & 0x00FFFFFF) | (src[1].data & 0xFF000000);
112  InsertSecondUint32(AdjustBrightneSSE(c1, (byte) (mvX2 >> 24)).data, srcABCD);
113  }
114 
115  /* Update anim buffer. */
116  const byte a0 = src[0].a;
117  const byte a1 = src[1].a;
118  uint32 anim01 = 0;
119  if (a0 == 255) {
120  if (a1 == 255) {
121  *(uint32*) anim = mvX2;
122  goto bmno_full_opacity;
123  }
124  anim01 = (uint16) mvX2;
125  } else if (a0 == 0) {
126  if (a1 == 0) {
127  goto bmno_full_transparency;
128  } else {
129  if (a1 == 255) anim[1] = (uint16) (mvX2 >> 16);
130  goto bmno_alpha_blend;
131  }
132  }
133  if (a1 > 0) {
134  if (a1 == 255) anim01 |= mvX2 & 0xFFFF0000;
135  *(uint32*) anim = anim01;
136  } else {
137  anim[0] = (uint16) anim01;
138  }
139  } else {
140  if (src[0].a) anim[0] = 0;
141  if (src[1].a) anim[1] = 0;
142  }
143 
144  /* Blend colours. */
145 bmno_alpha_blend:
146  srcABCD = AlphaBlendTwoPixels(srcABCD, dstABCD, a_cm, pack_low_cm);
147 bmno_full_opacity:
148  _mm_storel_epi64((__m128i *) dst, srcABCD);
149 bmno_full_transparency:
150  src_mv += 2;
151  src += 2;
152  anim += 2;
153  dst += 2;
154  }
155 
156  if ((bt_last == BT_NONE && effective_width & 1) || bt_last == BT_ODD) {
157  if (src->a == 0) {
158  } else if (src->a == 255) {
159  *anim = *(const uint16*) src_mv;
160  *dst = (src_mv->m >= PALETTE_ANIM_START) ? AdjustBrightneSSE(LookupColourInPalette(src_mv->m), src_mv->v) : *src;
161  } else {
162  *anim = 0;
163  __m128i srcABCD;
164  __m128i dstABCD = _mm_cvtsi32_si128(dst->data);
165  if (src_mv->m >= PALETTE_ANIM_START) {
166  Colour colour = AdjustBrightneSSE(LookupColourInPalette(src_mv->m), src_mv->v);
167  colour.a = src->a;
168  srcABCD = _mm_cvtsi32_si128(colour.data);
169  } else {
170  srcABCD = _mm_cvtsi32_si128(src->data);
171  }
172  dst->data = _mm_cvtsi128_si32(AlphaBlendTwoPixels(srcABCD, dstABCD, a_cm, pack_low_cm));
173  }
174  }
175  break;
176 
177  case BM_COLOUR_REMAP:
178  for (uint x = (uint) effective_width / 2; x != 0; x--) {
179  uint32 mvX2 = *((uint32 *) const_cast<MapValue *>(src_mv));
180  __m128i srcABCD = _mm_loadl_epi64((const __m128i*) src);
181  __m128i dstABCD = _mm_loadl_epi64((__m128i*) dst);
182 
183  /* Remap colours. */
184  const uint m0 = (byte) mvX2;
185  const uint r0 = remap[m0];
186  const uint m1 = (byte) (mvX2 >> 16);
187  const uint r1 = remap[m1];
188  if (mvX2 & 0x00FF00FF) {
189  #define CMOV_REMAP(m_colour, m_colour_init, m_src, m_m) \
190  /* Written so the compiler uses CMOV. */ \
191  Colour m_colour = m_colour_init; \
192  { \
193  const Colour srcm = (Colour) (m_src); \
194  const uint m = (byte) (m_m); \
195  const uint r = remap[m]; \
196  const Colour cmap = (this->LookupColourInPalette(r).data & 0x00FFFFFF) | (srcm.data & 0xFF000000); \
197  m_colour = r == 0 ? m_colour : cmap; \
198  m_colour = m != 0 ? m_colour : srcm; \
199  }
200 #ifdef _SQ64
201  uint64 srcs = _mm_cvtsi128_si64(srcABCD);
202  uint64 dsts;
203  if (animated) dsts = _mm_cvtsi128_si64(dstABCD);
204  uint64 remapped_src = 0;
205  CMOV_REMAP(c0, animated ? dsts : 0, srcs, mvX2);
206  remapped_src = c0.data;
207  CMOV_REMAP(c1, animated ? dsts >> 32 : 0, srcs >> 32, mvX2 >> 16);
208  remapped_src |= (uint64) c1.data << 32;
209  srcABCD = _mm_cvtsi64_si128(remapped_src);
210 #else
211  Colour remapped_src[2];
212  CMOV_REMAP(c0, animated ? _mm_cvtsi128_si32(dstABCD) : 0, _mm_cvtsi128_si32(srcABCD), mvX2);
213  remapped_src[0] = c0.data;
214  CMOV_REMAP(c1, animated ? dst[1] : 0, src[1], mvX2 >> 16);
215  remapped_src[1] = c1.data;
216  srcABCD = _mm_loadl_epi64((__m128i*) &remapped_src);
217 #endif
218 
219  if ((mvX2 & 0xFF00FF00) != 0x80008000) srcABCD = AdjustBrightnessOfTwoPixels(srcABCD, mvX2);
220  }
221 
222  /* Update anim buffer. */
223  if (animated) {
224  const byte a0 = src[0].a;
225  const byte a1 = src[1].a;
226  uint32 anim01 = mvX2 & 0xFF00FF00;
227  if (a0 == 255) {
228  anim01 |= r0;
229  if (a1 == 255) {
230  *(uint32*) anim = anim01 | (r1 << 16);
231  goto bmcr_full_opacity;
232  }
233  } else if (a0 == 0) {
234  if (a1 == 0) {
235  goto bmcr_full_transparency;
236  } else {
237  if (a1 == 255) {
238  anim[1] = r1 | (anim01 >> 16);
239  }
240  goto bmcr_alpha_blend;
241  }
242  }
243  if (a1 > 0) {
244  if (a1 == 255) anim01 |= r1 << 16;
245  *(uint32*) anim = anim01;
246  } else {
247  anim[0] = (uint16) anim01;
248  }
249  } else {
250  if (src[0].a) anim[0] = 0;
251  if (src[1].a) anim[1] = 0;
252  }
253 
254  /* Blend colours. */
255 bmcr_alpha_blend:
256  srcABCD = AlphaBlendTwoPixels(srcABCD, dstABCD, a_cm, pack_low_cm);
257 bmcr_full_opacity:
258  _mm_storel_epi64((__m128i *) dst, srcABCD);
259 bmcr_full_transparency:
260  src_mv += 2;
261  dst += 2;
262  src += 2;
263  anim += 2;
264  }
265 
266  if ((bt_last == BT_NONE && effective_width & 1) || bt_last == BT_ODD) {
267  /* In case the m-channel is zero, do not remap this pixel in any way. */
268  __m128i srcABCD;
269  if (src->a == 0) break;
270  if (src_mv->m) {
271  const uint r = remap[src_mv->m];
272  *anim = (animated && src->a == 255) ? r | ((uint16) src_mv->v << 8 ) : 0;
273  if (r != 0) {
274  Colour remapped_colour = AdjustBrightneSSE(this->LookupColourInPalette(r), src_mv->v);
275  if (src->a == 255) {
276  *dst = remapped_colour;
277  } else {
278  remapped_colour.a = src->a;
279  srcABCD = _mm_cvtsi32_si128(remapped_colour.data);
280  goto bmcr_alpha_blend_single;
281  }
282  }
283  } else {
284  *anim = 0;
285  srcABCD = _mm_cvtsi32_si128(src->data);
286  if (src->a < 255) {
287 bmcr_alpha_blend_single:
288  __m128i dstABCD = _mm_cvtsi32_si128(dst->data);
289  srcABCD = AlphaBlendTwoPixels(srcABCD, dstABCD, a_cm, pack_low_cm);
290  }
291  dst->data = _mm_cvtsi128_si32(srcABCD);
292  }
293  }
294  break;
295 
296  case BM_TRANSPARENT:
297  /* Make the current colour a bit more black, so it looks like this image is transparent. */
298  for (uint x = (uint) bp->width / 2; x > 0; x--) {
299  __m128i srcABCD = _mm_loadl_epi64((const __m128i*) src);
300  __m128i dstABCD = _mm_loadl_epi64((__m128i*) dst);
301  _mm_storel_epi64((__m128i *) dst, DarkenTwoPixels(srcABCD, dstABCD, a_cm, tr_nom_base));
302  src += 2;
303  dst += 2;
304  anim += 2;
305  if (src[-2].a) anim[-2] = 0;
306  if (src[-1].a) anim[-1] = 0;
307  }
308 
309  if ((bt_last == BT_NONE && bp->width & 1) || bt_last == BT_ODD) {
310  __m128i srcABCD = _mm_cvtsi32_si128(src->data);
311  __m128i dstABCD = _mm_cvtsi32_si128(dst->data);
312  dst->data = _mm_cvtsi128_si32(DarkenTwoPixels(srcABCD, dstABCD, a_cm, tr_nom_base));
313  if (src[0].a) anim[0] = 0;
314  }
315  break;
316 
317  case BM_CRASH_REMAP:
318  for (uint x = (uint) bp->width; x > 0; x--) {
319  if (src_mv->m == 0) {
320  if (src->a != 0) {
321  uint8 g = MakeDark(src->r, src->g, src->b);
322  *dst = ComposeColourRGBA(g, g, g, src->a, *dst);
323  *anim = 0;
324  }
325  } else {
326  uint r = remap[src_mv->m];
327  if (r != 0) *dst = ComposeColourPANoCheck(this->AdjustBrightness(this->LookupColourInPalette(r), src_mv->v), src->a, *dst);
328  }
329  src_mv++;
330  dst++;
331  src++;
332  anim++;
333  }
334  break;
335 
336  case BM_BLACK_REMAP:
337  for (uint x = (uint) bp->width; x > 0; x--) {
338  if (src->a != 0) {
339  *dst = Colour(0, 0, 0);
340  *anim = 0;
341  }
342  src_mv++;
343  dst++;
344  src++;
345  anim++;
346  }
347  break;
348  }
349 
350 next_line:
351  if (mode != BM_TRANSPARENT) src_mv_line += si->sprite_width;
352  src_rgba_line = (const Colour*) ((const byte*) src_rgba_line + si->sprite_line_size);
353  dst_line += bp->pitch;
354  anim_line += this->anim_buf_pitch;
355  }
356 }
357 IGNORE_UNINITIALIZED_WARNING_STOP
358 
366 void Blitter_32bppSSE4_Anim::Draw(Blitter::BlitterParams *bp, BlitterMode mode, ZoomLevel zoom)
367 {
368  const Blitter_32bppSSE_Base::SpriteFlags sprite_flags = ((const Blitter_32bppSSE_Base::SpriteData *) bp->sprite)->flags;
369  switch (mode) {
370  default: {
371 bm_normal:
372  if (bp->skip_left != 0 || bp->width <= MARGIN_NORMAL_THRESHOLD) {
373  const BlockType bt_last = (BlockType) (bp->width & 1);
374  if (bt_last == BT_EVEN) {
375  if (sprite_flags & SF_NO_ANIM) Draw<BM_NORMAL, RM_WITH_SKIP, BT_EVEN, true, false>(bp, zoom);
376  else Draw<BM_NORMAL, RM_WITH_SKIP, BT_EVEN, true, true>(bp, zoom);
377  } else {
378  if (sprite_flags & SF_NO_ANIM) Draw<BM_NORMAL, RM_WITH_SKIP, BT_ODD, true, false>(bp, zoom);
379  else Draw<BM_NORMAL, RM_WITH_SKIP, BT_ODD, true, true>(bp, zoom);
380  }
381  } else {
382 #ifdef _SQ64
383  if (sprite_flags & SF_TRANSLUCENT) {
384  if (sprite_flags & SF_NO_ANIM) Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, true, false>(bp, zoom);
385  else Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, true, true>(bp, zoom);
386  } else {
387  if (sprite_flags & SF_NO_ANIM) Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, false, false>(bp, zoom);
388  else Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, false, true>(bp, zoom);
389  }
390 #else
391  if (sprite_flags & SF_NO_ANIM) Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, true, false>(bp, zoom);
392  else Draw<BM_NORMAL, RM_WITH_MARGIN, BT_NONE, true, true>(bp, zoom);
393 #endif
394  }
395  break;
396  }
397  case BM_COLOUR_REMAP:
398  if (sprite_flags & SF_NO_REMAP) goto bm_normal;
399  if (bp->skip_left != 0 || bp->width <= MARGIN_REMAP_THRESHOLD) {
400  if (sprite_flags & SF_NO_ANIM) Draw<BM_COLOUR_REMAP, RM_WITH_SKIP, BT_NONE, true, false>(bp, zoom);
401  else Draw<BM_COLOUR_REMAP, RM_WITH_SKIP, BT_NONE, true, true>(bp, zoom);
402  } else {
403  if (sprite_flags & SF_NO_ANIM) Draw<BM_COLOUR_REMAP, RM_WITH_MARGIN, BT_NONE, true, false>(bp, zoom);
404  else Draw<BM_COLOUR_REMAP, RM_WITH_MARGIN, BT_NONE, true, true>(bp, zoom);
405  }
406  break;
407  case BM_TRANSPARENT: Draw<BM_TRANSPARENT, RM_NONE, BT_NONE, true, true>(bp, zoom); return;
408  case BM_CRASH_REMAP: Draw<BM_CRASH_REMAP, RM_NONE, BT_NONE, true, true>(bp, zoom); return;
409  case BM_BLACK_REMAP: Draw<BM_BLACK_REMAP, RM_NONE, BT_NONE, true, true>(bp, zoom); return;
410  }
411 }
412 
413 #endif /* WITH_SSE */
Colour::data
uint32 data
Conversion of the channel information to a 32 bit number.
Definition: gfx_type.h:164
Blitter::BlitterParams::top
int top
The top offset in the 'dst' in pixels to start drawing.
Definition: base.hpp:42
BM_TRANSPARENT
@ BM_TRANSPARENT
Perform transparency colour remapping.
Definition: base.hpp:20
Blitter::BlitterParams::skip_left
int skip_left
How much pixels of the source to skip on the left (based on zoom of dst)
Definition: base.hpp:35
BlitterMode
BlitterMode
The modes of blitting we can do.
Definition: base.hpp:17
Blitter::BlitterParams::width
int width
The width in pixels that needs to be drawn to dst.
Definition: base.hpp:37
Blitter::BlitterParams::dst
void * dst
Destination buffer.
Definition: base.hpp:44
ZoomLevel
ZoomLevel
All zoom levels we know.
Definition: zoom_type.h:21
Blitter::BlitterParams::pitch
int pitch
The pitch of the destination buffer.
Definition: base.hpp:45
Blitter::BlitterParams::sprite
const void * sprite
Pointer to the sprite how ever the encoder stored it.
Definition: base.hpp:32
BM_COLOUR_REMAP
@ BM_COLOUR_REMAP
Perform a colour remapping.
Definition: base.hpp:19
BM_CRASH_REMAP
@ BM_CRASH_REMAP
Perform a crash remapping.
Definition: base.hpp:21
BM_BLACK_REMAP
@ BM_BLACK_REMAP
Perform remapping to a completely blackened sprite.
Definition: base.hpp:22
PALETTE_ANIM_START
@ PALETTE_ANIM_START
Index in the _palettes array from which all animations are taking places (table/palettes....
Definition: gfx_type.h:282
Colour
Structure to access the alpha, red, green, and blue channels from a 32 bit number.
Definition: gfx_type.h:163
Colour::a
uint8 a
colour channels in LE order
Definition: gfx_type.h:171
Blitter::BlitterParams::left
int left
The left offset in the 'dst' in pixels to start drawing.
Definition: base.hpp:41
32bpp_sse_func.hpp
32bpp_anim_sse4.hpp
Blitter::BlitterParams
Parameters related to blitting.
Definition: base.hpp:31
Blitter::BlitterParams::height
int height
The height in pixels that needs to be drawn to dst.
Definition: base.hpp:38
Blitter::BlitterParams::skip_top
int skip_top
How much pixels of the source to skip on the top (based on zoom of dst)
Definition: base.hpp:36
Blitter::BlitterParams::remap
const byte * remap
XXX – Temporary storage for remap array.
Definition: base.hpp:33