rubidium@9723: /* $Id$ */ rubidium@9723: rubidium@10455: /** @file 32bpp_optimized.cpp Implementation of the optimized 32 bpp blitter. */ rubidium@10455: rubidium@9703: #include "../stdafx.h" rubidium@9723: #include "../zoom_func.h" rubidium@9723: #include "../gfx_func.h" rubidium@9703: #include "../debug.h" rubidium@11126: #include "../core/math_func.hpp" rubidium@11126: #include "../core/alloc_func.hpp" rubidium@9703: #include "32bpp_optimized.hpp" rubidium@9703: rubidium@9703: static FBlitter_32bppOptimized iFBlitter_32bppOptimized; rubidium@9703: rubidium@11126: /** rubidium@11126: * Draws a sprite to a (screen) buffer. It is templated to allow faster operation. rubidium@11126: * rubidium@11126: * @param mode blitter mode rubidium@11126: * @param bp further blitting parameters rubidium@11126: * @param zoom zoom level at which we are drawing rubidium@11126: */ rubidium@11126: template rubidium@11126: inline void Blitter_32bppOptimized::Draw(const Blitter::BlitterParams *bp, ZoomLevel zoom) rubidium@9703: { rubidium@11126: const SpriteData *src = (const SpriteData *)bp->sprite; rubidium@9703: rubidium@11126: /* src_px : each line begins with uint32 n = 'number of bytes in this line', rubidium@11126: * then n times is the Colour struct for this line */ rubidium@11126: const Colour *src_px = (const Colour *)(src->data + src->offset[zoom][0]); rubidium@11126: /* src_n : each line begins with uint32 n = 'number of bytes in this line', rubidium@11126: * then interleaved stream of 'm' and 'n' channels. 'm' is remap, rubidium@11126: * 'n' is number of bytes with the same alpha channel class */ rubidium@11126: const uint8 *src_n = (const uint8 *)(src->data + src->offset[zoom][1]); rubidium@11126: rubidium@11126: /* skip upper lines in src_px and src_n */ rubidium@11126: for (uint i = bp->skip_top; i != 0; i--) { rubidium@11126: src_px = (const Colour *)((const byte *)src_px + *(const uint32 *)src_px); rubidium@11126: src_n += *(uint32 *)src_n; rubidium@11126: } rubidium@11126: rubidium@11126: /* skip lines in dst */ rubidium@11126: uint32 *dst = (uint32 *)bp->dst + bp->top * bp->pitch + bp->left; rubidium@11126: rubidium@11126: /* store so we don't have to access it via bp everytime (compiler assumes pointer aliasing) */ rubidium@11126: const byte *remap = bp->remap; rubidium@9703: rubidium@9703: for (int y = 0; y < bp->height; y++) { rubidium@11126: /* next dst line begins here */ rubidium@11126: uint32 *dst_ln = dst + bp->pitch; rubidium@9703: rubidium@11126: /* next src line begins here */ rubidium@11126: const Colour *src_px_ln = (const Colour *)((const byte *)src_px + *(const uint32 *)src_px); rubidium@11126: src_px++; rubidium@9703: rubidium@11126: /* next src_n line begins here */ rubidium@11126: const uint8 *src_n_ln = src_n + *(uint32 *)src_n; rubidium@11126: src_n += 4; rubidium@11126: rubidium@11126: /* we will end this line when we reach this point */ rubidium@11126: uint32 *dst_end = dst + bp->skip_left; rubidium@11126: rubidium@11126: /* number of pixels with the same aplha channel class */ rubidium@11126: uint n; rubidium@11126: rubidium@11126: while (dst < dst_end) { rubidium@11126: n = *src_n++; rubidium@11126: rubidium@11126: if (src_px->a == 0) { rubidium@11126: dst += n; rubidium@11126: src_px ++; rubidium@11126: src_n++; rubidium@11126: } else { rubidium@11126: if (dst + n > dst_end) { rubidium@11126: uint d = dst_end - dst; rubidium@11126: src_px += d; rubidium@11126: src_n += d; rubidium@11126: rubidium@11126: dst = dst_end - bp->skip_left; rubidium@11126: dst_end = dst + bp->width; rubidium@11126: rubidium@11126: n = min(n - d, (uint)bp->width); rubidium@11126: goto draw; rubidium@11126: } rubidium@11126: dst += n; rubidium@11126: src_px += n; rubidium@11126: src_n += n; rubidium@11126: } rubidium@11126: } rubidium@11126: rubidium@11126: dst -= bp->skip_left; rubidium@11126: dst_end -= bp->skip_left; rubidium@11126: rubidium@11126: dst_end += bp->width; rubidium@11126: rubidium@11126: while (dst < dst_end) { rubidium@11126: n = min(*src_n++, (uint)(dst_end - dst)); rubidium@11126: rubidium@11126: if (src_px->a == 0) { rubidium@11126: dst += n; rubidium@11126: src_px++; rubidium@11126: src_n++; rubidium@9703: continue; rubidium@9703: } rubidium@9703: rubidium@11126: draw:; rubidium@11126: rubidium@9703: switch (mode) { rubidium@9703: case BM_COLOUR_REMAP: rubidium@11126: if (src_px->a == 255) { rubidium@11126: do { rubidium@11126: uint m = *src_n; rubidium@11126: /* In case the m-channel is zero, do not remap this pixel in any way */ rubidium@11126: if (m == 0) { rubidium@11126: *dst = *src_px; rubidium@11126: } else { rubidium@11126: uint r = remap[m]; rubidium@11126: if (r != 0) *dst = this->LookupColourInPalette(r); rubidium@11126: } rubidium@11126: dst++; rubidium@11126: src_px++; rubidium@11126: src_n++; rubidium@11126: } while (--n != 0); rubidium@9703: } else { rubidium@11126: do { rubidium@11126: uint m = *src_n; rubidium@11126: if (m == 0) { rubidium@11126: *dst = ComposeColourRGBANoCheck(src_px->r, src_px->g, src_px->b, src_px->a, *dst); rubidium@11126: } else { rubidium@11126: uint r = remap[m]; rubidium@11126: if (r != 0) *dst = ComposeColourPANoCheck(this->LookupColourInPalette(r), src_px->a, *dst); rubidium@11126: } rubidium@11126: dst++; rubidium@11126: src_px++; rubidium@11126: src_n++; rubidium@11126: } while (--n != 0); rubidium@9703: } rubidium@9703: break; rubidium@9703: rubidium@9703: case BM_TRANSPARENT: rubidium@9703: /* TODO -- We make an assumption here that the remap in fact is transparency, not some color. rubidium@9703: * This is never a problem with the code we produce, but newgrfs can make it fail... or at least: rubidium@9703: * we produce a result the newgrf maker didn't expect ;) */ rubidium@9703: rubidium@9703: /* Make the current color a bit more black, so it looks like this image is transparent */ rubidium@11126: src_n += n; rubidium@11126: if (src_px->a == 255) { rubidium@11126: src_px += n; rubidium@11126: do { rubidium@11126: *dst = MakeTransparent(*dst, 3, 4); rubidium@11126: dst++; rubidium@11126: } while (--n != 0); rubidium@11126: } else { rubidium@11126: do { rubidium@11126: *dst = MakeTransparent(*dst, (256 * 4 - src_px->a), 256 * 4); rubidium@11126: dst++; rubidium@11126: src_px++; rubidium@11126: } while (--n != 0); rubidium@11126: } rubidium@9703: break; rubidium@9703: rubidium@9703: default: rubidium@11126: if (src_px->a == 255) { rubidium@11126: /* faster than memcpy(), n is usually low */ rubidium@11126: src_n += n; rubidium@11126: do { rubidium@11126: *dst++ = *src_px++; rubidium@11126: } while (--n != 0); rubidium@11126: } else { rubidium@11126: src_n += n; rubidium@11126: do { rubidium@11126: *dst = ComposeColourRGBANoCheck(src_px->r, src_px->g, src_px->b, src_px->a, *dst); rubidium@11126: dst++; rubidium@11126: src_px++; rubidium@11126: } while (--n != 0); rubidium@11126: } rubidium@9703: break; rubidium@9703: } rubidium@9703: } rubidium@11126: rubidium@11126: dst = dst_ln; rubidium@11126: src_px = src_px_ln; rubidium@11126: src_n = src_n_ln; rubidium@9703: } rubidium@9703: } rubidium@9703: rubidium@11126: /** rubidium@11126: * Draws a sprite to a (screen) buffer. Calls adequate templated function. rubidium@11126: * rubidium@11126: * @param bp further blitting parameters rubidium@11126: * @param mode blitter mode rubidium@11126: * @param zoom zoom level at which we are drawing rubidium@11126: */ glx@10920: void Blitter_32bppOptimized::Draw(Blitter::BlitterParams *bp, BlitterMode mode, ZoomLevel zoom) glx@10920: { glx@10920: switch (mode) { glx@10920: default: NOT_REACHED(); glx@10920: case BM_NORMAL: Draw (bp, zoom); return; glx@10920: case BM_COLOUR_REMAP: Draw(bp, zoom); return; glx@10920: case BM_TRANSPARENT: Draw (bp, zoom); return; glx@10920: } glx@10920: } glx@10920: rubidium@11126: /** rubidium@11126: * Resizes the sprite in a very simple way, takes every n-th pixel and every n-th row rubidium@11126: * rubidium@11126: * @param sprite_src sprite to resize rubidium@11126: * @param zoom resizing scale rubidium@11126: * @return resized sprite rubidium@11126: */ rubidium@11126: static const SpriteLoader::Sprite *ResizeSprite(const SpriteLoader::Sprite *sprite_src, ZoomLevel zoom) rubidium@11126: { rubidium@11126: SpriteLoader::Sprite *sprite = MallocT(1); rubidium@11126: rubidium@11126: if (zoom == ZOOM_LVL_NORMAL) { rubidium@11126: memcpy(sprite, sprite_src, sizeof(*sprite)); rubidium@11126: uint size = sprite_src->height * sprite_src->width; rubidium@11126: sprite->data = MallocT(size); rubidium@11126: memcpy(sprite->data, sprite_src->data, size * sizeof(SpriteLoader::CommonPixel)); rubidium@11126: return sprite; rubidium@11126: } rubidium@11126: rubidium@11126: sprite->height = UnScaleByZoom(sprite_src->height, zoom); rubidium@11126: sprite->width = UnScaleByZoom(sprite_src->width, zoom); rubidium@11126: sprite->x_offs = UnScaleByZoom(sprite_src->x_offs, zoom); rubidium@11126: sprite->y_offs = UnScaleByZoom(sprite_src->y_offs, zoom); rubidium@11126: rubidium@11126: uint size = sprite->height * sprite->width; rubidium@11126: SpriteLoader::CommonPixel *dst = sprite->data = CallocT(size); rubidium@11126: rubidium@11126: const SpriteLoader::CommonPixel *src = (SpriteLoader::CommonPixel *)sprite_src->data; rubidium@11126: const SpriteLoader::CommonPixel *src_end = src + sprite_src->height * sprite_src->width; rubidium@11126: rubidium@11126: uint scaled_1 = ScaleByZoom(1, zoom); rubidium@11126: rubidium@11126: for (uint y = 0; y < sprite->height; y++) { rubidium@11126: if (src >= src_end) src = src_end - sprite_src->width; rubidium@11126: rubidium@11126: const SpriteLoader::CommonPixel *src_ln = src + sprite_src->width * scaled_1; rubidium@11126: for (uint x = 0; x < sprite->width; x++) { rubidium@11126: if (src >= src_ln) src = src_ln - 1; rubidium@11126: *dst = *src; rubidium@11126: dst++; rubidium@11126: src += scaled_1; rubidium@11126: } rubidium@11126: rubidium@11126: src = src_ln; rubidium@11126: } rubidium@11126: rubidium@11126: return sprite; rubidium@11126: } rubidium@11126: rubidium@9703: Sprite *Blitter_32bppOptimized::Encode(SpriteLoader::Sprite *sprite, Blitter::AllocatorProc *allocator) rubidium@9703: { rubidium@11126: /* streams of pixels (a, r, g, b channels) rubidium@11126: * rubidium@11126: * stored in separated stream so data are always aligned on 4B boundary */ rubidium@11126: Colour *dst_px_orig[ZOOM_LVL_COUNT]; rubidium@11126: rubidium@11126: /* interleaved stream of 'm' channel and 'n' channel rubidium@11126: * 'n' is number if following pixels with the same alpha channel class rubidium@11126: * there are 3 classes: 0, 255, others rubidium@11126: * rubidium@11126: * it has to be stored in one stream so fewer registers are used - rubidium@11126: * x86 has problems with register allocation even with this solution */ rubidium@11126: uint8 *dst_n_orig[ZOOM_LVL_COUNT]; rubidium@11126: rubidium@11126: /* lengths of streams */ rubidium@11126: uint32 lengths[ZOOM_LVL_COUNT][2]; rubidium@11126: rubidium@11126: for (ZoomLevel z = ZOOM_LVL_BEGIN; z < ZOOM_LVL_END; z++) { rubidium@11126: const SpriteLoader::Sprite *src_orig = ResizeSprite(sprite, z); rubidium@11126: rubidium@11126: uint size = src_orig->height * src_orig->width; rubidium@11126: rubidium@11126: dst_px_orig[z] = CallocT(size + src_orig->height * 2); rubidium@11126: dst_n_orig[z] = CallocT(size * 2 + src_orig->height * 4 * 2); rubidium@11126: rubidium@11126: uint32 *dst_px_ln = (uint32 *)dst_px_orig[z]; rubidium@11126: uint32 *dst_n_ln = (uint32 *)dst_n_orig[z]; rubidium@11126: rubidium@11126: const SpriteLoader::CommonPixel *src = (const SpriteLoader::CommonPixel *)src_orig->data; rubidium@11126: rubidium@11126: for (uint y = src_orig->height; y > 0; y--) { rubidium@11126: Colour *dst_px = (Colour *)(dst_px_ln + 1); rubidium@11126: uint8 *dst_n = (uint8 *)(dst_n_ln + 1); rubidium@11126: rubidium@11126: uint8 *dst_len = dst_n++; rubidium@11126: rubidium@11126: uint last = 3; rubidium@11126: int len = 0; rubidium@11126: rubidium@11126: for (uint x = src_orig->width; x > 0; x--) { rubidium@11126: uint8 a = src->a; rubidium@11126: uint t = a > 0 && a < 255 ? 1 : a; rubidium@11126: rubidium@11126: if (last != t || len == 255) { rubidium@11126: if (last != 3) { rubidium@11126: *dst_len = len; rubidium@11126: dst_len = dst_n++; rubidium@11126: } rubidium@11126: len = 0; rubidium@11126: } rubidium@11126: rubidium@11126: last = t; rubidium@11126: len++; rubidium@11126: rubidium@11126: if (a != 0) { rubidium@11126: dst_px->a = a; rubidium@11126: *dst_n = src->m; rubidium@11126: if (src->m != 0) { rubidium@11126: /* Pre-convert the mapping channel to a RGB value */ rubidium@11126: uint32 colour = this->LookupColourInPalette(src->m); rubidium@11126: dst_px->r = GB(colour, 16, 8); rubidium@11126: dst_px->g = GB(colour, 8, 8); rubidium@11126: dst_px->b = GB(colour, 0, 8); rubidium@11126: } else { rubidium@11126: dst_px->r = src->r; rubidium@11126: dst_px->g = src->g; rubidium@11126: dst_px->b = src->b; rubidium@11126: } rubidium@11126: dst_px++; rubidium@11126: dst_n++; rubidium@11126: } else if (len == 1) { rubidium@11126: dst_px++; rubidium@11126: *dst_n = src->m; rubidium@11126: dst_n++; rubidium@11126: } rubidium@11126: rubidium@11126: src++; rubidium@11126: } rubidium@11126: rubidium@11126: if (last != 3) { rubidium@11126: *dst_len = len; rubidium@11126: } rubidium@11126: rubidium@11126: dst_px = (Colour *)AlignPtr(dst_px, 4); rubidium@11126: dst_n = (uint8 *)AlignPtr(dst_n, 4); rubidium@11126: rubidium@11126: *dst_px_ln = (uint8 *)dst_px - (uint8 *)dst_px_ln; rubidium@11126: *dst_n_ln = (uint8 *)dst_n - (uint8 *)dst_n_ln; rubidium@11126: rubidium@11126: dst_px_ln = (uint32 *)dst_px; rubidium@11126: dst_n_ln = (uint32 *)dst_n; rubidium@11126: } rubidium@11126: rubidium@11126: lengths[z][0] = (byte *)dst_px_ln - (byte *)dst_px_orig[z]; // all are aligned to 4B boundary rubidium@11126: lengths[z][1] = (byte *)dst_n_ln - (byte *)dst_n_orig[z]; rubidium@11126: rubidium@11126: free(src_orig->data); rubidium@11126: free((void *)src_orig); rubidium@11126: } rubidium@11126: rubidium@11126: uint len = 0; // total length of data rubidium@11126: for (ZoomLevel z = ZOOM_LVL_BEGIN; z < ZOOM_LVL_END; z++) { rubidium@11126: len += lengths[z][0] + lengths[z][1]; rubidium@11126: } rubidium@11126: rubidium@11126: Sprite *dest_sprite = (Sprite *)allocator(sizeof(*dest_sprite) + sizeof(SpriteData) + len); rubidium@9703: rubidium@9703: dest_sprite->height = sprite->height; rubidium@9703: dest_sprite->width = sprite->width; rubidium@9703: dest_sprite->x_offs = sprite->x_offs; rubidium@9703: dest_sprite->y_offs = sprite->y_offs; rubidium@9703: rubidium@11126: SpriteData *dst = (SpriteData *)dest_sprite->data; rubidium@9703: rubidium@11126: for (ZoomLevel z = ZOOM_LVL_BEGIN; z < ZOOM_LVL_END; z++) { rubidium@11126: dst->offset[z][0] = z == ZOOM_LVL_BEGIN ? 0 : lengths[z - 1][1] + dst->offset[z - 1][1]; rubidium@11126: dst->offset[z][1] = lengths[z][0] + dst->offset[z][0]; rubidium@11126: rubidium@11126: memcpy(dst->data + dst->offset[z][0], dst_px_orig[z], lengths[z][0]); rubidium@11126: memcpy(dst->data + dst->offset[z][1], dst_n_orig[z], lengths[z][1]); rubidium@11126: rubidium@11126: free(dst_px_orig[z]); rubidium@11126: free(dst_n_orig[z]); rubidium@9703: } rubidium@11126: rubidium@9703: return dest_sprite; rubidium@9703: }