// Copyright (C) 2002-2012 Nikolaus Gebhardt / Thomas Alten // This file is part of the "Irrlicht Engine". // For conditions of distribution and use, see copyright notice in irrlicht.h #pragma once #include "SoftwareDriver2_helper.h" //! f18 - fixpoint 14.18 limit to 16k Textures #define CBLIT_USE_FIXPOINT18 #if defined(CBLIT_USE_FIXPOINT18) typedef int f18; #define f18_one 262144 #define f18_zero 0 #define f32_to_f18(x) ((f18)floorf(((x) * 262144.f) + 0.f)) #define f32_to_f32(x) (x) #define f18_floor(x) ((x) >> 18) #define f18_round(x) ((x + 131.072) >> 18) #else typedef float f18; #define f18_one 1.f #define f18_zero_dot_five 0.5f #define f18_zero 0.f #define f32_to_f18(x) (x) #define f32_to_f32(x) (x) #define f18_floor(x) ((int)(x)) #define f18_round(x) ((int)(x + 0.5f)) #endif struct SBlitJob { AbsRectangle Dest; AbsRectangle Source; u32 argb; const void *src; void *dst; u32 width; // draw size u32 height; u32 srcPixelMul; // pixel byte size u32 dstPixelMul; int srcPitch; // scanline byte size. allow negative for mirror u32 dstPitch; bool stretch; f32 x_stretch; f32 y_stretch; }; /* return alpha in [0;256] Granularity from 32-Bit ARGB add highbit alpha ( alpha > 127 ? + 1 ) */ static inline u32 extractAlpha(const u32 c) { return (c >> 24) + (c >> 31); } /*! Scale Color by (1/value) value 0 - 256 ( alpha ) */ inline u32 PixelLerp32(const u32 source, const u32 value) { u32 srcRB = source & 0x00FF00FF; u32 srcXG = (source & 0xFF00FF00) >> 8; srcRB *= value; srcXG *= value; srcRB >>= 8; // srcXG >>= 8; srcXG &= 0xFF00FF00; srcRB &= 0x00FF00FF; return srcRB | srcXG; } /*! */ static void executeBlit_TextureCopy_x_to_x(const SBlitJob *job) { if (job->stretch) { const f18 wscale = f32_to_f18(job->x_stretch); const f18 hscale = f32_to_f18(job->y_stretch); f18 src_y = f18_zero; if (job->srcPixelMul == 4) { const u32 *src = (u32 *)(job->src); u32 *dst = (u32 *)(job->dst); for (u32 dy = 0; dy < job->height; ++dy, src_y += hscale) { src = (u32 *)((u8 *)(job->src) + job->srcPitch * f18_floor(src_y)); f18 src_x = f18_zero; for (u32 dx = 0; dx < job->width; ++dx, src_x += wscale) { dst[dx] = src[f18_floor(src_x)]; } dst = (u32 *)((u8 *)(dst) + job->dstPitch); } } else if (job->srcPixelMul == 2) { const u16 *src = (u16 *)(job->src); u16 *dst = (u16 *)(job->dst); for (u32 dy = 0; dy < job->height; ++dy, src_y += hscale) { src = (u16 *)((u8 *)(job->src) + job->srcPitch * f18_floor(src_y)); f18 src_x = f18_zero; for (u32 dx = 0; dx < job->width; ++dx, src_x += wscale) { dst[dx] = src[f18_floor(src_x)]; } dst = (u16 *)((u8 *)(dst) + job->dstPitch); } } } else { const size_t widthPitch = job->width * job->dstPixelMul; const void *src = (void *)job->src; void *dst = (void *)job->dst; for (u32 dy = 0; dy < job->height; ++dy) { memcpy(dst, src, widthPitch); src = (void *)((u8 *)(src) + job->srcPitch); dst = (void *)((u8 *)(dst) + job->dstPitch); } } } /*! */ static void executeBlit_TextureCopy_32_to_16(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u32 *src = static_cast(job->src); u16 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (u32 *)((u8 *)(job->src) + job->srcPitch * src_y); for (u32 dx = 0; dx < w; ++dx) { const u32 src_x = (u32)(dx * wscale); // 16 bit Blitter depends on pre-multiplied color const u32 s = PixelLerp32(src[src_x] | 0xFF000000, extractAlpha(src[src_x])); dst[dx] = video::A8R8G8B8toA1R5G5B5(s); } dst = (u16 *)((u8 *)(dst) + job->dstPitch); } } else { for (u32 dy = 0; dy != h; ++dy) { for (u32 dx = 0; dx != w; ++dx) { // 16 bit Blitter depends on pre-multiplied color const u32 s = PixelLerp32(src[dx] | 0xFF000000, extractAlpha(src[dx])); dst[dx] = video::A8R8G8B8toA1R5G5B5(s); } src = (u32 *)((u8 *)(src) + job->srcPitch); dst = (u16 *)((u8 *)(dst) + job->dstPitch); } } } /*! */ static void executeBlit_TextureCopy_24_to_16(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u8 *src = static_cast(job->src); u16 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch * 3.f; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (u8 *)(job->src) + job->srcPitch * src_y; for (u32 dx = 0; dx < w; ++dx) { const u8 *src_x = src + (u32)(dx * wscale); dst[dx] = video::RGBA16(src_x[0], src_x[1], src_x[2]); } dst = (u16 *)((u8 *)(dst) + job->dstPitch); } } else { for (u32 dy = 0; dy != h; ++dy) { const u8 *s = src; for (u32 dx = 0; dx != w; ++dx) { dst[dx] = video::RGBA16(s[0], s[1], s[2]); s += 3; } src = src + job->srcPitch; dst = (u16 *)((u8 *)(dst) + job->dstPitch); } } } /*! */ static void executeBlit_TextureCopy_16_to_32(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u16 *src = static_cast(job->src); u32 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (u16 *)((u8 *)(job->src) + job->srcPitch * src_y); for (u32 dx = 0; dx < w; ++dx) { const u32 src_x = (u32)(dx * wscale); dst[dx] = video::A1R5G5B5toA8R8G8B8(src[src_x]); } dst = (u32 *)((u8 *)(dst) + job->dstPitch); } } else { for (u32 dy = 0; dy != h; ++dy) { for (u32 dx = 0; dx != w; ++dx) { dst[dx] = video::A1R5G5B5toA8R8G8B8(src[dx]); } src = (u16 *)((u8 *)(src) + job->srcPitch); dst = (u32 *)((u8 *)(dst) + job->dstPitch); } } } static void executeBlit_TextureCopy_16_to_24(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u16 *src = static_cast(job->src); u8 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (u16 *)((u8 *)(job->src) + job->srcPitch * src_y); for (u32 dx = 0; dx < w; ++dx) { const u32 src_x = (u32)(dx * wscale); u32 color = video::A1R5G5B5toA8R8G8B8(src[src_x]); u8 *writeTo = &dst[dx * 3]; *writeTo++ = (color >> 16) & 0xFF; *writeTo++ = (color >> 8) & 0xFF; *writeTo++ = color & 0xFF; } dst += job->dstPitch; } } else { for (u32 dy = 0; dy != h; ++dy) { for (u32 dx = 0; dx != w; ++dx) { u32 color = video::A1R5G5B5toA8R8G8B8(src[dx]); u8 *writeTo = &dst[dx * 3]; *writeTo++ = (color >> 16) & 0xFF; *writeTo++ = (color >> 8) & 0xFF; *writeTo++ = color & 0xFF; } src = (u16 *)((u8 *)(src) + job->srcPitch); dst += job->dstPitch; } } } /*! */ static void executeBlit_TextureCopy_24_to_32(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u8 *src = static_cast(job->src); u32 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch * 3.f; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (const u8 *)job->src + (job->srcPitch * src_y); for (u32 dx = 0; dx < w; ++dx) { const u8 *s = src + (u32)(dx * wscale); dst[dx] = 0xFF000000 | s[0] << 16 | s[1] << 8 | s[2]; } dst = (u32 *)((u8 *)(dst) + job->dstPitch); } } else { for (u32 dy = 0; dy < job->height; ++dy) { const u8 *s = src; for (u32 dx = 0; dx < job->width; ++dx) { dst[dx] = 0xFF000000 | s[0] << 16 | s[1] << 8 | s[2]; s += 3; } src = src + job->srcPitch; dst = (u32 *)((u8 *)(dst) + job->dstPitch); } } } static void executeBlit_TextureCopy_32_to_24(const SBlitJob *job) { const u32 w = job->width; const u32 h = job->height; const u32 *src = static_cast(job->src); u8 *dst = static_cast(job->dst); if (job->stretch) { const float wscale = job->x_stretch; const float hscale = job->y_stretch; for (u32 dy = 0; dy < h; ++dy) { const u32 src_y = (u32)(dy * hscale); src = (u32 *)((u8 *)(job->src) + job->srcPitch * src_y); for (u32 dx = 0; dx < w; ++dx) { const u32 src_x = src[(u32)(dx * wscale)]; u8 *writeTo = &dst[dx * 3]; *writeTo++ = (src_x >> 16) & 0xFF; *writeTo++ = (src_x >> 8) & 0xFF; *writeTo++ = src_x & 0xFF; } dst += job->dstPitch; } } else { for (u32 dy = 0; dy != h; ++dy) { for (u32 dx = 0; dx != w; ++dx) { u8 *writeTo = &dst[dx * 3]; *writeTo++ = (src[dx] >> 16) & 0xFF; *writeTo++ = (src[dx] >> 8) & 0xFF; *writeTo++ = src[dx] & 0xFF; } src = (u32 *)((u8 *)(src) + job->srcPitch); dst += job->dstPitch; } } } // Blitter Operation enum eBlitter { BLITTER_INVALID = 0, BLITTER_TEXTURE, }; typedef void (*tExecuteBlit)(const SBlitJob *job); /*! */ struct blitterTable { eBlitter operation; s32 destFormat; s32 sourceFormat; tExecuteBlit func; }; static const blitterTable blitTable[] = { {BLITTER_TEXTURE, -2, -2, executeBlit_TextureCopy_x_to_x}, {BLITTER_TEXTURE, video::ECF_A1R5G5B5, video::ECF_A8R8G8B8, executeBlit_TextureCopy_32_to_16}, {BLITTER_TEXTURE, video::ECF_A1R5G5B5, video::ECF_R8G8B8, executeBlit_TextureCopy_24_to_16}, {BLITTER_TEXTURE, video::ECF_A8R8G8B8, video::ECF_A1R5G5B5, executeBlit_TextureCopy_16_to_32}, {BLITTER_TEXTURE, video::ECF_A8R8G8B8, video::ECF_R8G8B8, executeBlit_TextureCopy_24_to_32}, {BLITTER_TEXTURE, video::ECF_R8G8B8, video::ECF_A1R5G5B5, executeBlit_TextureCopy_16_to_24}, {BLITTER_TEXTURE, video::ECF_R8G8B8, video::ECF_A8R8G8B8, executeBlit_TextureCopy_32_to_24}, {BLITTER_INVALID, -1, -1, 0}, }; static inline tExecuteBlit getBlitter2(eBlitter operation, const video::IImage *dest, const video::IImage *source) { video::ECOLOR_FORMAT sourceFormat = (video::ECOLOR_FORMAT)(source ? source->getColorFormat() : -1); video::ECOLOR_FORMAT destFormat = (video::ECOLOR_FORMAT)(dest ? dest->getColorFormat() : -1); const blitterTable *b = blitTable; while (b->operation != BLITTER_INVALID) { if (b->operation == operation) { if ((b->destFormat == -1 || b->destFormat == destFormat) && (b->sourceFormat == -1 || b->sourceFormat == sourceFormat)) return b->func; else if (b->destFormat == -2 && (sourceFormat == destFormat)) return b->func; } b += 1; } return 0; } // bounce clipping to texture inline void setClip(AbsRectangle &out, const core::rect *clip, const video::IImage *tex, s32 passnative, const core::dimension2d *tex_org) { if (0 == tex) { if (clip && passnative) { out.x0 = clip->UpperLeftCorner.X; out.x1 = clip->LowerRightCorner.X; out.y0 = clip->UpperLeftCorner.Y; out.y1 = clip->LowerRightCorner.Y; } else { out.x0 = 0; out.x1 = 0; out.y0 = 0; out.y1 = 0; } return; } const s32 w = tex->getDimension().Width; const s32 h = tex->getDimension().Height; // driver could have changed texture size. if (clip && tex_org && ((u32)w != tex_org->Width || (u32)h != tex_org->Height)) { out.x0 = core::s32_clamp((clip->UpperLeftCorner.X * w) / tex_org->Width, 0, w - 1); out.x1 = core::s32_clamp((clip->LowerRightCorner.X * w) / tex_org->Width, out.x0, w); out.y0 = core::s32_clamp((clip->UpperLeftCorner.Y * h) / tex_org->Height, 0, h - 1); out.y1 = core::s32_clamp((clip->LowerRightCorner.Y * h) / tex_org->Height, out.y0, h); } else if (clip) { // y-1 to prevent starting on illegal memory (not ideal!). out.x0 = core::s32_clamp(clip->UpperLeftCorner.X, 0, w - 1); out.x1 = core::s32_clamp(clip->LowerRightCorner.X, passnative ? 0 : out.x0, w); out.y0 = core::s32_clamp(clip->UpperLeftCorner.Y, 0, h - 1); out.y1 = core::s32_clamp(clip->LowerRightCorner.Y, passnative ? 0 : out.y0, h); } else { out.x0 = 0; out.y0 = 0; out.x1 = w; out.y1 = h; } } /*! a generic 2D Blitter */ static s32 Blit(eBlitter operation, video::IImage *dest, const core::rect *destClipping, const core::position2d *destPos, video::IImage *const source, const core::rect *sourceClipping, u32 argb) { tExecuteBlit blitter = getBlitter2(operation, dest, source); if (0 == blitter) { return 0; } // Clipping AbsRectangle sourceClip; AbsRectangle destClip; AbsRectangle v; SBlitJob job; setClip(sourceClip, sourceClipping, source, 1, 0); setClip(destClip, destClipping, dest, 0, 0); v.x0 = destPos ? destPos->X : 0; v.y0 = destPos ? destPos->Y : 0; v.x1 = v.x0 + (sourceClip.x1 - sourceClip.x0); v.y1 = v.y0 + (sourceClip.y1 - sourceClip.y0); if (!intersect(job.Dest, destClip, v)) return 0; job.width = job.Dest.x1 - job.Dest.x0; job.height = job.Dest.y1 - job.Dest.y0; job.Source.x0 = sourceClip.x0 + (job.Dest.x0 - v.x0); job.Source.x1 = job.Source.x0 + job.width; job.Source.y0 = sourceClip.y0 + (job.Dest.y0 - v.y0); job.Source.y1 = job.Source.y0 + job.height; job.argb = argb; job.stretch = false; job.x_stretch = 1.f; job.y_stretch = 1.f; if (source) { job.srcPitch = source->getPitch(); job.srcPixelMul = source->getBytesPerPixel(); job.src = (void *)((u8 *)source->getData() + (job.Source.y0 * job.srcPitch) + (job.Source.x0 * job.srcPixelMul)); } else { // use srcPitch for color operation on dest job.srcPitch = job.width * dest->getBytesPerPixel(); } job.dstPitch = dest->getPitch(); job.dstPixelMul = dest->getBytesPerPixel(); job.dst = (void *)((u8 *)dest->getData() + (job.Dest.y0 * job.dstPitch) + (job.Dest.x0 * job.dstPixelMul)); blitter(&job); return 1; }