Torque3D/Engine/source/platformWin32/winAsmBlit.cpp
marauder2k7 3aef90a6bc Update GFXTextureManager and GBitmap
GBitmap Changes:
Added all other formats to gbitmap that we support
gbitmap now supports cubemaps
added converters for all these other formats
added stb_image_resize for extrudemips so we can extrude mipmaps for all other formats

GFXTextureManager
Can now directly make cubemaps and texture arrays based on the GFXTextureProfile
API implementations for all functions that cubemaps and arrays needed
2025-12-22 10:29:01 +00:00

208 lines
6.4 KiB
C++

//-----------------------------------------------------------------------------
// Copyright (c) 2012 GarageGames, LLC
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to
// deal in the Software without restriction, including without limitation the
// rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
// sell copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
// IN THE SOFTWARE.
//-----------------------------------------------------------------------------
#include "math/mMath.h"
#include "gfx/bitmap/gBitmap.h"
#include "gfx/bitmap/bitmapUtils.h"
// The inline-assembly blocks in this file are introduced with the `asm`
// keyword.  When _MSC_VER is defined (and __MWERKS__ is not), spell that
// keyword as `_asm` instead.
#if !defined(__MWERKS__) && defined(_MSC_VER)
#define asm _asm
#endif
//--------------------------------------------------------------------------
void bitmapExtrude5551_asm(const void *srcMip, void *mip, U32 height, U32 width)
{
const U16 *src = (const U16 *) srcMip;
U16 *dst = (U16 *) mip;
U32 stride = width << 1;
for(U32 y = 0; y < height; y++)
{
for(U32 x = 0; x < width; x++)
{
U32 a = src[0];
U32 b = src[1];
U32 c = src[stride];
U32 d = src[stride+1];
dst[x] = ((((a >> 11) + (b >> 11) + (c >> 11) + (d >> 11)) >> 2) << 11) |
((( ((a >> 6) & 0x1f) + ((b >> 6) & 0x1f) + ((c >> 6) & 0x1f) + ((d >> 6) & 0x1F) ) >> 2) << 6) |
((( ((a >> 1) & 0x1F) + ((b >> 1) & 0x1F) + ((c >> 1) & 0x1f) + ((d >> 1) & 0x1f)) >> 2) << 1);
src += 2;
}
src += stride;
dst += width;
}
}
#if defined(TORQUE_SUPPORTS_VC_INLINE_X86_ASM)
//--------------------------------------------------------------------------
void bitmapExtrudeRGB_mmx(const void *srcMip, void *mip, U32 srcHeight, U32 srcWidth)
{
if (srcHeight == 1 || srcWidth == 1) {
bitmapExtrudeRGB_c(srcMip, mip, srcHeight, srcWidth);
return;
}
U32 width = srcWidth >> 1;
U32 height = srcHeight >> 1;
if (width <= 1)
{
bitmapExtrudeRGB_c(srcMip, mip, srcHeight, srcWidth);
return;
}
U64 ZERO = 0x0000000000000000;
const U8 *src = (const U8 *) srcMip;
U8 *dst = (U8 *) mip;
U32 srcStride = (width << 1) * 3;
U32 dstStride = width * 3;
for(U32 y = 0; y < height; y++)
{
asm
{
mov eax, src
mov ebx, eax
add ebx, srcStride
mov ecx, dst
mov edx, width
//--------------------------------------
row_loop:
punpcklbw mm0, [eax]
psrlw mm0, 8
punpcklbw mm1, [eax+3]
psrlw mm1, 8
paddw mm0, mm1
punpcklbw mm1, [ebx]
psrlw mm1, 8
paddw mm0, mm1
punpcklbw mm1, [ebx+3]
psrlw mm1, 8
paddw mm0, mm1
psrlw mm0, 2
//pxor mm1, mm1
packuswb mm0, ZERO // mm1
movd [ecx], mm0
add eax, 6
add ebx, 6
add ecx, 3
dec edx
jnz row_loop
}
src += srcStride + srcStride; // advance to next line
dst += dstStride;
}
asm
{
emms
}
}
//--------------------------------------------------------------------------
void bitmapConvertRGB_to_5551_mmx(U8 *src, U32 pixels)
{
   // Converts `pixels` packed 24-bit texels to 16-bit texels in place: the
   // 16-bit results are written over the start of the same buffer.
   //
   // For source bytes (b0, b1, b2) of a texel the result is
   //    ((b0 >> 3) << 11) | ((b1 >> 3) << 6) | ((b2 >> 3) << 1) | 1
   // The MMX loop converts two texels per iteration; the scalar tail produces
   // exactly the same bits.
   U64 MULFACT = 0x0008200000082000; // RGB quad word multiplier
   U64 REDBLUE = 0x00f800f800f800f8; // Red-Blue mask
   U64 GREEN   = 0x0000f8000000f800; // Green mask
   U64 ALPHA   = 0x0000000000010001; // 100% Alpha mask
   U64 ZERO    = 0x0000000000000000;

   U16 *dst = (U16*)src;

   // The MMX loop loads 4 bytes at [eax+3], i.e. one byte more than the two
   // texels it converts.  With an odd pixel count that byte belongs to the
   // trailing texel, but with an even count the final pair would read one
   // byte past the end of the buffer.  In that case the final pair is left
   // to the scalar tail instead.
   U32 mmxPairs   = pixels >> 1;     // pairs handled by the MMX loop
   U32 tailPixels = pixels & 1;      // texels handled by the scalar tail
   if (mmxPairs && !tailPixels)
   {
      mmxPairs--;
      tailPixels = 2;
   }

   if (mmxPairs)
   {
      asm
      {
         mov eax, src               // YES, src = dst at start
         mov ebx, dst               // convert image in place
         mov edx, mmxPairs

      pixel_loop2:
         movd mm0, [eax]            // get first 24-bit pixel
         movd mm1, [eax+3]          // get second 24-bit pixel
         punpckldq mm0, mm1         // put second in high dword
         movq mm1, mm0              // save the original data
         pand mm0, REDBLUE          // mask out all but the 5MSBits of red and blue
         pmaddwd mm0, MULFACT       // multiply each word by
                                    // 2**13, 2**3, 2**13, 2**3 and add results
         pand mm1, GREEN            // mask out all but the 5MSBits of green
         por mm0, mm1               // combine the red, green, and blue bits
         psrld mm0, 6               // shift into position
         packssdw mm0, ZERO         // pack into single dword
         pslld mm0, 1               // shift into final position
         por mm0, ALPHA             // add the alpha bit
         movd [ebx], mm0

         add eax, 6
         add ebx, 4
         dec edx
         jnz pixel_loop2

         mov src, eax               // hand the advanced cursors back to C++
         mov dst, ebx
         emms
      }
   }

   // Scalar tail: one texel for an odd count, two for an even count.  The
   // three source bytes are read before the 16-bit result is stored, and the
   // write cursor never runs ahead of the read cursor, so converting in place
   // is safe.
   for (U32 i = 0; i < tailPixels; i++)
   {
      U32 r = src[0] >> 3;
      U32 g = src[1] >> 3;
      U32 b = src[2] >> 3;
      *dst++ = (U16)((b << 1) | (g << 6) | (r << 11) | 1);
      src += 3;
   }
}
#endif
//--------------------------------------------------------------------------
void PlatformBlitInit()
{
   // Installs this file's bitmap routines into the global function pointers.

   // The 5551 extruder defined in this file is plain C++, so it is installed
   // unconditionally.
   bitmapExtrude5551 = bitmapExtrude5551_asm;
   //bitmapExtrudeRGB = bitmapExtrudeRGB_c;

   // The remaining overrides are MMX code; leave the current pointers alone
   // when the CPU does not report MMX.
   if (!(Platform::SystemInfo.processor.properties & CPU_PROP_MMX))
      return;

#if defined(TORQUE_SUPPORTS_VC_INLINE_X86_ASM)
   bitmapExtrudeRGB         = bitmapExtrudeRGB_mmx;
   bitmapConvertRGB_to_5551 = bitmapConvertRGB_to_5551_mmx;
#endif
}