Serious-Engine/Sources/Engine/Graphics/Color.cpp
Ryan C. Gordon 9820436fbe First pass at cleaning out 64-bit issues.
Touches a lot of code to remove long constants like "1L", so this patch is
large and ugly, but I think it makes all those Clamp() calls look nicer in
the long run.

Most of the game is 64-bit clean, since we can build without assembly code
now. I've marked the things that are obviously still wrong with STUBBED lines.

That being said: a 64-bit build can already run the demos mostly correctly,
so we're actually almost there!

There are a few obvious things that are obviously wrong, to be fixed.
2016-04-06 23:20:29 -04:00

695 lines
19 KiB
C++

/* Copyright (c) 2002-2012 Croteam Ltd.
This program is free software; you can redistribute it and/or modify
it under the terms of version 2 of the GNU General Public License as published by
the Free Software Foundation
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License along
with this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */
#include "Engine/StdH.h"
#include <Engine/Graphics/Color.h>
#include <Engine/Math/Functions.h>
// asm shortcuts
#define O offset
#define Q qword ptr
#define D dword ptr
#define W word ptr
#define B byte ptr
extern const UBYTE *pubClipByte;
// convert HSV components to CroTeam COLOR format
COLOR HSVToColor( UBYTE const ubH, UBYTE const ubS, UBYTE const ubV)
{
if( ubS>1) {
SLONG xH = (SLONG)ubH *1536; // ->FIXINT/(256/6)
INDEX iHlo = xH & 0xFFFF;
SLONG slP = ((SLONG)ubV * (256- (SLONG)ubS)) >>8;
SLONG slQ = ((SLONG)ubV * (256-(((SLONG)ubS*iHlo)>>16))) >>8;
SLONG slT = ((SLONG)ubV * (256-(((SLONG)ubS*(65536-iHlo))>>16))) >>8;
switch( xH>>16) {
case 0: return RGBToColor(ubV,slT,slP);
case 1: return RGBToColor(slQ,ubV,slP);
case 2: return RGBToColor(slP,ubV,slT);
case 3: return RGBToColor(slP,slQ,ubV);
case 4: return RGBToColor(slT,slP,ubV);
case 5: return RGBToColor(ubV,slP,slQ);
default: ASSERTALWAYS("WHAT\?\?\?"); return C_BLACK;
}
} else return RGBToColor(ubV,ubV,ubV);
}
// convert CroTeam COLOR format to HSV components
void ColorToHSV( COLOR const colSrc, UBYTE &ubH, UBYTE &ubS, UBYTE &ubV)
{
UBYTE ubR, ubG, ubB;
ColorToRGB( colSrc, ubR,ubG,ubB);
ubH = 0;
ubS = 0;
ubV = Max( Max(ubR,ubG),ubB);
if( ubV>1) {
SLONG slD = ubV - Min( Min(ubR,ubG),ubB);
if( slD<1) return;
ubS = (slD*255) /ubV;
if( ubR==ubV) ubH = 0+ (((SLONG)ubG-ubB)*85) / (slD*2);
else if( ubG==ubV) ubH = 85+ (((SLONG)ubB-ubR)*85) / (slD*2);
else ubH = 170+ (((SLONG)ubR-ubG)*85) / (slD*2);
}
}
// color checking routines
#define GRAY_TRESHOLD 4
#define WHITE_TRESHOLD (255-GRAY_TRESHOLD)
BOOL IsGray( COLOR const col)
{
UBYTE ubR,ubG,ubB;
ColorToRGB( col, ubR,ubG,ubB);
INDEX iMaxDelta = Max( Max(ubR,ubG),ubB) - Min( Min(ubR,ubG),ubB);
if( iMaxDelta<GRAY_TRESHOLD) return TRUE;
return FALSE;
}
BOOL IsBlack( COLOR const col)
{
UBYTE ubR,ubG,ubB;
ColorToRGB( col, ubR,ubG,ubB);
if( ubR<GRAY_TRESHOLD && ubG<GRAY_TRESHOLD && ubB<GRAY_TRESHOLD) return TRUE;
return FALSE;
}
BOOL IsWhite( COLOR const col)
{
UBYTE ubR,ubG,ubB;
ColorToRGB( col, ubR,ubG,ubB);
if( ubR>WHITE_TRESHOLD && ubG>WHITE_TRESHOLD && ubB>WHITE_TRESHOLD) return TRUE;
return FALSE;
}
BOOL IsBigger( COLOR const col1, COLOR const col2)
{
UBYTE ubR1,ubG1,ubB1;
UBYTE ubR2,ubG2,ubB2;
ColorToRGB( col1, ubR1,ubG1,ubB1);
ColorToRGB( col2, ubR2,ubG2,ubB2);
SLONG slGray1 = (((SLONG)ubR1+ubG1+ubB1)*21846) >>16;
SLONG slGray2 = (((SLONG)ubR2+ubG2+ubB2)*21846) >>16;
return (slGray1>slGray2);
}
// has color same hue and saturation (with little tolerance) ?
BOOL CompareChroma( COLOR col1, COLOR col2)
{
// make color1 bigger
if( IsBigger(col2,col1)) Swap(col1,col2);
// find biggest component
SLONG slR1=0, slG1=0, slB1=0;
SLONG slR2=0, slG2=0, slB2=0;
ColorToRGB( col1, (UBYTE&)slR1, (UBYTE&)slG1, (UBYTE&)slB1);
ColorToRGB( col2, (UBYTE&)slR2, (UBYTE&)slG2, (UBYTE&)slB2);
SLONG slMax1 = Max(Max(slR1,slG1),slB1);
SLONG slMax2 = Max(Max(slR2,slG2),slB2);
// trivial?
if( slMax1<GRAY_TRESHOLD || slMax2<GRAY_TRESHOLD) return TRUE;
// find expected color
SLONG slR,slG,slB, slDiv;
if( slR1==slMax1) {
slDiv = 65536 / slR1;
slR = slR2;
slG = (slR2*slG1*slDiv)>>16;
slB = (slR2*slB1*slDiv)>>16;
} else if( slG1==slMax1) {
slDiv = 65536 / slG1;
slR = (slG2*slR1*slDiv)>>16;
slG = slG2;
slB = (slG2*slB1*slDiv)>>16;
} else {
slDiv = 65536 / slB1;
slR = (slB2*slR1*slDiv)>>16;
slG = (slB2*slG1*slDiv)>>16;
slB = slB2;
}
// check expected color
if( Abs(slR-slR2) > (GRAY_TRESHOLD/2)) return FALSE;
if( Abs(slG-slG2) > (GRAY_TRESHOLD/2)) return FALSE;
if( Abs(slB-slB2) > (GRAY_TRESHOLD/2)) return FALSE;
return TRUE;
}
// find corresponding desaturated color (it's not same as gray!)
COLOR DesaturateColor( COLOR const col)
{
UBYTE ubR,ubG,ubB,ubA, ubMax;
ColorToRGBA( col, ubR,ubG,ubB,ubA);
ubMax = Max(Max(ubR,ubG),ubB);
return RGBAToColor( ubMax,ubMax,ubMax,ubA);
}
// adjust color saturation and/or hue
COLOR AdjustColor( COLOR const col, SLONG const slHueShift, SLONG const slSaturation)
{
// nothing?
if( slHueShift==0 && slSaturation==256) return col;
// saturation?
COLOR colRes = col;
UBYTE ubA = (col&CT_AMASK)>>CT_ASHIFT;
if( slSaturation!=256)
{ // calculate gray factor
UBYTE ubR,ubG,ubB;
ColorToRGB( col, ubR,ubG,ubB);
SLONG slGray = (ubR*72 + ubG*152 + ubB*32)>>8;
// saturate color components
SLONG slR = slGray + (((ubR-slGray)*slSaturation)>>8);
SLONG slG = slGray + (((ubG-slGray)*slSaturation)>>8);
SLONG slB = slGray + (((ubB-slGray)*slSaturation)>>8);
// clamp color components
colRes = RGBToColor( pubClipByte[slR], pubClipByte[slG], pubClipByte[slB]);
}
// hue?
if( slHueShift==0) return colRes|ubA;
UBYTE ubH,ubS,ubV;
ColorToHSV( colRes, ubH,ubS,ubV);
ubH += slHueShift;
return HSVAToColor( ubH,ubS,ubV,ubA);
}
// adjust color gamma correction
COLOR AdjustGamma( COLOR const col, FLOAT const fGamma)
{
if( fGamma==1.0f || fGamma<0.2f) return col;
const FLOAT f1oGamma = 1.0f / fGamma;
const FLOAT f1o255 = 1.0f / 255.0f;
UBYTE ubR,ubG,ubB,ubA;
ColorToRGBA( col, ubR,ubG,ubB,ubA);
ubR = ClampUp( NormFloatToByte(pow(ubR*f1o255,f1oGamma)), (ULONG) 255);
ubG = ClampUp( NormFloatToByte(pow(ubG*f1o255,f1oGamma)), (ULONG) 255);
ubB = ClampUp( NormFloatToByte(pow(ubB*f1o255,f1oGamma)), (ULONG) 255);
return RGBAToColor( ubR,ubG,ubB,ubA);
}
// color lerping functions
void LerpColor( COLOR col0, COLOR col1, FLOAT fRatio, UBYTE &ubR, UBYTE &ubG, UBYTE &ubB)
{
UBYTE ubR0, ubG0, ubB0;
UBYTE ubR1, ubG1, ubB1;
ColorToRGB( col0, ubR0, ubG0, ubB0);
ColorToRGB( col1, ubR1, ubG1, ubB1);
ubR = Lerp( ubR0, ubR1, fRatio);
ubG = Lerp( ubG0, ubG1, fRatio);
ubB = Lerp( ubB0, ubB1, fRatio);
}
COLOR LerpColor( COLOR col0, COLOR col1, FLOAT fRatio)
{
UBYTE ubR0, ubG0, ubB0, ubA0;
UBYTE ubR1, ubG1, ubB1, ubA1;
ColorToRGBA( col0, ubR0, ubG0, ubB0, ubA0);
ColorToRGBA( col1, ubR1, ubG1, ubB1, ubA1);
ubR0 = Lerp( ubR0, ubR1, fRatio);
ubG0 = Lerp( ubG0, ubG1, fRatio);
ubB0 = Lerp( ubB0, ubB1, fRatio);
ubA0 = Lerp( ubA0, ubA1, fRatio);
return RGBAToColor( ubR0, ubG0, ubB0, ubA0);
}
// fast color multiply function - RES = 1ST * 2ND /255
COLOR MulColors( COLOR col1, COLOR col2)
{
if( col1==0xFFFFFFFF) return col2;
if( col2==0xFFFFFFFF) return col1;
if( col1==0 || col2==0) return 0;
#if (defined USE_PORTABLE_C)
// !!! FIXME: This...is not fast.
union
{
COLOR col;
UBYTE bytes[4];
} conv1;
union
{
COLOR col;
UBYTE bytes[4];
} conv2;
conv1.col = col1;
conv2.col = col2;
conv1.bytes[0] = (UBYTE) ((((DWORD) conv1.bytes[0]) * ((DWORD) conv2.bytes[0])) / 255);
conv1.bytes[1] = (UBYTE) ((((DWORD) conv1.bytes[1]) * ((DWORD) conv2.bytes[1])) / 255);
conv1.bytes[2] = (UBYTE) ((((DWORD) conv1.bytes[2]) * ((DWORD) conv2.bytes[2])) / 255);
conv1.bytes[3] = (UBYTE) ((((DWORD) conv1.bytes[3]) * ((DWORD) conv2.bytes[3])) / 255);
return(conv1.col);
#elif (defined __MSVC_INLINE__)
COLOR colRet;
__asm {
xor ebx,ebx
// red
mov eax,D [col1]
and eax,CT_RMASK
shr eax,CT_RSHIFT
mov ecx,eax
shl ecx,8
or eax,ecx
mov edx,D [col2]
and edx,CT_RMASK
shr edx,CT_RSHIFT
mov ecx,edx
shl ecx,8
or edx,ecx
imul eax,edx
shr eax,16+8
shl eax,CT_RSHIFT
or ebx,eax
// green
mov eax,D [col1]
and eax,CT_GMASK
shr eax,CT_GSHIFT
mov ecx,eax
shl ecx,8
or eax,ecx
mov edx,D [col2]
and edx,CT_GMASK
shr edx,CT_GSHIFT
mov ecx,edx
shl ecx,8
or edx,ecx
imul eax,edx
shr eax,16+8
shl eax,CT_GSHIFT
or ebx,eax
// blue
mov eax,D [col1]
and eax,CT_BMASK
shr eax,CT_BSHIFT
mov ecx,eax
shl ecx,8
or eax,ecx
mov edx,D [col2]
and edx,CT_BMASK
shr edx,CT_BSHIFT
mov ecx,edx
shl ecx,8
or edx,ecx
imul eax,edx
shr eax,16+8
shl eax,CT_BSHIFT
or ebx,eax
// alpha
mov eax,D [col1]
and eax,CT_AMASK
shr eax,CT_ASHIFT
mov ecx,eax
shl ecx,8
or eax,ecx
mov edx,D [col2]
and edx,CT_AMASK
shr edx,CT_ASHIFT
mov ecx,edx
shl ecx,8
or edx,ecx
imul eax,edx
shr eax,16+8
shl eax,CT_ASHIFT
or ebx,eax
// done
mov D [colRet],ebx
}
return colRet;
#elif (defined __GNU_INLINE__)
COLOR colRet;
__asm__ __volatile__ (
"pushl %%ebx \n\t"
"xorl %%ebx, %%ebx \n\t"
// red
"movl %%esi, %%eax \n\t"
"andl $0xFF000000, %%eax \n\t"
"shrl $24, %%eax \n\t"
"movl %%eax, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"movl %%edi, %%edx \n\t"
"andl $0xFF000000, %%edx \n\t"
"shrl $24, %%edx \n\t"
"movl %%edx, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%edx \n\t"
"imull %%edx, %%eax \n\t"
"shrl $24, %%eax \n\t"
"shll $24, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// green
"movl %%esi, %%eax \n\t"
"andl $0x00FF0000, %%eax \n\t"
"shrl $16, %%eax \n\t"
"movl %%eax, %%ecx \n\t"
"shll $8,%%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"movl %%edi, %%edx \n\t"
"andl $0x00FF0000, %%edx \n\t"
"shrl $16, %%edx \n\t"
"movl %%edx, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%edx \n\t"
"imull %%edx, %%eax \n\t"
"shrl $24, %%eax \n\t"
"shll $16, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// blue
"movl %%esi, %%eax \n\t"
"andl $0x0000FF00, %%eax \n\t"
"shrl $8, %%eax \n\t"
"movl %%eax, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"movl %%edi, %%edx \n\t"
"andl $0x0000FF00, %%edx \n\t"
"shrl $8, %%edx \n\t"
"movl %%edx, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%edx \n\t"
"imull %%edx, %%eax \n\t"
"shrl $24, %%eax \n\t"
"shll $8, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// alpha
"movl %%esi, %%eax \n\t"
"andl $0x000000FF, %%eax \n\t"
"shrl $0, %%eax \n\t" // !!! FIXME: Lose this line.
"movl %%eax, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"movl %%edi, %%edx \n\t"
"andl $0x000000FF, %%edx \n\t"
"shrl $0, %%edx \n\t" // !!! FIXME: Lose this line.
"movl %%edx, %%ecx \n\t"
"shll $8, %%ecx \n\t"
"orl %%ecx, %%edx \n\t"
"imull %%edx, %%eax \n\t"
"shrl $24, %%eax \n\t"
"shll $0, %%eax \n\t" // !!! FIXME: Lose this line.
"orl %%eax, %%ebx \n\t"
"movl %%ebx, %%ecx \n\t"
"popl %%ebx \n\t"
: "=c" (colRet)
: "S" (col1), "D" (col2)
: "eax", "edx", "cc", "memory"
);
return colRet;
#else
#error please fill in inline assembly for your platform.
#endif
}
// fast color additon function - RES = clamp (1ST + 2ND)
COLOR AddColors( COLOR col1, COLOR col2)
{
if( col1==0) return col2;
if( col2==0) return col1;
if( col1==0xFFFFFFFF || col2==0xFFFFFFFF) return 0xFFFFFFFF;
COLOR colRet;
#if (defined USE_PORTABLE_C)
// !!! FIXME: This...is not fast.
union
{
COLOR col;
UBYTE bytes[4];
} conv1;
union
{
COLOR col;
UBYTE bytes[4];
} conv2;
#define MINVAL(a, b) ((a)>(b))?(b):(a)
conv1.col = col1;
conv2.col = col2;
conv1.bytes[0] = (UBYTE) MINVAL((((WORD) conv1.bytes[0]) + ((WORD) conv2.bytes[0])) , 255);
conv1.bytes[1] = (UBYTE) MINVAL((((WORD) conv1.bytes[1]) + ((WORD) conv2.bytes[1])) , 255);
conv1.bytes[2] = (UBYTE) MINVAL((((WORD) conv1.bytes[2]) + ((WORD) conv2.bytes[2])) , 255);
conv1.bytes[3] = (UBYTE) MINVAL((((WORD) conv1.bytes[3]) + ((WORD) conv2.bytes[3])) , 255);
#undef MINVAL
colRet = conv1.col;
#elif (defined __MSVC_INLINE__)
__asm {
xor ebx,ebx
mov esi,255
// red
mov eax,D [col1]
and eax,CT_RMASK
shr eax,CT_RSHIFT
mov edx,D [col2]
and edx,CT_RMASK
shr edx,CT_RSHIFT
add eax,edx
cmp esi,eax // clamp
sbb ecx,ecx
or eax,ecx
shl eax,CT_RSHIFT
and eax,CT_RMASK
or ebx,eax
// green
mov eax,D [col1]
and eax,CT_GMASK
shr eax,CT_GSHIFT
mov edx,D [col2]
and edx,CT_GMASK
shr edx,CT_GSHIFT
add eax,edx
cmp esi,eax // clamp
sbb ecx,ecx
or eax,ecx
shl eax,CT_GSHIFT
and eax,CT_GMASK
or ebx,eax
// blue
mov eax,D [col1]
and eax,CT_BMASK
shr eax,CT_BSHIFT
mov edx,D [col2]
and edx,CT_BMASK
shr edx,CT_BSHIFT
add eax,edx
cmp esi,eax // clamp
sbb ecx,ecx
or eax,ecx
shl eax,CT_BSHIFT
and eax,CT_BMASK
or ebx,eax
// alpha
mov eax,D [col1]
and eax,CT_AMASK
shr eax,CT_ASHIFT
mov edx,D [col2]
and edx,CT_AMASK
shr edx,CT_ASHIFT
add eax,edx
cmp esi,eax // clamp
sbb ecx,ecx
or eax,ecx
shl eax,CT_ASHIFT
and eax,CT_AMASK
or ebx,eax
// done
mov D [colRet],ebx
}
#elif (defined __GNU_INLINE__)
__asm__ __volatile__ (
"pushl %%ebx \n\t"
"pushl %%edi \n\t"
"pushl %%esi \n\t"
"xorl %%ebx, %%ebx \n\t"
"mov $255, %%esi \n\t"
// red
"movl (%%esp), %%eax \n\t"
"andl $0xFF000000, %%eax \n\t"
"shrl $24, %%eax \n\t"
"movl 4(%%esp), %%edx \n\t"
"andl $0xFF000000, %%edx \n\t"
"shrl $24, %%edx \n\t"
"addl %%edx, %%eax \n\t"
"cmpl %%eax, %%esi \n\t" // clamp
"sbbl %%ecx, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"shll $24, %%eax \n\t"
"andl $0xFF000000, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// green
"movl (%%esp), %%eax \n\t"
"andl $0x00FF0000, %%eax \n\t"
"shrl $16, %%eax \n\t"
"movl 4(%%esp), %%edx \n\t"
"andl $0x00FF0000, %%edx \n\t"
"shrl $16, %%edx \n\t"
"addl %%edx, %%eax \n\t"
"cmpl %%eax, %%esi \n\t" // clamp
"sbbl %%ecx, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"shll $16, %%eax \n\t"
"andl $0x00FF0000, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// blue
"movl (%%esp), %%eax \n\t"
"andl $0x0000FF00, %%eax \n\t"
"shrl $8, %%eax \n\t"
"movl 4(%%esp), %%edx \n\t"
"andl $0x0000FF00, %%edx \n\t"
"shrl $8, %%edx \n\t"
"addl %%edx, %%eax \n\t"
"cmpl %%eax, %%esi \n\t" // clamp
"sbbl %%ecx, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"shll $8, %%eax \n\t"
"andl $0x0000FF00, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
// alpha
"movl (%%esp), %%eax \n\t"
"andl $0x000000FF, %%eax \n\t"
"shrl $0, %%eax \n\t"
"movl 4(%%esp), %%edx \n\t"
"andl $0x000000FF, %%edx \n\t"
"shrl $0, %%edx \n\t"
"addl %%edx, %%eax \n\t"
"cmpl %%eax, %%esi \n\t" // clamp
"sbbl %%ecx, %%ecx \n\t"
"orl %%ecx, %%eax \n\t"
"shll $0, %%eax \n\t"
"andl $0x000000FF, %%eax \n\t"
"orl %%eax, %%ebx \n\t"
"movl %%ebx, %%ecx \n\t"
// done.
"addl $8, %%esp \n\t"
"popl %%ebx \n\t"
: "=c" (colRet)
: "S" (col1), "D" (col2)
: "eax", "edx", "cc", "memory"
);
#else
#error please fill in inline assembly for your platform.
#endif
return colRet;
}
// multiple conversion from OpenGL color to DirectX color
extern void abgr2argb( ULONG *pulSrc, ULONG *pulDst, INDEX ct)
{
#if (defined USE_PORTABLE_C)
//#error write me.
for (int i=0; i<ct; i++) {
ULONG tmp = pulSrc[i];
pulDst[i] = (tmp&0xff00ff00) | ((tmp&0x00ff0000)>>16) | ((tmp&0x000000ff)<<16);
}
#elif (defined __MSVC_INLINE__)
__asm {
mov esi,dword ptr [pulSrc]
mov edi,dword ptr [pulDst]
mov ecx,dword ptr [ct]
shr ecx,2
jz colSkip4
colLoop4:
push ecx
mov eax,dword ptr [esi+ 0]
mov ebx,dword ptr [esi+ 4]
mov ecx,dword ptr [esi+ 8]
mov edx,dword ptr [esi+12]
bswap eax
bswap ebx
bswap ecx
bswap edx
ror eax,8
ror ebx,8
ror ecx,8
ror edx,8
mov dword ptr [edi+ 0],eax
mov dword ptr [edi+ 4],ebx
mov dword ptr [edi+ 8],ecx
mov dword ptr [edi+12],edx
add esi,4*4
add edi,4*4
pop ecx
dec ecx
jnz colLoop4
colSkip4:
test dword ptr [ct],2
jz colSkip2
mov eax,dword ptr [esi+0]
mov ebx,dword ptr [esi+4]
bswap eax
bswap ebx
ror eax,8
ror ebx,8
mov dword ptr [edi+0],eax
mov dword ptr [edi+4],ebx
add esi,4*2
add edi,4*2
colSkip2:
test dword ptr [ct],1
jz colSkip1
mov eax,dword ptr [esi]
bswap eax
ror eax,8
mov dword ptr [edi],eax
colSkip1:
}
#elif (defined __GNU_INLINE__)
STUBBED("convert to inline asm.");
#else
#error please fill in inline assembly for your platform.
#endif
}