mirror of
https://github.com/dborth/snes9xgx.git
synced 2025-01-12 11:19:07 +01:00
minor optimizations
This commit is contained in:
parent
9e0bff0219
commit
0e5d796a44
@ -54,9 +54,9 @@ uint32_t* Metaphrasis::convertBufferToI4(uint32_t* rgbaBuffer, uint16_t bufferWi
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint8_t *dst = (uint8_t *)dataBufferI4;
|
uint8_t *dst = (uint8_t *)dataBufferI4;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 8) {
|
for(uint32_t y = 0; y < bufferHeight; y += 8) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 8) {
|
for(uint32_t x = 0; x < bufferWidth; x += 8) {
|
||||||
for(uint16_t rows = 0; rows < 8; rows++) {
|
for(uint32_t rows = 0; rows < 8; rows++) {
|
||||||
*dst++ = (src[((y + rows) * bufferWidth) + (x + 0)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 1)] & 0xf0) >> 4);
|
*dst++ = (src[((y + rows) * bufferWidth) + (x + 0)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 1)] & 0xf0) >> 4);
|
||||||
*dst++ = (src[((y + rows) * bufferWidth) + (x + 2)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 3)] & 0xf0) >> 4);
|
*dst++ = (src[((y + rows) * bufferWidth) + (x + 2)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 3)] & 0xf0) >> 4);
|
||||||
*dst++ = (src[((y + rows) * bufferWidth) + (x + 4)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 5)] & 0xf0) >> 4);
|
*dst++ = (src[((y + rows) * bufferWidth) + (x + 4)] & 0xf0) | ((src[((y + rows) * bufferWidth) + (x + 5)] & 0xf0) >> 4);
|
||||||
@ -88,17 +88,19 @@ uint32_t* Metaphrasis::convertBufferToI8(uint32_t* rgbaBuffer, uint16_t bufferWi
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint8_t *dst = (uint8_t *)dataBufferI8;
|
uint8_t *dst = (uint8_t *)dataBufferI8;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 4) {
|
for(uint32_t rows = 0; rows < 4; rows++) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 8) {
|
for(uint32_t y = 0; y < bufferHeight; y += 4) {
|
||||||
for(uint16_t rows = 0; rows < 4; rows++) {
|
uint32_t bufWid = ((y + rows) * bufferWidth);
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 0)] & 0xff;
|
for(uint32_t x = 0; x < bufferWidth; x += 8) {
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 1)] & 0xff;
|
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 2)] & 0xff;
|
*dst++ = src[bufWid + (x + 0)] & 0xff;
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 3)] & 0xff;
|
*dst++ = src[bufWid + (x + 1)] & 0xff;
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 4)] & 0xff;
|
*dst++ = src[bufWid + (x + 2)] & 0xff;
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 5)] & 0xff;
|
*dst++ = src[bufWid + (x + 3)] & 0xff;
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 6)] & 0xff;
|
*dst++ = src[bufWid + (x + 4)] & 0xff;
|
||||||
*dst++ = src[((y + rows) * bufferWidth) + (x + 7)] & 0xff;
|
*dst++ = src[bufWid + (x + 5)] & 0xff;
|
||||||
|
*dst++ = src[bufWid + (x + 6)] & 0xff;
|
||||||
|
*dst++ = src[bufWid + (x + 7)] & 0xff;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -117,11 +119,8 @@ uint32_t* Metaphrasis::convertBufferToI8(uint32_t* rgbaBuffer, uint16_t bufferWi
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
uint8_t Metaphrasis::convertRGBAToIA4(uint32_t rgba) {
|
uint8_t Metaphrasis::convertRGBAToIA4(uint32_t rgba) {
|
||||||
uint8_t i, a;
|
uint8_t i = (rgba >> 8) & 0xf0;
|
||||||
|
uint8_t a = (rgba ) & 0xff;
|
||||||
i = (rgba >> 8) & 0xf0;
|
|
||||||
a = (rgba ) & 0xff;
|
|
||||||
|
|
||||||
return i | (a >> 4);
|
return i | (a >> 4);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -144,9 +143,9 @@ uint32_t* Metaphrasis::convertBufferToIA4(uint32_t* rgbaBuffer, uint16_t bufferW
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint8_t *dst = (uint8_t *)dataBufferIA4;
|
uint8_t *dst = (uint8_t *)dataBufferIA4;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 4) {
|
for(uint32_t y = 0; y < bufferHeight; y += 4) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 8) {
|
for(uint32_t x = 0; x < bufferWidth; x += 8) {
|
||||||
for(uint16_t rows = 0; rows < 4; rows++) {
|
for(uint32_t rows = 0; rows < 4; rows++) {
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 0)]);
|
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 0)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 1)]);
|
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 1)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 2)]);
|
*dst++ = Metaphrasis::convertRGBAToIA4(src[((y + rows) * bufferWidth) + (x + 2)]);
|
||||||
@ -173,12 +172,7 @@ uint32_t* Metaphrasis::convertBufferToIA4(uint32_t* rgbaBuffer, uint16_t bufferW
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
uint16_t Metaphrasis::convertRGBAToIA8(uint32_t rgba) {
|
uint16_t Metaphrasis::convertRGBAToIA8(uint32_t rgba) {
|
||||||
uint8_t i, a;
|
return (((rgba >> 8) & 0xff) << 8) | ((rgba ) & 0xff);
|
||||||
|
|
||||||
i = (rgba >> 8) & 0xff;
|
|
||||||
a = (rgba ) & 0xff;
|
|
||||||
|
|
||||||
return (i << 8) | a;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
@ -200,13 +194,15 @@ uint32_t* Metaphrasis::convertBufferToIA8(uint32_t* rgbaBuffer, uint16_t bufferW
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint16_t *dst = (uint16_t *)dataBufferIA8;
|
uint16_t *dst = (uint16_t *)dataBufferIA8;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 4) {
|
for(uint32_t rows = 0; rows < 4; ++rows) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 4) {
|
for(uint32_t y = 0; y < bufferHeight; y += 4) {
|
||||||
for(uint16_t rows = 0; rows < 4; rows++) {
|
uint32_t bufWid = ((y + rows) * bufferWidth);
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA8(src[((y + rows) * bufferWidth) + (x + 0)]);
|
for(uint32_t x = 0; x < bufferWidth; x += 4) {
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA8(src[((y + rows) * bufferWidth) + (x + 1)]);
|
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA8(src[((y + rows) * bufferWidth) + (x + 2)]);
|
*dst++ = Metaphrasis::convertRGBAToIA8(src[bufWid + (x + 0)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToIA8(src[((y + rows) * bufferWidth) + (x + 3)]);
|
*dst++ = Metaphrasis::convertRGBAToIA8(src[bufWid + (x + 1)]);
|
||||||
|
*dst++ = Metaphrasis::convertRGBAToIA8(src[bufWid + (x + 2)]);
|
||||||
|
*dst++ = Metaphrasis::convertRGBAToIA8(src[bufWid + (x + 3)]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -234,19 +230,31 @@ uint32_t* Metaphrasis::convertBufferToRGBA8(uint32_t* rgbaBuffer, uint16_t buffe
|
|||||||
uint8_t *src = (uint8_t *)rgbaBuffer;
|
uint8_t *src = (uint8_t *)rgbaBuffer;
|
||||||
uint8_t *dst = (uint8_t *)dataBufferRGBA8;
|
uint8_t *dst = (uint8_t *)dataBufferRGBA8;
|
||||||
|
|
||||||
for(uint16_t block = 0; block < bufferHeight; block += 4) {
|
for(uint32_t block = 0; block < bufferHeight; block += 4) {
|
||||||
for(uint16_t i = 0; i < bufferWidth; i += 4) {
|
for(uint32_t i = 0; i < bufferWidth; i += 4) {
|
||||||
for (uint16_t c = 0; c < 4; c++) {
|
for (uint32_t c = 0; c < 4; c++) {
|
||||||
for (uint16_t ar = 0; ar < 4; ar++) {
|
uint32_t blockWid = (((block + c) * bufferWidth)+i)<<2 ;
|
||||||
*dst++ = src[(((i + ar) + ((block + c) * bufferWidth)) * 4) + 3];
|
|
||||||
*dst++ = src[((i + ar) + ((block + c) * bufferWidth)) * 4];
|
*dst++ = src[blockWid+ 3]; // ar = 0
|
||||||
}
|
*dst++ = src[blockWid+ 0];
|
||||||
|
*dst++ = src[blockWid+ 7]; // ar = 1
|
||||||
|
*dst++ = src[blockWid+ 4];
|
||||||
|
*dst++ = src[blockWid+ 11]; // ar = 2
|
||||||
|
*dst++ = src[blockWid+ 8];
|
||||||
|
*dst++ = src[blockWid+ 15]; // ar = 3
|
||||||
|
*dst++ = src[blockWid+ 12];
|
||||||
}
|
}
|
||||||
for (uint16_t c = 0; c < 4; c++) {
|
for (uint32_t c = 0; c < 4; c++) {
|
||||||
for (uint16_t gb = 0; gb < 4; gb++) {
|
uint32_t blockWid = (((block + c) * bufferWidth)+i)<<2 ;
|
||||||
*dst++ = src[(((i + gb) + ((block + c) * bufferWidth)) * 4) + 1];
|
|
||||||
*dst++ = src[(((i + gb) + ((block + c) * bufferWidth)) * 4) + 2];
|
*dst++ = src[blockWid+ 1]; // gb = 0
|
||||||
}
|
*dst++ = src[blockWid+ 2];
|
||||||
|
*dst++ = src[blockWid+ 5]; // gb = 1
|
||||||
|
*dst++ = src[blockWid+ 6];
|
||||||
|
*dst++ = src[blockWid+ 9]; // gb = 2
|
||||||
|
*dst++ = src[blockWid+ 10];
|
||||||
|
*dst++ = src[blockWid+ 13]; // gb = 3
|
||||||
|
*dst++ = src[blockWid+ 14];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -266,12 +274,9 @@ uint32_t* Metaphrasis::convertBufferToRGBA8(uint32_t* rgbaBuffer, uint16_t buffe
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
uint16_t Metaphrasis::convertRGBAToRGB565(uint32_t rgba) {
|
uint16_t Metaphrasis::convertRGBAToRGB565(uint32_t rgba) {
|
||||||
uint8_t r, g, b;
|
uint8_t r = (((rgba >> 24) & 0xff) * 31) / 255;
|
||||||
|
uint8_t g = (((rgba >> 16) & 0xff) * 63) / 255;
|
||||||
r = (((rgba >> 24) & 0xff) * 31) / 255;
|
uint8_t b = (((rgba >> 8) & 0xff) * 31) / 255;
|
||||||
g = (((rgba >> 16) & 0xff) * 63) / 255;
|
|
||||||
b = (((rgba >> 8) & 0xff) * 31) / 255;
|
|
||||||
|
|
||||||
return (((r << 6) | g ) << 5 ) | b;
|
return (((r << 6) | g ) << 5 ) | b;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -294,13 +299,14 @@ uint32_t* Metaphrasis::convertBufferToRGB565(uint32_t* rgbaBuffer, uint16_t buff
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint16_t *dst = (uint16_t *)dataBufferRGB565;
|
uint16_t *dst = (uint16_t *)dataBufferRGB565;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 4) {
|
for(uint32_t rows = 0; rows < 4; rows++) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 4) {
|
for(uint32_t y = 0; y < bufferHeight; y += 4) {
|
||||||
for(uint16_t rows = 0; rows < 4; rows++) {
|
uint32_t bufWid = ((y + rows) * bufferWidth);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB565(src[((y + rows) * bufferWidth) + (x + 0)]);
|
for(uint32_t x = 0; x < bufferWidth; x += 4) {
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB565(src[((y + rows) * bufferWidth) + (x + 1)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB565(src[bufWid + (x + 0)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB565(src[((y + rows) * bufferWidth) + (x + 2)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB565(src[bufWid + (x + 1)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB565(src[((y + rows) * bufferWidth) + (x + 3)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB565(src[bufWid + (x + 2)]);
|
||||||
|
*dst++ = Metaphrasis::convertRGBAToRGB565(src[bufWid + (x + 3)]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -320,31 +326,28 @@ uint32_t* Metaphrasis::convertBufferToRGB565(uint32_t* rgbaBuffer, uint16_t buff
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
uint16_t Metaphrasis::convertRGBAToRGB5A3(uint32_t rgba) {
|
uint16_t Metaphrasis::convertRGBAToRGB5A3(uint32_t rgba) {
|
||||||
uint32_t r, g, b, a;
|
uint32_t r = (rgba >> 24) & 0xff;
|
||||||
|
uint32_t g = (rgba >> 16) & 0xff;
|
||||||
|
uint32_t b = (rgba >> 8) & 0xff;
|
||||||
|
uint32_t a = (rgba ) & 0xff;
|
||||||
uint16_t color;
|
uint16_t color;
|
||||||
|
|
||||||
r = (rgba >> 24) & 0xff;
|
// No predictive misses, faster shifting
|
||||||
g = (rgba >> 16) & 0xff;
|
|
||||||
b = (rgba >> 8) & 0xff;
|
|
||||||
a = (rgba ) & 0xff;
|
|
||||||
|
|
||||||
if (a > 0xe0) {
|
if (a > 0xe0) {
|
||||||
r = r >> 3;
|
r >>= 3;
|
||||||
g = g >> 3;
|
g >>= 3;
|
||||||
b = b >> 3;
|
b >>= 3;
|
||||||
|
|
||||||
color = (r << 10) | (g << 5) | b;
|
color = (r << 10) | (g << 5) | b;
|
||||||
color |= 0x8000;
|
color |= 0x8000;
|
||||||
|
return color;
|
||||||
}
|
}
|
||||||
else {
|
|
||||||
r = r >> 4;
|
|
||||||
g = g >> 4;
|
|
||||||
b = b >> 4;
|
|
||||||
a = a >> 5;
|
|
||||||
|
|
||||||
color = (a << 12) | (r << 8) | (g << 4) | b;
|
r >>= 4;
|
||||||
}
|
g >>= 4;
|
||||||
|
b >>= 4;
|
||||||
|
a >>= 5;
|
||||||
|
color = (a << 12) | (r << 8) | (g << 4) | b;
|
||||||
return color;
|
return color;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -367,13 +370,14 @@ uint32_t* Metaphrasis::convertBufferToRGB5A3(uint32_t* rgbaBuffer, uint16_t buff
|
|||||||
uint32_t *src = (uint32_t *)rgbaBuffer;
|
uint32_t *src = (uint32_t *)rgbaBuffer;
|
||||||
uint16_t *dst = (uint16_t *)dataBufferRGB5A3;
|
uint16_t *dst = (uint16_t *)dataBufferRGB5A3;
|
||||||
|
|
||||||
for(uint16_t y = 0; y < bufferHeight; y += 4) {
|
for(uint32_t rows = 0; rows < 4; rows++) {
|
||||||
for(uint16_t x = 0; x < bufferWidth; x += 4) {
|
for(uint32_t y = 0; y < bufferHeight; y += 4) {
|
||||||
for(uint16_t rows = 0; rows < 4; rows++) {
|
uint32_t bufWid = ((y + rows) * bufferWidth);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[((y + rows) * bufferWidth) + (x + 0)]);
|
for(uint32_t x = 0; x < bufferWidth; x += 4) {
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[((y + rows) * bufferWidth) + (x + 1)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[bufWid + (x + 0)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[((y + rows) * bufferWidth) + (x + 2)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[bufWid + (x + 1)]);
|
||||||
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[((y + rows) * bufferWidth) + (x + 3)]);
|
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[bufWid + (x + 2)]);
|
||||||
|
*dst++ = Metaphrasis::convertRGBAToRGB5A3(src[bufWid + (x + 3)]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -303,7 +303,7 @@ copy_to_xfb (u32 arg)
|
|||||||
GX_Flush ();
|
GX_Flush ();
|
||||||
copynow = GX_FALSE;
|
copynow = GX_FALSE;
|
||||||
}
|
}
|
||||||
FrameTimer++;
|
++FrameTimer;
|
||||||
}
|
}
|
||||||
|
|
||||||
/****************************************************************************
|
/****************************************************************************
|
||||||
@ -972,8 +972,9 @@ void Menu_DrawImg(f32 xpos, f32 ypos, u16 width, u16 height, u8 data[],
|
|||||||
GX_SetVtxDesc (GX_VA_TEX0, GX_DIRECT);
|
GX_SetVtxDesc (GX_VA_TEX0, GX_DIRECT);
|
||||||
|
|
||||||
Mtx m,m1,m2, mv;
|
Mtx m,m1,m2, mv;
|
||||||
width *=.5;
|
width >>= 1;
|
||||||
height*=.5;
|
height >>= 1;
|
||||||
|
|
||||||
guMtxIdentity (m1);
|
guMtxIdentity (m1);
|
||||||
guMtxScaleApply(m1,m1,scaleX,scaleY,1.0);
|
guMtxScaleApply(m1,m1,scaleX,scaleY,1.0);
|
||||||
guVector axis = (guVector) {0 , 0, 1 };
|
guVector axis = (guVector) {0 , 0, 1 };
|
||||||
@ -1014,26 +1015,20 @@ void Menu_DrawImg(f32 xpos, f32 ypos, u16 width, u16 height, u8 data[],
|
|||||||
***************************************************************************/
|
***************************************************************************/
|
||||||
void Menu_DrawRectangle(f32 x, f32 y, f32 width, f32 height, GXColor color, u8 filled)
|
void Menu_DrawRectangle(f32 x, f32 y, f32 width, f32 height, GXColor color, u8 filled)
|
||||||
{
|
{
|
||||||
u8 fmt;
|
long n = 4;
|
||||||
long n;
|
|
||||||
int i;
|
|
||||||
f32 x2 = x+width;
|
f32 x2 = x+width;
|
||||||
f32 y2 = y+height;
|
f32 y2 = y+height;
|
||||||
guVector v[] = {{x,y,0.0f}, {x2,y,0.0f}, {x2,y2,0.0f}, {x,y2,0.0f}, {x,y,0.0f}};
|
guVector v[] = {{x,y,0.0f}, {x2,y,0.0f}, {x2,y2,0.0f}, {x,y2,0.0f}, {x,y,0.0f}};
|
||||||
|
u8 fmt = GX_TRIANGLEFAN;
|
||||||
|
|
||||||
if(!filled)
|
if(!filled)
|
||||||
{
|
{
|
||||||
fmt = GX_LINESTRIP;
|
fmt = GX_LINESTRIP;
|
||||||
n = 5;
|
n = 5;
|
||||||
}
|
}
|
||||||
else
|
|
||||||
{
|
|
||||||
fmt = GX_TRIANGLEFAN;
|
|
||||||
n = 4;
|
|
||||||
}
|
|
||||||
|
|
||||||
GX_Begin(fmt, GX_VTXFMT0, n);
|
GX_Begin(fmt, GX_VTXFMT0, n);
|
||||||
for(i=0; i<n; i++)
|
for(long i=0; i<n; ++i)
|
||||||
{
|
{
|
||||||
GX_Position3f32(v[i].x, v[i].y, v[i].z);
|
GX_Position3f32(v[i].x, v[i].y, v[i].z);
|
||||||
GX_Color4u8(color.r, color.g, color.b, color.a);
|
GX_Color4u8(color.r, color.g, color.b, color.a);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user