Files
pspsdk/src/samples/gu/speed/speed.c
2024-07-14 17:01:20 +02:00

461 lines
13 KiB
C

/*
* PSP Software Development Kit - https://github.com/pspdev
* -----------------------------------------------------------------------
* Licensed under the BSD license, see LICENSE in PSPSDK root for details.
*
* Copyright (c) 2005 Jesper Svennevid
*/
#include <pspkernel.h>
#include <pspdisplay.h>
#include <pspdebug.h>
#include <stdlib.h>
#include <stdio.h>
#include <math.h>
#include <string.h>
#include <pspctrl.h>
#include <pspgu.h>
#include <psprtc.h>
#include "../common/callbacks.h"
PSP_MODULE_INFO("Memory Speed Sample", 0, 1, 1);
PSP_MAIN_THREAD_ATTR(THREAD_ATTR_USER);
#define SLICE_SIZE 32 // change this to experiment with different page-cache sizes
#define BUF_WIDTH (512)
#define SCR_WIDTH (480)
#define SCR_HEIGHT (272)
static unsigned int __attribute__((aligned(16))) list[262144];
static u32 __attribute__((aligned(16))) pixels[BUF_WIDTH*SCR_HEIGHT];
static u32 __attribute__((aligned(16))) swizzled_pixels[BUF_WIDTH*SCR_HEIGHT];
struct Vertex
{
unsigned short u, v;
unsigned short color;
short x, y, z;
} __attribute__ ((packed));
static void spriteBlit(int sx, int sy, int sw, int sh, int dx, int dy)
{
// simple blit, this just copies A->B, with all the cache-misses that apply
struct Vertex* vertices = (struct Vertex*)sceGuGetMemory(2 * sizeof(struct Vertex));
vertices[0].u = sx; vertices[0].v = sy;
vertices[0].color = 0;
vertices[0].x = dx; vertices[0].y = dy; vertices[0].z = 0;
vertices[1].u = sx+sw; vertices[1].v = sy+sh;
vertices[1].color = 0;
vertices[1].x = dx+sw; vertices[1].y = dy+sh; vertices[1].z = 0;
sceGuDrawArray(GU_SPRITES,GU_TEXTURE_16BIT|GU_COLOR_4444|GU_VERTEX_16BIT|GU_TRANSFORM_2D,2,0,vertices);
}
static void triangleBlit(int sx, int sy, int sw, int sh, int dx, int dy)
{
// simple blit, this just copies A->B, with all the cache-misses that apply
struct Vertex* vertices = (struct Vertex*)sceGuGetMemory(6 * sizeof(struct Vertex));
vertices[0].u = sx; vertices[0].v = sy;
vertices[0].color = 0;
vertices[0].x = dx; vertices[0].y = dy; vertices[0].z = 0;
vertices[1].u = sx+sw; vertices[1].v = sy;
vertices[1].color = 0;
vertices[1].x = dx+sw; vertices[1].y = dy; vertices[1].z = 0;
vertices[2].u = sx+sw; vertices[2].v = sy+sh;
vertices[2].color = 0;
vertices[2].x = dx+sw; vertices[2].y = dy+sh; vertices[2].z = 0;
vertices[3].u = sx; vertices[3].v = sy;
vertices[3].color = 0;
vertices[3].x = dx; vertices[3].y = dy; vertices[3].z = 0;
vertices[4].u = sx+sw; vertices[4].v = sy+sh;
vertices[4].color = 0;
vertices[4].x = dx+sw; vertices[4].y = dy+sh; vertices[4].z = 0;
vertices[5].u = sx; vertices[5].v = sy+sh;
vertices[5].color = 0;
vertices[5].x = dx; vertices[5].y = dy+sh; vertices[5].z = 0;
sceGuDrawArray(GU_TRIANGLES,GU_TEXTURE_16BIT|GU_COLOR_4444|GU_VERTEX_16BIT|GU_TRANSFORM_2D,6,0,vertices);
}
static void advancedSpriteBlit(int sx, int sy, int sw, int sh, int dx, int dy, int slice)
{
int start, end, i;
// blit maximizing the use of the texture-cache
// Calculate needed vertices
int numVertices = 0;
for (start = sx, end = sx+sw; start < end; start += slice)
numVertices += 2;
struct Vertex* vertices = (struct Vertex*)sceGuGetMemory(numVertices * sizeof(struct Vertex));
for (start = sx, end = sx+sw, i = 0; start < end; start += slice, dx += slice, i += 2)
{
int width = (start + slice) < end ? slice : end-start;
vertices[i+0].u = start; vertices[i+0].v = sy;
vertices[i+0].color = 0;
vertices[i+0].x = dx; vertices[i+0].y = dy; vertices[i+0].z = 0;
vertices[i+1].u = start + width; vertices[i+1].v = sy + sh;
vertices[i+1].color = 0;
vertices[i+1].x = dx + width; vertices[i+1].y = dy + sh; vertices[i+1].z = 0;
}
sceGuDrawArray(GU_SPRITES,GU_TEXTURE_16BIT|GU_COLOR_4444|GU_VERTEX_16BIT|GU_TRANSFORM_2D,numVertices,0,vertices);
}
static void advancedTriangleBlit(int sx, int sy, int sw, int sh, int dx, int dy, int slice)
{
int start, end, i;
// blit maximizing the use of the texture-cache
// Calculate needed vertices
int numVertices = 0;
for (start = sx, end = sx+sw; start < end; start += slice)
numVertices += 6;
struct Vertex* vertices = (struct Vertex*)sceGuGetMemory(numVertices * sizeof(struct Vertex));
for (start = sx, end = sx+sw, i=0; start < end; start += slice, dx += slice, i +=6)
{
int width = (start + slice) < end ? slice : end-start;
vertices[i+0].u = start; vertices[i+0].v = sy;
vertices[i+0].color = 0;
vertices[i+0].x = dx; vertices[i+0].y = dy; vertices[i+0].z = 0;
vertices[i+1].u = start+width; vertices[i+1].v = sy;
vertices[i+1].color = 0;
vertices[i+1].x = dx+width; vertices[i+1].y = dy; vertices[i+1].z = 0;
vertices[i+2].u = start+width; vertices[i+2].v = sy+sh;
vertices[i+2].color = 0;
vertices[i+2].x = dx+width; vertices[i+2].y = dy+sh; vertices[i+2].z = 0;
vertices[i+3].u = start; vertices[i+3].v = sy;
vertices[i+3].color = 0;
vertices[i+3].x = dx; vertices[i+3].y = dy; vertices[i+3].z = 0;
vertices[i+4].u = start+width; vertices[i+4].v = sy+sh;
vertices[i+4].color = 0;
vertices[i+4].x = dx+width; vertices[i+4].y = dy+sh; vertices[i+4].z = 0;
vertices[i+5].u = start; vertices[i+5].v = sy+sh;
vertices[i+5].color = 0;
vertices[i+5].x = dx; vertices[i+5].y = dy+sh; vertices[i+5].z = 0;
}
sceGuDrawArray(GU_TRIANGLES,GU_TEXTURE_16BIT|GU_COLOR_4444|GU_VERTEX_16BIT|GU_TRANSFORM_2D,numVertices,0,vertices);
}
void swizzle_fast(u8* out, const u8* in, unsigned int width, unsigned int height)
{
unsigned int blockx, blocky;
unsigned int j;
unsigned int width_blocks = (width / 16);
unsigned int height_blocks = (height / 8);
unsigned int src_pitch = (width-16)/4;
unsigned int src_row = width * 8;
const u8* ysrc = in;
u32* dst = (u32*)out;
for (blocky = 0; blocky < height_blocks; ++blocky)
{
const u8* xsrc = ysrc;
for (blockx = 0; blockx < width_blocks; ++blockx)
{
const u32* src = (u32*)xsrc;
for (j = 0; j < 8; ++j)
{
*(dst++) = *(src++);
*(dst++) = *(src++);
*(dst++) = *(src++);
*(dst++) = *(src++);
src += src_pitch;
}
xsrc += 16;
}
ysrc += src_row;
}
}
enum BlitMode
{
BLITMODE_SPRITE,
BLITMODE_TRIANGLE,
BLITMODE_ADVANCED_SPRITE,
BLITMODE_ADVANCED_TRIANGLE,
BLITMODE_COUNT
};
static char *blitName(enum BlitMode blit_mode) {
switch (blit_mode) {
case BLITMODE_SPRITE: return "Sprite";
case BLITMODE_TRIANGLE: return "Triangle";
case BLITMODE_ADVANCED_SPRITE: return "Adv Sprite";
case BLITMODE_ADVANCED_TRIANGLE: return "Adv Triangle";
default: return "Unknown BlitMode";
}
}
static void blitTexture(enum BlitMode blit_mode, int sx, int sy, int sw, int sh, int dx, int dy, int slice) {
switch (blit_mode) {
case BLITMODE_SPRITE: spriteBlit(sx, sy, sw, sh, dx, dy); break;
case BLITMODE_TRIANGLE: triangleBlit(sx, sy, sw, sh, dx, dy); break;
case BLITMODE_ADVANCED_SPRITE: advancedSpriteBlit(sx, sy, sw, sh, dx, dy, slice); break;
case BLITMODE_ADVANCED_TRIANGLE: advancedTriangleBlit(sx, sy, sw, sh, dx, dy, slice); break;
case BLITMODE_COUNT: break;
}
}
struct StripWidthDeclaration
{
int width;
const char* name;
} strip_widths[] =
{
{16,"16"},
{32,"32"},
{64,"64"},
{128,"128"}
};
struct PixelFormatDeclaration
{
int psm;
int size;
int row_pitch;
const char* name;
} pixel_formats[] =
{
{GU_PSM_4444,SCR_WIDTH*SCR_HEIGHT*2,1024,"16-bit RGBA"},
{GU_PSM_T4,(SCR_WIDTH*SCR_HEIGHT)>>1,256,"4-bit CLUT"},
{GU_PSM_T8,SCR_WIDTH*SCR_HEIGHT,512,"8-bit CLUT"},
{GU_PSM_8888,SCR_WIDTH*SCR_HEIGHT*4,2048,"32-bit RGBA"}
};
u16 __attribute__((aligned(16))) palette[256];
int main(int argc, char* argv[])
{
unsigned int i;
setupCallbacks();
for (i = 0; i < 256; ++i)
palette[i] = i;
sceKernelDcacheWritebackAll();
// setup GU
void* fbp0 = guGetStaticVramBuffer(BUF_WIDTH,SCR_HEIGHT,GU_PSM_8888);
void* fbp1 = guGetStaticVramBuffer(BUF_WIDTH,SCR_HEIGHT,GU_PSM_8888);
void* zbp = guGetStaticVramBuffer(BUF_WIDTH,SCR_HEIGHT,GU_PSM_4444);
pspDebugScreenInit();
sceGuInit();
sceGuStart(GU_DIRECT,list);
sceGuDrawBuffer(GU_PSM_5650,fbp0,BUF_WIDTH);
sceGuDispBuffer(SCR_WIDTH,SCR_HEIGHT,fbp1,BUF_WIDTH);
sceGuDepthBuffer(zbp,BUF_WIDTH);
sceGuOffset(2048 - (SCR_WIDTH/2),2048 - (SCR_HEIGHT/2));
sceGuViewport(2048,2048,SCR_WIDTH,SCR_HEIGHT);
sceGuDepthRange(65535,0);
sceGuScissor(0,0,SCR_WIDTH,SCR_HEIGHT);
sceGuEnable(GU_SCISSOR_TEST);
sceGuFrontFace(GU_CW);
sceGuEnable(GU_TEXTURE_2D);
sceGuDepthMask(0xffff);
sceGuDisable(GU_DEPTH_TEST);
sceGuClear(GU_COLOR_BUFFER_BIT|GU_DEPTH_BUFFER_BIT);
sceGuClutMode(GU_PSM_4444,0,255,0);
sceGuClutLoad(256/8,palette);
sceGuFinish();
sceGuSync(0,0);
sceDisplayWaitVblankStart();
sceGuDisplay(1);
// get vram buffer for vram -> vram blit
void* vram_buffer;
vram_buffer = guGetStaticVramTexture(BUF_WIDTH,SCR_HEIGHT,GU_PSM_8888);
// flush caches to make sure no stray data remains
sceKernelDcacheWritebackAll();
float curr_ms = 1.0f;
enum BlitMode blit_method = BLITMODE_SPRITE;
int swizzle = 0;
int vram_select = 0;
int strip_width = 0;
int pixel_format = 0;
int initialized = 0;
SceCtrlData oldPad;
oldPad.Buttons = 0;
sceCtrlSetSamplingCycle(0);
sceCtrlSetSamplingMode(0);
u64 last_tick;
sceRtcGetCurrentTick(&last_tick);
u32 tick_res = sceRtcGetTickResolution();
int frame_count = 0;
while (running())
{
int texture_change = 0;
// deal with input
SceCtrlData pad;
if(sceCtrlPeekBufferPositive(&pad, 1))
{
if (pad.Buttons != oldPad.Buttons)
{
if (pad.Buttons & PSP_CTRL_CROSS) {
blit_method += 1;
if (blit_method == BLITMODE_COUNT)
blit_method = BLITMODE_SPRITE;
}
if (pad.Buttons & PSP_CTRL_CIRCLE)
{
swizzle ^= 1;
texture_change = 1;
}
if (pad.Buttons & PSP_CTRL_SQUARE)
{
vram_select ^= 1;
texture_change = 1;
}
if (pad.Buttons & PSP_CTRL_TRIANGLE)
strip_width = (strip_width+1) % (sizeof(strip_widths)/sizeof(struct StripWidthDeclaration));
if (pad.Buttons & (PSP_CTRL_RTRIGGER|PSP_CTRL_LTRIGGER))
{
if (pad.Buttons & PSP_CTRL_RTRIGGER)
++pixel_format;
else
--pixel_format;
pixel_format %= sizeof(pixel_formats) / sizeof(struct PixelFormatDeclaration);
texture_change = 1;
}
}
oldPad = pad;
}
// generate new texture if settings have changed
if (texture_change || !initialized)
{
u8* output = (u8*)pixels;
unsigned int x,y;
for (y = 0; y < 512; ++y)
for (x = 0; x < pixel_formats[pixel_format].row_pitch; ++x)
*output++ = x*y;
if (swizzle)
{
if (vram_select)
swizzle_fast((u8*)vram_buffer,(const u8*)pixels,pixel_formats[pixel_format].row_pitch,SCR_HEIGHT);
else
swizzle_fast((u8*)swizzled_pixels,(const u8*)pixels,pixel_formats[pixel_format].row_pitch,SCR_HEIGHT);
}
else
{
if (vram_select)
memcpy(vram_buffer,pixels,pixel_formats[pixel_format].row_pitch * SCR_HEIGHT);
}
sceKernelDcacheWritebackAll();
initialized = 1;
}
// begin rendering
sceGuStart(GU_DIRECT,list);
sceGuTexMode(pixel_formats[pixel_format].psm,0,0,swizzle); // 16-bit RGBA
sceGuTexImage(0,512,512,512,vram_select ? vram_buffer : swizzle ? swizzled_pixels : pixels); // setup texture as a 512x512 texture, even though the buffer is only 512x272 (480 visible)
sceGuTexFunc(GU_TFX_REPLACE,GU_TCC_RGBA); // don't get influenced by any vertex colors
sceGuTexFilter(GU_NEAREST,GU_NEAREST); // point-filtered sampling
blitTexture(blit_method,0,0,SCR_WIDTH,SCR_HEIGHT,0,0,strip_widths[strip_width].width);
sceGuFinish();
sceGuSync(0,0);
// sum results and update report if more than one second has passed since last time
++frame_count;
u64 curr_tick;
sceRtcGetCurrentTick(&curr_tick);
if ((curr_tick-last_tick) >= tick_res)
{
float curr_fps = 1.0f / curr_ms;
int transfer_rate = (curr_fps * pixel_formats[pixel_format].size) / (1024*1024);
pspDebugScreenSetOffset((int)fbp0);
pspDebugScreenSetXY(0,0);
pspDebugScreenPrintf("fps: %d.%03d (%dMB/s)",(int)curr_fps,(int)((curr_fps-(int)curr_fps) * 1000.0f),transfer_rate);
pspDebugScreenSetXY(0,1);
pspDebugScreenPrintf("%s %s %s %s", blitName(blit_method), swizzle ? "swizzled" : "linear",vram_select ? "video ram" : "system ram", strip_widths[strip_width].name);
pspDebugScreenSetXY(0,2);
pspDebugScreenPrintf("%s",pixel_formats[pixel_format].name);
pspDebugScreenSetXY(0,32);
pspDebugScreenPrintf("L/R = pixel format");
pspDebugScreenSetXY(0,33);
pspDebugScreenPrintf("X = blit method, O = swizzling, [] = memory, /\\ = strip width");
fbp0 = sceGuSwapBuffers();
// update timing for next pass
double time_span = ((curr_tick-last_tick)) / (float)tick_res;
curr_ms = time_span / frame_count;
frame_count = 0;
sceRtcGetCurrentTick(&last_tick);
}
}
sceGuTerm();
sceKernelExitGame();
return 0;
}