libctru/libctru/source/gpu/shdr.c
2014-12-17 22:41:31 -08:00

200 lines
4.7 KiB
C

/*
shdr.c _ Shader loader.
*/
#include <stdlib.h>
#include <string.h>
#include <3ds/types.h>
#include <3ds/gpu/gpu.h>
#include <3ds/gpu/shdr.h>
//please don't feed this an invalid SHBIN
DVLB_s* SHDR_ParseSHBIN(u32* shbinData, u32 shbinSize)
{
if(!shbinData)return NULL;
DVLB_s* ret=malloc(sizeof(DVLB_s));
if(!ret)goto exit;
//parse DVLB
ret->numDVLE=shbinData[1];
ret->DVLE=malloc(sizeof(DVLE_s)*ret->numDVLE);
if(!ret->DVLE)goto clean1;
//parse DVLP
u32* dvlpData=&shbinData[2+ret->numDVLE];
ret->DVLP.codeSize=dvlpData[3];
ret->DVLP.codeData=&dvlpData[dvlpData[2]/4];
ret->DVLP.opdescSize=dvlpData[5];
ret->DVLP.opcdescData=&dvlpData[dvlpData[4]/4];
//parse DVLE
int i;
for(i=0;i<ret->numDVLE;i++)
{
DVLE_s* dvle=&ret->DVLE[i];
u32* dvleData=&shbinData[shbinData[2+i]/4];
dvle->type=(dvleData[1]>>16)&0xFF;
dvle->mainOffset=dvleData[2];
dvle->endmainOffset=dvleData[3];
dvle->constTableSize=dvleData[7];
dvle->constTableData=(DVLE_constEntry_s*)&dvleData[dvleData[6]/4];
dvle->outTableSize=dvleData[11];
dvle->outTableData=(DVLE_outEntry_s*)&dvleData[dvleData[10]/4];
dvle->uniformTableSize=dvleData[13];
dvle->uniformTableData=(DVLE_uniformEntry_s*)&dvleData[dvleData[12]/4];
dvle->symbolTableData=(char*)&dvleData[dvleData[14]/4];
}
goto exit;
clean1:
free(ret);
exit:
return ret;
}
s8 SHDR_GetUniformRegister(DVLB_s* dvlb, const char* name, u8 programID)
{
if(!dvlb || !name)return -1;
DVLE_s* dvle=&dvlb->DVLE[programID];
int i; DVLE_uniformEntry_s* u=dvle->uniformTableData;
for(i=0;i<dvle->uniformTableSize;i++)
{
if(!strcmp(&dvle->symbolTableData[u->symbolOffset],name))return (s8)u->startReg-0x10;
u++;
}
return -1;
}
void DVLP_SendCode(DVLP_s* dvlp)
{
if(!dvlp)return;
GPUCMD_AddSingleParam(0x000F02CB, 0x00000000);
int i;
for(i=0;i<dvlp->codeSize;i+=0x80)GPUCMD_Add(0x000F02CC, &dvlp->codeData[i], ((dvlp->codeSize-i)<0x80)?(dvlp->codeSize-i):0x80);
GPUCMD_AddSingleParam(0x000F02BF, 0x00000001);
}
void DVLP_SendOpDesc(DVLP_s* dvlp)
{
if(!dvlp)return;
GPUCMD_AddSingleParam(0x000F02D5, 0x00000000);
u32 param[0x20];
int i;
//TODO : should probably preprocess this
for(i=0;i<dvlp->opdescSize;i++)param[i]=dvlp->opcdescData[i*2];
GPUCMD_Add(0x000F02D6, param, dvlp->opdescSize);
}
void DVLE_SendOutmap(DVLE_s* dvle)
{
if(!dvle)return;
u32 param[0x7]={0x1F1F1F1F,0x1F1F1F1F,0x1F1F1F1F,0x1F1F1F1F,
0x1F1F1F1F,0x1F1F1F1F,0x1F1F1F1F};
int i;
u8 numAttr=0;
u8 maxAttr=0;
u8 attrMask=0;
//TODO : should probably preprocess this
for(i=0;i<dvle->outTableSize;i++)
{
u32* out=&param[dvle->outTableData[i].regID];
if(*out==0x1F1F1F1F)numAttr++;
//desc could include masking/swizzling info not currently taken into account
//also TODO : map out other output register values
switch(dvle->outTableData[i].type)
{
case RESULT_POSITION: *out=0x03020100; break;
case RESULT_COLOR: *out=0x0B0A0908; break;
case RESULT_TEXCOORD0: *out=0x1F1F0D0C; break;
case RESULT_TEXCOORD1: *out=0x1F1F0F0E; break;
case RESULT_TEXCOORD2: *out=0x1F1F1716; break;
}
attrMask|=1<<dvle->outTableData[i].regID;
if(dvle->outTableData[i].regID+1>maxAttr)maxAttr=dvle->outTableData[i].regID+1;
}
GPUCMD_AddSingleParam(0x000F0251, numAttr-1); //?
GPUCMD_AddSingleParam(0x000F024A, numAttr-1); //?
GPUCMD_AddSingleParam(0x000F02BD, attrMask); //?
GPUCMD_AddSingleParam(0x0001025E, numAttr-1); //?
GPUCMD_AddSingleParam(0x000F004F, numAttr); //?
GPUCMD_Add(0x800F0050, param, 0x00000007);
}
void DVLE_SendConstants(DVLE_s* dvle)
{
if(!dvle)return;
u32 param[4];
u32 rev[3];
u8* rev8=(u8*)rev;
int i;
DVLE_constEntry_s* cnst=dvle->constTableData;
for(i=0;i<dvle->constTableSize;i++,cnst++)
{
memcpy(&rev8[0], &cnst->data[0], 3);
memcpy(&rev8[3], &cnst->data[1], 3);
memcpy(&rev8[6], &cnst->data[2], 3);
memcpy(&rev8[9], &cnst->data[3], 3);
param[0x0]=(cnst->header>>16)&0xFF;
param[0x1]=rev[2];
param[0x2]=rev[1];
param[0x3]=rev[0];
GPUCMD_Add(0x800F02C0, param, 0x00000004);
}
}
void SHDR_UseProgram(DVLB_s* dvlb, u8 id)
{
if(!dvlb || id>dvlb->numDVLE)return;
DVLE_s* dvle=&dvlb->DVLE[id];
//?
GPUCMD_AddSingleParam(0x00010229, 0x00000000);
GPUCMD_AddSingleParam(0x00010244, 0x00000000);
DVLP_SendCode(&dvlb->DVLP);
DVLP_SendOpDesc(&dvlb->DVLP);
DVLE_SendConstants(dvle);
GPUCMD_AddSingleParam(0x00080229, 0x00000000);
GPUCMD_AddSingleParam(0x000F02BA, 0x7FFF0000|(dvle->mainOffset&0xFFFF)); //set entrypoint
GPUCMD_AddSingleParam(0x000F0252, 0x00000000); // should all be part of DVLE_SendOutmap ?
DVLE_SendOutmap(dvle);
//?
GPUCMD_AddSingleParam(0x000F0064, 0x00000001);
GPUCMD_AddSingleParam(0x000F006F, 0x00000703);
}
//TODO
void SHDR_FreeDVLB(DVLB_s* dvlb)
{
if(!dvlb)return;
}