Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

pbkit: Enable flip stall; expose ramin, print_char, depth buffer internals #628

Open
wants to merge 8 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
53 changes: 25 additions & 28 deletions lib/pbkit/pbkit.c
Original file line number Diff line number Diff line change
Expand Up @@ -42,15 +42,6 @@
#define ADDR_FBMEM 2
#define ADDR_AGPMEM 3

#define DMA_CLASS_2 2
#define DMA_CLASS_3 3
#define DMA_CLASS_3D 0x3D

#define GR_CLASS_30 0x30
#define GR_CLASS_39 0x39
#define GR_CLASS_62 0x62
#define GR_CLASS_97 0x97
#define GR_CLASS_9F 0x9F

#define GPU_IRQ 3

Expand All @@ -69,14 +60,6 @@
#define PB_SETNOISE 0xBAA
#define PB_FINISHED 0xFAB

struct s_CtxDma
{
DWORD ChannelID;
DWORD Inst; //Addr in PRAMIN area, unit=16 bytes blocks, baseaddr=VIDEO_BASE+NV_PRAMIN
DWORD Class;
DWORD isGr;
};

static unsigned int pb_ColorFmt = NV097_SET_SURFACE_FORMAT_COLOR_LE_A8R8G8B8;
static unsigned int pb_DepthFmt = NV097_SET_SURFACE_FORMAT_ZETA_Z24S8;

Expand Down Expand Up @@ -1344,7 +1327,7 @@ static void pb_prepare_tiles(void)



static void pb_create_dma_ctx( DWORD ChannelID,
void pb_create_dma_ctx( DWORD ChannelID,
DWORD Class,
DWORD Base,
DWORD Limit,
Expand Down Expand Up @@ -1393,7 +1376,7 @@ static void pb_create_dma_ctx( DWORD ChannelID,



static void pb_bind_channel(struct s_CtxDma *pCtxDmaObject)
void pb_bind_channel(struct s_CtxDma *pCtxDmaObject)
{
DWORD entry;
DWORD *p;
Expand Down Expand Up @@ -1628,7 +1611,7 @@ static void pb_3D_init(void)



static void pb_create_gr_ctx( int ChannelID,
void pb_create_gr_ctx( int ChannelID,
int Class,
struct s_CtxDma *pGrObject )
{
Expand Down Expand Up @@ -3109,6 +3092,7 @@ int pb_init(void)
pb_create_dma_ctx(8,DMA_CLASS_3D,(DWORD)pb_DmaBuffer8,0x20,&sDmaObject8);
pb_create_dma_ctx(6,DMA_CLASS_2,0,MAXRAM,&sDmaObject6);


//we initialized channel 0 first, that will match graphic context 0
pb_FifoChannelID=0;
pb_FifoChannelsMode=NV_PFIFO_MODE_ALL_PIO;
Expand Down Expand Up @@ -3253,14 +3237,14 @@ int pb_init(void)
//These commands assign DMA channels to push buffer subchannels
//and associate some specific GPU parts to specific Dma channels
p=pb_begin();
p=pb_push1_to(SUBCH_2,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,14);
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,16);
p=pb_push1_to(SUBCH_4,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,17);
p=pb_push1_to(SUBCH_3D,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,13);
p=pb_push1_to(SUBCH_2,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT0,7);
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT5,17);
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT_UNKNOWN,3);
p=pb_push2_to(SUBCH_4,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT1,3,11);
p=pb_push1_to(SUBCH_2,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,14); // Class 39
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,16); // Class 9F
p=pb_push1_to(SUBCH_4,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,17); // Class 62
p=pb_push1_to(SUBCH_3D,p,NV20_TCL_PRIMITIVE_SET_MAIN_OBJECT,13); // Class 97
p=pb_push1_to(SUBCH_2,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT0,7); // NV039_SET_CONTEXT_DMA_NOTIFIES
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT5,17); // NV09F_SET_CONTEXT_SURFACES
p=pb_push1_to(SUBCH_3,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT_UNKNOWN,3); // Set operation to SRCCOPY
p=pb_push2_to(SUBCH_4,p,NV20_TCL_PRIMITIVE_3D_SET_OBJECT1,3,11); // Source ch 3, Dest ch 11
pb_end(p); //calls pb_start() which will trigger the reading and sending to GPU (asynchronous, no waiting)

//setup needed for color computations
Expand Down Expand Up @@ -3728,3 +3712,16 @@ static NTAPI VOID pb_shutdown_notification_routine (PHAL_SHUTDOWN_REGISTRATION S
{
pb_kill();
}

uint8_t* pb_depth_stencil_buffer()
{
return (uint8_t*)pb_DepthStencilAddr;
}

DWORD pb_depth_stencil_pitch() {
return pb_DepthStencilPitch;
}

DWORD pb_depth_stencil_size() {
return pb_DSSize;
}
32 changes: 32 additions & 0 deletions lib/pbkit/pbkit.h
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,24 @@ extern "C"
#define SUBCH_3 3
#define SUBCH_4 4

//DMA and graphics classes
#define DMA_CLASS_2 0x02
#define DMA_CLASS_3 0x03
#define DMA_CLASS_3D 0x3D
#define GR_CLASS_19 0x19
#define GR_CLASS_30 0x30
#define GR_CLASS_39 0x39
#define GR_CLASS_62 0x62
#define GR_CLASS_97 0x97
#define GR_CLASS_9F 0x9F

struct s_CtxDma
{
DWORD ChannelID;
DWORD Inst; //Addr in PRAMIN area, unit=16 bytes blocks, baseaddr=VIDEO_BASE+NV_PRAMIN
DWORD Class;
DWORD isGr;
};

void pb_show_front_screen(void); //shows scene (allows VBL synced screen swapping)
void pb_show_debug_screen(void); //shows debug screen (default openxdk+SDL buffer)
Expand Down Expand Up @@ -116,6 +134,20 @@ void pb_set_viewport(int dwx,int dwy,int width,int height,float zmin,float zm
int pb_busy(void);


void pb_create_dma_ctx(DWORD ChannelID,
DWORD Class,
DWORD Base,
DWORD Limit,
struct s_CtxDma *pDmaObject );
void pb_create_gr_ctx( int ChannelID,
int Class,
struct s_CtxDma *pGrObject );
void pb_bind_channel(struct s_CtxDma *pCtxDmaObject);

uint8_t *pb_depth_stencil_buffer();
DWORD pb_depth_stencil_pitch();
DWORD pb_depth_stencil_size();
Copy link
Member

@JayFoxRox JayFoxRox Mar 4, 2023

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I always thought pbkit had this interface backwards. Currently pbkit is a mix of a low-level and high-level driver.

pbkit can submit pushbuffers, but it also constructs them, some using rather high level operations.
Instead, I believe that pbkit should allow submission of pushbuffers, but it should primarily be the users responsibility to construct them.
pbkit should only control the hardware so it can process commands from the pushbuffers.

More importantly, pbkit also manages buffers internally (sometimes like a singleton), but doesn't allow the user to manually create or control these buffers.
Instead, I believe that pbkit should provide the user with buffer creation / managing functions, but the user should always explicitly create these buffers and keep track of them.

This means I'd prefer to see something like pb_create_depth_stencil_buffer(size, pitch) and then the user should be responsible for creating these buffers.
So, in an ideal world, the application would never even have to query for the buffer address / pitch / size, because it created the buffer itself.

This (explicit buffer creation by application) is also required (or at least helpful) for more advanced applications which want to switch render-targets.


#ifdef __cplusplus
}
#endif
Expand Down