diff --git a/dlls/wined3d/device.c b/dlls/wined3d/device.c index 17fe5cd37ac..5304cdd1db7 100644 --- a/dlls/wined3d/device.c +++ b/dlls/wined3d/device.c @@ -1451,14 +1451,15 @@ HRESULT WINAPI IWineD3DDeviceImpl_CreateVertexDeclaration(IWineD3DDevice* iface, } /* http://msdn.microsoft.com/archive/default.asp?url=/archive/en-us/directx9_c/directx/graphics/programmingguide/programmable/vertexshaders/vscreate.asp */ -HRESULT WINAPI IWineD3DDeviceImpl_CreateVertexShader(IWineD3DDevice* iface, CONST DWORD* pFunction, IWineD3DVertexShader** ppVertexShader, IUnknown *parent) { +HRESULT WINAPI IWineD3DDeviceImpl_CreateVertexShader(IWineD3DDevice *iface, CONST DWORD *pFunction, IWineD3DVertexShader** ppVertexShader, IUnknown *parent) { IWineD3DDeviceImpl *This = (IWineD3DDeviceImpl *)iface; IWineD3DVertexShaderImpl *object; /* NOTE: impl usage is ok, this is a create */ D3DCREATEOBJECTINSTANCE(object, VertexShader) - object->function = pFunction; - FIXME("(%p) : STUB: Created Vertex shader %p\n", This, ppVertexShader); - return D3D_OK; + TRACE("(%p) : Created Vertex shader %p\n", This, ppVertexShader); + IWineD3DVertexShader_SetFunction(*ppVertexShader, pFunction); + + return D3D_OK; } HRESULT WINAPI IWineD3DDeviceImpl_CreatePixelShader(IWineD3DDevice* iface, CONST DWORD* pFunction, IWineD3DPixelShader** ppPixelShader, IUnknown *parent) { @@ -1473,7 +1474,6 @@ HRESULT WINAPI IWineD3DDeviceImpl_GetDirect3D(IWineD3DDevice* iface, IWineD3D** TRACE("(%p) : wineD3D returning %p\n", This, *ppD3D); IWineD3D_AddRef(*ppD3D); return D3D_OK; - } UINT WINAPI IWineD3DDeviceImpl_GetAvailableTextureMem(IWineD3DDevice *iface) { @@ -3417,41 +3417,30 @@ HRESULT WINAPI IWineD3DDeviceImpl_GetVertexDeclaration(IWineD3DDevice* iface, IW HRESULT WINAPI IWineD3DDeviceImpl_SetVertexShader(IWineD3DDevice *iface, IWineD3DVertexShader* pShader) { IWineD3DDeviceImpl *This = (IWineD3DDeviceImpl *)iface; - - static BOOL showFixmes = TRUE; + IWineD3DVertexShader *oldShader = This->updateStateBlock->vertexShader; This->updateStateBlock->vertexShader = pShader; This->updateStateBlock->changed.vertexShader = TRUE; This->updateStateBlock->set.vertexShader = TRUE; - if(pShader == NULL) { - /* clear down the shader */ - TRACE("Clear down the shader\n"); - }else{ - if(showFixmes) { - FIXME("(%p) : stub pShader(%p)\n", This, pShader); - showFixmes = FALSE; - } - } - - return D3D_OK; - - /** FIXME: refernece counting? **/ - if (pShader == NULL) { /* only valid with non FVF shaders */ - TRACE_(d3d_shader)("(%p) : FVF Shader, pShader=%p\n", This, pShader); - This->updateStateBlock->vertexShader = NULL; - } else { - TRACE_(d3d_shader)("(%p) : Created shader, pShader=%p\n", This, pShader); - This->updateStateBlock->vertexShader = pShader; - } - - This->updateStateBlock->changed.vertexShader = TRUE; - This->updateStateBlock->set.vertexShader = TRUE; - - /* Handle recording of state blocks */ if (This->isRecordingState) { - TRACE("Recording... not performing anything\n"); - return D3D_OK; + TRACE("Recording... not performing anything\n"); + return D3D_OK; + } + + if (pShader != NULL) { + IUnknown *newVertexShaderParent; + /* GetParent will add a ref, so leave it hanging until the vertex buffer is cleared */ + TRACE("(%p) : setting pShader(%p)\n", This, pShader); + IWineD3DVertexShader_GetParent(pShader, &newVertexShaderParent); + } else { + TRACE("Clear down the shader\n"); + } + if (oldShader != NULL) { + IUnknown *oldVertexShaderParent; + IWineD3DVertexShader_GetParent(oldShader, &oldVertexShaderParent); + IUnknown_Release(oldVertexShaderParent); + IUnknown_Release(oldVertexShaderParent); } /** * TODO: merge HAL shaders context switching from prototype @@ -3461,7 +3450,7 @@ HRESULT WINAPI IWineD3DDeviceImpl_SetVertexShader(IWineD3DDevice *iface, IWineD3 HRESULT WINAPI IWineD3DDeviceImpl_GetVertexShader(IWineD3DDevice *iface, IWineD3DVertexShader** ppShader) { IWineD3DDeviceImpl *This = (IWineD3DDeviceImpl *)iface; - *ppShader = This->stateBlock->vertexShader; + *ppShader = This->updateStateBlock->vertexShader; if(*ppShader != NULL) IWineD3DVertexShader_AddRef(*ppShader); TRACE("(%p) : returning %p\n", This, *ppShader); diff --git a/dlls/wined3d/vertexshader.c b/dlls/wined3d/vertexshader.c index 86d1cdcb524..13556e286bb 100644 --- a/dlls/wined3d/vertexshader.c +++ b/dlls/wined3d/vertexshader.c @@ -23,11 +23,14 @@ #include "config.h" #include +#include #include "wined3d_private.h" WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader); +#define GLINFO_LOCATION ((IWineD3DImpl *)(((IWineD3DDeviceImpl *)This->wineD3DDevice)->wineD3D))->gl_info + /* Shader debugging - Change the following line to enable debugging of software vertex shaders */ #if 0 /* Musxt not be 1 in cvs version */ @@ -72,17 +75,23 @@ WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader); * http://developer.nvidia.com/view.asp?IO=var_memory_management */ +/* TODO: Vertex and Pixel shaders are almost identicle, the only exception being the way that some of the data is looked up or the availablity of some of the data i.e. some instructions are only valid for pshaders and some for vshaders +because of this the bulk of the software pipeline can be shared between pixel and vertex shaders... and it wouldn't supprise me if the programes can be cross compiled using a large body body shared code */ + typedef void (*shader_fct_t)(); typedef struct SHADER_OPCODE { - CONST BYTE opcode; + unsigned int opcode; const char* name; + const char* glname; CONST UINT num_params; shader_fct_t soft_fct; DWORD min_version; DWORD max_version; } SHADER_OPCODE; +#define GLNAME_REQUIRE_GLSL ((const char *)1) + /******************************* * vshader functions software VM */ @@ -196,7 +205,8 @@ void vshader_mul(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERV } void vshader_nop(void) { - /* NOPPPP ahhh too easy ;) */ + /* NOPPPP ahhh too easy ;) */ + VSTRACE(("executing nop\n")); } void vshader_rcp(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { @@ -343,53 +353,367 @@ void vshader_lrp(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERV d->w = s0->w * (s1->w - s2->w) + s2->x; } +void vshader_crs(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1) { + d->x = s0->y * s1->z - s0->z * s1->y; + d->y = s0->z * s1->x - s0->x * s1->z; + d->z = s0->x * s1->y - s0->y * s1->x; + d->w = 0.9f; /* w is undefined, so set it to something safeish */ + + VSTRACE(("executing crs: s0=(%f, %f, %f, %f) s1=(%f, %f, %f, %f) => d=(%f, %f, %f, %f)\n", + s0->x, s0->y, s0->z, s0->w, s1->x, s1->y, s1->z, s1->w, d->x, d->y, d->z, d->w)); +} + +void vshader_abs(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + + d->x = fabsf(s0->x); + d->y = fabsf(s0->y); + d->z = fabsf(s0->z); + d->w = fabsf(s0->w); + VSTRACE(("executing abs: s0=(%f, %f, %f, %f) => d=(%f, %f, %f, %f)\n", + s0->x, s0->y, s0->z, s0->w, d->x, d->y, d->z, d->w)); +} + + /* Stubs */ +void vshader_texcoord(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_texkill(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_tex(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} +void vshader_texld(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texbem(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texbeml(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texreg2ar(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texreg2gb(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x2pad(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x2tex(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3pad(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3tex(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3diff(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3spec(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3vspec(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_cnd(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1, WINED3DSHADERVECTOR* s2) { + FIXME(" : Stub\n"); +} + +/* Def is C[n] = {n.nf, n.nf, n.nf, n.nf} */ +void vshader_def(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1, WINED3DSHADERVECTOR* s2, WINED3DSHADERVECTOR* s3) { + FIXME(" : Stub\n"); +} + +void vshader_texreg2rgb(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texdp3tex(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x2depth(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texdp3(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texm3x3(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_texdepth(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_cmp(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1, WINED3DSHADERVECTOR* s2) { + FIXME(" : Stub\n"); +} + +void vshader_bem(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1) { + FIXME(" : Stub\n"); +} + +void vshader_call(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_callnz(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_loop(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_ret(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_endloop(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_dcl(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_pow(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0, WINED3DSHADERVECTOR* s1) { + FIXME(" : Stub\n"); +} + +void vshader_sng(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_nrm(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_sincos(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_rep(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_endrep(void) { + FIXME(" : Stub\n"); +} + +void vshader_if(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_ifc(WINED3DSHADERVECTOR* d, WINED3DSHADERVECTOR* s0) { + FIXME(" : Stub\n"); +} + +void vshader_else(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_label(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_endif(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_break(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_breakc(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_mova(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_defb(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_defi(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_dp2add(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_dsx(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_dsy(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_texldd(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_setp(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_texldl(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + +void vshader_breakp(WINED3DSHADERVECTOR* d) { + FIXME(" : Stub\n"); +} + + /** * log, exp, frc, m*x* seems to be macros ins ... to see */ static CONST SHADER_OPCODE vshader_ins [] = { - {D3DSIO_NOP, "nop", 0, vshader_nop, 0, 0}, - {D3DSIO_MOV, "mov", 2, vshader_mov, 0, 0}, - {D3DSIO_ADD, "add", 3, vshader_add, 0, 0}, - {D3DSIO_SUB, "sub", 3, vshader_sub, 0, 0}, - {D3DSIO_MAD, "mad", 4, vshader_mad, 0, 0}, - {D3DSIO_MUL, "mul", 3, vshader_mul, 0, 0}, - {D3DSIO_RCP, "rcp", 2, vshader_rcp, 0, 0}, - {D3DSIO_RSQ, "rsq", 2, vshader_rsq, 0, 0}, - {D3DSIO_DP3, "dp3", 3, vshader_dp3, 0, 0}, - {D3DSIO_DP4, "dp4", 3, vshader_dp4, 0, 0}, - {D3DSIO_MIN, "min", 3, vshader_min, 0, 0}, - {D3DSIO_MAX, "max", 3, vshader_max, 0, 0}, - {D3DSIO_SLT, "slt", 3, vshader_slt, 0, 0}, - {D3DSIO_SGE, "sge", 3, vshader_sge, 0, 0}, - {D3DSIO_EXP, "exp", 2, vshader_exp, 0, 0}, - {D3DSIO_LOG, "log", 2, vshader_log, 0, 0}, - {D3DSIO_LIT, "lit", 2, vshader_lit, 0, 0}, - {D3DSIO_DST, "dst", 3, vshader_dst, 0, 0}, - {D3DSIO_LRP, "lrp", 5, vshader_lrp, 0, 0}, - {D3DSIO_FRC, "frc", 2, vshader_frc, 0, 0}, - {D3DSIO_M4x4, "m4x4", 3, vshader_m4x4, 0, 0}, - {D3DSIO_M4x3, "m4x3", 3, vshader_m4x3, 0, 0}, - {D3DSIO_M3x4, "m3x4", 3, vshader_m3x4, 0, 0}, - {D3DSIO_M3x3, "m3x3", 3, vshader_m3x3, 0, 0}, - {D3DSIO_M3x2, "m3x2", 3, vshader_m3x2, 0, 0}, - /** FIXME: use direct access so add the others opcodes as stubs */ - {D3DSIO_EXPP, "expp", 2, vshader_expp, 0, 0}, - {D3DSIO_LOGP, "logp", 2, vshader_logp, 0, 0}, + {D3DSIO_NOP, "nop", "NOP", 0, vshader_nop, 0, 0}, + {D3DSIO_MOV, "mov", "MOV", 2, vshader_mov, 0, 0}, + {D3DSIO_ADD, "add", "ADD", 3, vshader_add, 0, 0}, + {D3DSIO_SUB, "sub", "SUB", 3, vshader_sub, 0, 0}, + {D3DSIO_MAD, "mad", "MAD", 4, vshader_mad, 0, 0}, + {D3DSIO_MUL, "mul", "MUL", 3, vshader_mul, 0, 0}, + {D3DSIO_RCP, "rcp", "RCP", 2, vshader_rcp, 0, 0}, + {D3DSIO_RSQ, "rsq", "RSQ", 2, vshader_rsq, 0, 0}, + {D3DSIO_DP3, "dp3", "DP3", 3, vshader_dp3, 0, 0}, + {D3DSIO_DP4, "dp4", "DP4", 3, vshader_dp4, 0, 0}, + {D3DSIO_MIN, "min", "MIN", 3, vshader_min, 0, 0}, + {D3DSIO_MAX, "max", "MAX", 3, vshader_max, 0, 0}, + {D3DSIO_SLT, "slt", "SLT", 3, vshader_slt, 0, 0}, + {D3DSIO_SGE, "sge", "SGE", 3, vshader_sge, 0, 0}, + {D3DSIO_ABS, "abs", "ABS", 2, vshader_abs, 0, 0}, + {D3DSIO_EXP, "exp", "EX2", 2, vshader_exp, 0, 0}, + {D3DSIO_LOG, "log", "LG2", 2, vshader_log, 0, 0}, + {D3DSIO_LIT, "lit", "LIT", 2, vshader_lit, 0, 0}, + {D3DSIO_DST, "dst", "DST", 3, vshader_dst, 0, 0}, + {D3DSIO_LRP, "lrp", "LRP", 5, vshader_lrp, 0, 0}, + {D3DSIO_FRC, "frc", "FRC", 2, vshader_frc, 0, 0}, + {D3DSIO_M4x4, "m4x4", "undefined", 3, vshader_m4x4, 0, 0}, + {D3DSIO_M4x3, "m4x3", "undefined", 3, vshader_m4x3, 0, 0}, + {D3DSIO_M3x4, "m3x4", "undefined", 3, vshader_m3x4, 0, 0}, + {D3DSIO_M3x3, "m3x3", "undefined", 3, vshader_m3x3, 0, 0}, + {D3DSIO_M3x2, "m3x2", "undefined", 3, vshader_m3x2, 0, 0}, + /** FIXME: use direct access so add the others opcodes as stubs */ + /* NOTE: gl function is currently NULL for calls and loops because they are not yet supported + They can be easly managed in software by introducing a call/loop stack and should be possible to implement in glsl ol NV_shader's */ + {D3DSIO_CALL, "call", GLNAME_REQUIRE_GLSL, 1, vshader_call, 0, 0}, + {D3DSIO_CALLNZ, "callnz", GLNAME_REQUIRE_GLSL, 2, vshader_callnz, 0, 0}, + {D3DSIO_LOOP, "loop", GLNAME_REQUIRE_GLSL, 2, vshader_loop, 0, 0}, + {D3DSIO_RET, "ret", GLNAME_REQUIRE_GLSL, 0, vshader_ret, 0, 0}, + {D3DSIO_ENDLOOP, "endloop", GLNAME_REQUIRE_GLSL, 0, vshader_endloop, 0, 0}, + {D3DSIO_LABEL, "label", GLNAME_REQUIRE_GLSL, 1, vshader_label, 0, 0}, + /* DCL is a specil operation */ + {D3DSIO_DCL, "dcl", NULL, 1, vshader_dcl, 0, 0}, + {D3DSIO_POW, "pow", "POW", 3, vshader_pow, 0, 0}, + {D3DSIO_CRS, "crs", "XPS", 3, vshader_crs, 0, 0}, + /* TODO: sng can possibly be performed as + RCP tmp, vec + MUL out, tmp, vec*/ + {D3DSIO_SGN, "sng", NULL, 2, vshader_sng, 0, 0}, + /* TODO: xyz normalise can be performed is VS_ARB using one tempory register, + DP3 tmp , vec, vec; + RSQ tmp, tmp.x; + MUL vec.xyz, vec, tmp; + but I think this is better because it accounts for w properly. + DP3 tmp , vec, vec; + RSQ tmp, tmp.x; + MUL vec, vec, tmp; + + */ + {D3DSIO_NRM, "nrm", NULL, 2, vshader_nrm, 0, 0}, + {D3DSIO_SINCOS, "sincos", NULL, 2, vshader_sincos, 0, 0}, + {D3DSIO_REP , "rep", GLNAME_REQUIRE_GLSL, 2, vshader_rep, 0, 0}, + {D3DSIO_ENDREP, "endrep", GLNAME_REQUIRE_GLSL, 0, vshader_endrep, 0, 0}, + {D3DSIO_IF, "if", GLNAME_REQUIRE_GLSL, 2, vshader_if, 0, 0}, + {D3DSIO_IFC, "ifc", GLNAME_REQUIRE_GLSL, 2, vshader_ifc, 0, 0}, + {D3DSIO_ELSE, "else", GLNAME_REQUIRE_GLSL, 2, vshader_else, 0, 0}, + {D3DSIO_ENDIF, "endif", GLNAME_REQUIRE_GLSL, 2, vshader_endif, 0, 0}, + {D3DSIO_BREAK, "break", GLNAME_REQUIRE_GLSL, 2, vshader_break, 0, 0}, + {D3DSIO_BREAKC, "breakc", GLNAME_REQUIRE_GLSL, 2, vshader_breakc, 0, 0}, + {D3DSIO_MOVA, "mova", GLNAME_REQUIRE_GLSL, 2, vshader_mova, 0, 0}, + {D3DSIO_DEFB, "defb", GLNAME_REQUIRE_GLSL, 2, vshader_defb, 0, 0}, + {D3DSIO_DEFI, "defi", GLNAME_REQUIRE_GLSL, 2, vshader_defi, 0, 0}, - {0, NULL, 0, NULL, 0, 0} + {D3DSIO_TEXCOORD, "texcoord", GLNAME_REQUIRE_GLSL, 1, vshader_texcoord, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXCOORD, "texcrd", GLNAME_REQUIRE_GLSL, 2, vshader_texcoord, D3DPS_VERSION(1,4), D3DPS_VERSION(1,4)}, + {D3DSIO_TEXKILL, "texkill", GLNAME_REQUIRE_GLSL, 1, vshader_texkill, D3DPS_VERSION(1,0), D3DPS_VERSION(1,4)}, + {D3DSIO_TEX, "tex", GLNAME_REQUIRE_GLSL, 1, vshader_tex, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEX, "texld", GLNAME_REQUIRE_GLSL, 2, vshader_texld, D3DPS_VERSION(1,4), D3DPS_VERSION(1,4)}, + {D3DSIO_TEXBEM, "texbem", GLNAME_REQUIRE_GLSL, 2, vshader_texbem, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXBEML, "texbeml", GLNAME_REQUIRE_GLSL, 2, vshader_texbeml, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXREG2AR,"texreg2ar",GLNAME_REQUIRE_GLSL, 2, vshader_texreg2ar, D3DPS_VERSION(1,1), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXREG2GB,"texreg2gb",GLNAME_REQUIRE_GLSL, 2, vshader_texreg2gb, D3DPS_VERSION(1,2), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x2PAD, "texm3x2pad", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x2pad, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x2TEX, "texm3x2tex", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x2tex, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x3DIFF, "texm3x3diff", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x3diff, D3DPS_VERSION(0,0), D3DPS_VERSION(0,0)}, + {D3DSIO_TEXM3x3SPEC, "texm3x3spec", GLNAME_REQUIRE_GLSL, 3, vshader_texm3x3spec, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x3VSPEC, "texm3x3vspe", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x3vspec, D3DPS_VERSION(1,0), D3DPS_VERSION(1,3)}, + + {D3DSIO_EXPP, "expp", "EXP", 2, vshader_expp, 0, 0}, + {D3DSIO_LOGP, "logp", "LOG", 2, vshader_logp, 0, 0}, + {D3DSIO_CND, "cnd", GLNAME_REQUIRE_GLSL, 4, vshader_cnd, D3DPS_VERSION(1,1), D3DPS_VERSION(1,4)}, + /* def is a special opperation */ + {D3DSIO_DEF, "def", NULL, 5, vshader_def, D3DPS_VERSION(1,0), D3DPS_VERSION(3,0)}, + {D3DSIO_TEXREG2RGB, "texreg2rgb", GLNAME_REQUIRE_GLSL, 2, vshader_texreg2rgb, D3DPS_VERSION(1,2), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXDP3TEX, "texdp3tex", GLNAME_REQUIRE_GLSL, 2, vshader_texdp3tex, D3DPS_VERSION(1,2), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x2DEPTH, "texm3x2depth", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x2depth,D3DPS_VERSION(1,3), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXDP3, "texdp3", GLNAME_REQUIRE_GLSL, 2, vshader_texdp3, D3DPS_VERSION(1,2), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXM3x3, "texm3x3", GLNAME_REQUIRE_GLSL, 2, vshader_texm3x3, D3DPS_VERSION(1,2), D3DPS_VERSION(1,3)}, + {D3DSIO_TEXDEPTH, "texdepth", GLNAME_REQUIRE_GLSL,1, vshader_texdepth, D3DPS_VERSION(1,4), D3DPS_VERSION(1,4)}, + {D3DSIO_CMP, "cmp", GLNAME_REQUIRE_GLSL, 4, vshader_cmp, D3DPS_VERSION(1,1), D3DPS_VERSION(3,0)}, + {D3DSIO_BEM, "bem", GLNAME_REQUIRE_GLSL, 3, vshader_bem, D3DPS_VERSION(1,4), D3DPS_VERSION(1,4)}, + /* TODO: dp2add can be made out of multiple instuctions */ + {D3DSIO_DP2ADD, "dp2add", GLNAME_REQUIRE_GLSL, 2, vshader_dp2add, 0, 0}, + {D3DSIO_DSX, "dsx", GLNAME_REQUIRE_GLSL, 2, vshader_dsx, 0, 0}, + {D3DSIO_DSY, "dsy", GLNAME_REQUIRE_GLSL, 2, vshader_dsy, 0, 0}, + {D3DSIO_TEXLDD, "texldd", GLNAME_REQUIRE_GLSL, 2, vshader_texldd, 0, 0}, + {D3DSIO_SETP, "setp", GLNAME_REQUIRE_GLSL, 2, vshader_setp, 0, 0}, + {D3DSIO_TEXLDL, "texdl", GLNAME_REQUIRE_GLSL, 2, vshader_texldl, 0, 0}, + {D3DSIO_BREAKP, "breakp", GLNAME_REQUIRE_GLSL, 2, vshader_breakp, 0, 0}, + {D3DSIO_PHASE, "phase", GLNAME_REQUIRE_GLSL, 0, vshader_nop, 0, 0}, + {0, NULL, NULL, 0, NULL, 0, 0} }; inline static const SHADER_OPCODE* vshader_program_get_opcode(const DWORD code) { - DWORD i = 0; - /** TODO: use dichotomic search */ - while (NULL != vshader_ins[i].name) { - if ((code & D3DSI_OPCODE_MASK) == vshader_ins[i].opcode) { - return &vshader_ins[i]; + DWORD i = 0; + /** TODO: use dichotomic search or hash table */ + while (NULL != vshader_ins[i].name) { + if ((code & D3DSI_OPCODE_MASK) == vshader_ins[i].opcode) { + return &vshader_ins[i]; + } + ++i; } - ++i; - } - return NULL; + FIXME("Unsupported opcode %lx\n",code); + return NULL; } inline static void vshader_program_dump_param(const DWORD param, int input) { @@ -401,12 +725,12 @@ inline static void vshader_program_dump_param(const DWORD param, int input) { if ((param & D3DSP_SRCMOD_MASK) == D3DSPSM_NEG) TRACE("-"); - switch (regtype << D3DSP_REGTYPE_SHIFT) { + switch (regtype) { case D3DSPR_TEMP: TRACE("R[%lu]", reg); break; case D3DSPR_INPUT: - TRACE("V[%lu]", reg); + TRACE("v%lu", reg); break; case D3DSPR_CONST: TRACE("C[%s%lu]", (param & D3DVS_ADDRMODE_RELATIVE) ? "a0.x + " : "", reg); @@ -424,6 +748,7 @@ inline static void vshader_program_dump_param(const DWORD param, int input) { TRACE("oT[%lu]", reg); break; default: + FIXME("Unknown %lu %u reg %lu\n",regtype, D3DSPR_ATTROUT, reg); break; } @@ -462,6 +787,98 @@ inline static void vshader_program_dump_param(const DWORD param, int input) { } } +inline static void vshader_program_dump_vs_param(const DWORD param, int input) { + static const char* rastout_reg_names[] = { "oPos", "oFog", "oPts" }; + static const char swizzle_reg_chars[] = "xyzw"; + /* the unknown mask is for bits not yet accounted for by any other mask... */ +#define UNKNOWN_MASK 0xC000 + + /* for registeres about 7 we have to add on bits 11 and 12 to get the correct register */ +#define EXTENDED_REG 0x1800 + + DWORD reg = param & D3DSP_REGNUM_MASK; /* 0x00001FFF; isn't this D3DSP_REGNUM_MASK? */ + DWORD regtype = ((param & D3DSP_REGTYPE_MASK) >> D3DSP_REGTYPE_SHIFT) | ((param & EXTENDED_REG) >> 8); + + if(param & UNKNOWN_MASK) { /* if this register has any of the unknown bits set then report them*/ + FIXME("Unknown bits set regtype %lx , %lx, UK(%lx)\n", regtype, (param & EXTENDED_REG), param & UNKNOWN_MASK); + } + + if ((param & D3DSP_SRCMOD_MASK) == D3DSPSM_NEG) TRACE("-"); + + switch (regtype /*<< D3DSP_REGTYPE_SHIFT*/) { + case D3DSPR_TEMP: + TRACE("r%lu", reg); + break; + case D3DSPR_INPUT: + TRACE("v%lu", reg); + break; + case D3DSPR_CONST: + TRACE("c%s%lu", (param & D3DVS_ADDRMODE_RELATIVE) ? "a0.x + " : "", reg); + break; + case D3DSPR_ADDR: /*case D3DSPR_TEXTURE:*/ + TRACE("a%lu", reg); + break; + case D3DSPR_RASTOUT: + TRACE("%s", rastout_reg_names[reg]); + break; + case D3DSPR_ATTROUT: + TRACE("oD%lu", reg); + break; + case D3DSPR_TEXCRDOUT: + TRACE("oT%lu", reg); + break; + case D3DSPR_CONSTINT: + TRACE("i%s%lu", (param & D3DVS_ADDRMODE_RELATIVE) ? "a0.x + " : "", reg); + break; + case D3DSPR_CONSTBOOL: + TRACE("b%s%lu", (param & D3DVS_ADDRMODE_RELATIVE) ? "a0.x + " : "", reg); + break; + case D3DSPR_LABEL: + TRACE("l%lu", reg); + break; + case D3DSPR_LOOP: + TRACE("aL%s%lu", (param & D3DVS_ADDRMODE_RELATIVE) ? "a0.x + " : "", reg); + break; + default: + FIXME("Unknown %lu reg %lu\n",regtype, reg); + break; + } + + if (!input) { + /** operand output */ + if ((param & D3DSP_WRITEMASK_ALL) != D3DSP_WRITEMASK_ALL) { + if (param & D3DSP_WRITEMASK_0) TRACE(".x"); + if (param & D3DSP_WRITEMASK_1) TRACE(".y"); + if (param & D3DSP_WRITEMASK_2) TRACE(".z"); + if (param & D3DSP_WRITEMASK_3) TRACE(".w"); + } + } else { + /** operand input */ + DWORD swizzle = (param & D3DVS_SWIZZLE_MASK) >> D3DVS_SWIZZLE_SHIFT; + DWORD swizzle_x = swizzle & 0x03; + DWORD swizzle_y = (swizzle >> 2) & 0x03; + DWORD swizzle_z = (swizzle >> 4) & 0x03; + DWORD swizzle_w = (swizzle >> 6) & 0x03; + /** + * swizzle bits fields: + * WWZZYYXX + */ + if ((D3DVS_NOSWIZZLE >> D3DVS_SWIZZLE_SHIFT) != swizzle) { /* ! D3DVS_NOSWIZZLE == 0xE4 << D3DVS_SWIZZLE_SHIFT */ + if (swizzle_x == swizzle_y && + swizzle_x == swizzle_z && + swizzle_x == swizzle_w) { + TRACE(".%c", swizzle_reg_chars[swizzle_x]); + } else { + TRACE(".%c%c%c%c", + swizzle_reg_chars[swizzle_x], + swizzle_reg_chars[swizzle_y], + swizzle_reg_chars[swizzle_z], + swizzle_reg_chars[swizzle_w]); + } + } + } +} + inline static BOOL vshader_is_version_token(DWORD token) { return 0xFFFE0000 == (token & 0xFFFE0000); } @@ -470,71 +887,755 @@ inline static BOOL vshader_is_comment_token(DWORD token) { return D3DSIO_COMMENT == (token & D3DSI_OPCODE_MASK); } +inline static void vshader_program_add_param(const DWORD param, int input, char *hwLine, BOOL namedArrays, CHAR constantsUsedBitmap[]) { + /*static const char* rastout_reg_names[] = { "oPos", "oFog", "oPts" }; */ + static const char* hwrastout_reg_names[] = { "result.position", "result.fogcoord", "result.pointsize" }; + static const char swizzle_reg_chars[] = "xyzw"; + + DWORD reg = param & 0x00001FFF; + DWORD regtype = ((param & D3DSP_REGTYPE_MASK) >> D3DSP_REGTYPE_SHIFT); + char tmpReg[255]; + + if ((param & D3DSP_SRCMOD_MASK) == D3DSPSM_NEG) { + strcat(hwLine, " -"); + } else { + strcat(hwLine, " "); + } + + switch (regtype) { + case D3DSPR_TEMP: + sprintf(tmpReg, "T%lu", reg); + strcat(hwLine, tmpReg); + break; + case D3DSPR_INPUT: + /* if the attributes come in as named dcl's then use a named vertex (called namedVertexN) */ + if (namedArrays) { + sprintf(tmpReg, "namedVertex%lu", reg); + } else { + /* otherwise the input is on a numbered attribute so use opengl numbered attributes */ + sprintf(tmpReg, "vertex.attrib[%lu]", reg); + } + strcat(hwLine, tmpReg); + break; + case D3DSPR_CONST: + /* FIXME: some constants are named so we need a constants map*/ + if (constantsUsedBitmap[reg] == VS_CONSTANT_CONSTANT) { + if (param & D3DVS_ADDRMODE_RELATIVE) { + FIXME("Relitive addressing not expected for a named constant %lu\n", reg); + } + sprintf(tmpReg, "const%lu", reg); + } else { + sprintf(tmpReg, "C[%s%lu]", (param & D3DVS_ADDRMODE_RELATIVE) ? "A0.x + " : "", reg); + } + strcat(hwLine, tmpReg); + break; + case D3DSPR_ADDR: /*case D3DSPR_TEXTURE:*/ + sprintf(tmpReg, "A%lu", reg); + strcat(hwLine, tmpReg); + break; + case D3DSPR_RASTOUT: + sprintf(tmpReg, "%s", hwrastout_reg_names[reg]); + strcat(hwLine, tmpReg); + break; + case D3DSPR_ATTROUT: + if (reg==0) { + strcat(hwLine, "result.color.primary"); + } else { + strcat(hwLine, "result.color.secondary"); + } + break; + case D3DSPR_TEXCRDOUT: + sprintf(tmpReg, "result.texcoord[%lu]", reg); + strcat(hwLine, tmpReg); + break; + default: + FIXME("Unknown reg type %ld %ld\n", regtype, reg); + break; + } + + if (!input) { + /** operand output */ + if ((param & D3DSP_WRITEMASK_ALL) != D3DSP_WRITEMASK_ALL) { + strcat(hwLine, "."); + if (param & D3DSP_WRITEMASK_0) { + strcat(hwLine, "x"); + } + if (param & D3DSP_WRITEMASK_1) { + strcat(hwLine, "y"); + } + if (param & D3DSP_WRITEMASK_2) { + strcat(hwLine, "z"); + } + if (param & D3DSP_WRITEMASK_3) { + strcat(hwLine, "w"); + } + } + } else { + /** operand input */ + DWORD swizzle = (param & D3DVS_SWIZZLE_MASK) >> D3DVS_SWIZZLE_SHIFT; + DWORD swizzle_x = swizzle & 0x03; + DWORD swizzle_y = (swizzle >> 2) & 0x03; + DWORD swizzle_z = (swizzle >> 4) & 0x03; + DWORD swizzle_w = (swizzle >> 6) & 0x03; + /** + * swizzle bits fields: + * WWZZYYXX + */ + if ((D3DVS_NOSWIZZLE >> D3DVS_SWIZZLE_SHIFT) != swizzle) { /* ! D3DVS_NOSWIZZLE == 0xE4 << D3DVS_SWIZZLE_SHIFT */ + if (swizzle_x == swizzle_y && + swizzle_x == swizzle_z && + swizzle_x == swizzle_w) + { + sprintf(tmpReg, ".%c", swizzle_reg_chars[swizzle_x]); + strcat(hwLine, tmpReg); + } else { + sprintf(tmpReg, ".%c%c%c%c", + swizzle_reg_chars[swizzle_x], + swizzle_reg_chars[swizzle_y], + swizzle_reg_chars[swizzle_z], + swizzle_reg_chars[swizzle_w]); + strcat(hwLine, tmpReg); + } + } + } +} + +DWORD MacroExpansion[4*4]; + +int ExpandMxMacro(DWORD macro_opcode, const DWORD* args) { + int i; + int nComponents = 0; + DWORD opcode =0; + switch(macro_opcode) { + case D3DSIO_M4x4: + nComponents = 4; + opcode = D3DSIO_DP4; + break; + case D3DSIO_M4x3: + nComponents = 3; + opcode = D3DSIO_DP4; + break; + case D3DSIO_M3x4: + nComponents = 4; + opcode = D3DSIO_DP3; + break; + case D3DSIO_M3x3: + nComponents = 3; + opcode = D3DSIO_DP3; + break; + case D3DSIO_M3x2: + nComponents = 2; + opcode = D3DSIO_DP3; + break; + default: + break; + } + for (i = 0; i < nComponents; i++) { + MacroExpansion[i*4+0] = opcode; + MacroExpansion[i*4+1] = ((*args) & ~D3DSP_WRITEMASK_ALL)|(D3DSP_WRITEMASK_0<device->fixupVertexBufferSize < PGMSIZE) { + HeapFree(GetProcessHeap(), 0, This->fixupVertexBuffer); + This->fixupVertexBuffer = HeapAlloc(GetProcessHeap() , 0, PGMSIZE); + This->fixupVertexBufferSize = PGMSIZE; + This->fixupVertexBuffer[0] = 0; + } + pgmStr = This->device->fixupVertexBuffer; +#endif +#define PNSTRCAT(_pgmStr, _tmpLine) { \ + int _tmpLineLen = strlen(_tmpLine); \ + if(_tmpLineLen + pgmLength > PGMSIZE) { \ + ERR("The buffer allocated for the vertex program string pgmStr is too small at %d bytes, at least %d bytes in total are required.\n", PGMSIZE, _tmpLineLen + pgmLength); \ + } else { \ + memcpy(_pgmStr + pgmLength, _tmpLine, _tmpLineLen); \ + } \ + pgmLength += _tmpLineLen; \ + } + + pgmStr = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, 65535); /* 64kb should be enough */ + /* Initilise the shader */ + This->namedArrays = FALSE; + This->declaredArrays = FALSE; + for (i = 0; i < WINED3DSHADERDECLUSAGE_MAX_USAGE; i++) { + This->arrayUsageMap[i] = -1; + } + /* set all the tmpsUsed to not used */ + memset(tmpsUsed, FALSE , sizeof(tmpsUsed)); + + /* TODO: renumbering of attributes if the values are higher than the highest supported attribute but the total number of attributes is less than the highest supported attribute */ + This->highestConstant = -1; + + + /** + * First pass to determine what we need to declare: + * - Temporary variables + * - Address variables + */ if (NULL != pToken) { while (D3DVS_END() != *pToken) { - if (vshader_is_version_token(*pToken)) { /** version */ - TRACE("vs.%lu.%lu\n", (*pToken >> 8) & 0x0F, (*pToken & 0x0F)); + if (vshader_is_version_token(*pToken)) { + /** skip version */ + ++pToken; + continue; + } + if (vshader_is_comment_token(*pToken)) { /** comment */ + DWORD comment_len = (*pToken & D3DSI_COMMENTSIZE_MASK) >> D3DSI_COMMENTSIZE_SHIFT; ++pToken; - ++len; + pToken += comment_len; continue; + } + curOpcode = vshader_program_get_opcode(*pToken); + ++pToken; + /* TODO: dcl's */ + /* TODO: Consts */ + + if (NULL == curOpcode) { + while (*pToken & 0x80000000) { + TRACE("unrecognized opcode: %08lx\n", *pToken); + /* skip unrecognized opcode */ + ++pToken; + } + } else { + if (curOpcode->opcode == D3DSIO_DCL){ + INT usage = *pToken++; + INT arrayNo = (*pToken++ & 0x00001FFF); + switch(usage & 0xFFFF) { + case D3DDECLUSAGE_POSITION: + if((usage & 0xF0000) >> 16 == 0) { /* tween data */ + TRACE("Setting position to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_POSITION] = arrayNo; + This->namedArrays = TRUE; + } else { + /* TODO: position indexes go fro 0-8!!*/ + TRACE("Setting position 2 to %d because usage = %d\n", arrayNo, (usage & 0xF0000) >> 16); + /* robots uses positions upto 8, the position arrays are just packed.*/ + if ((usage & 0xF0000) >> 16 > 1) { + TRACE("Loaded for position %d (greater than 2)\n", (usage & 0xF0000) >> 16); + } + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_POSITION2 + ((usage & 0xF0000) >> 16) -1] = arrayNo; + This->declaredArrays = TRUE; + } + break; + case D3DDECLUSAGE_BLENDINDICES: + /* not supported by openGL */ + TRACE("Setting BLENDINDICES to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_BLENDINDICES] = arrayNo; + This->declaredArrays = TRUE; + if ((usage & 0xF0000) >> 16 != 0) FIXME("Extended BLENDINDICES\n"); + break; + case D3DDECLUSAGE_BLENDWEIGHT: + TRACE("Setting BLENDWEIGHT to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_BLENDWEIGHT] = arrayNo; + This->namedArrays = TRUE; + if ((usage & 0xF0000) >> 16 != 0) FIXME("Extended blend weights\n"); + break; + case D3DDECLUSAGE_NORMAL: + if((usage & 0xF0000) >> 16 == 0) { /* tween data */ + TRACE("Setting normal to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_NORMAL] = arrayNo; + This->namedArrays = TRUE; + } else { + TRACE("Setting normal 2 to %d because usage = %d\n", arrayNo, (usage & 0xF0000) >> 16); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_NORMAL2] = arrayNo; + This->declaredArrays = TRUE; + } + break; + case D3DDECLUSAGE_PSIZE: + TRACE("Setting PSIZE to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_PSIZE] = arrayNo; + This->namedArrays = TRUE; + if ((usage & 0xF0000) >> 16 != 0) FIXME("Extended PSIZE\n"); + break; + case D3DDECLUSAGE_COLOR: + if((usage & 0xF0000) >> 16 == 0) { + TRACE("Setting DIFFUSE to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_DIFFUSE] = arrayNo; + This->namedArrays = TRUE; + } else { + TRACE("Setting SPECULAR to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_SPECULAR] = arrayNo; + This->namedArrays = TRUE; + } + break; + case D3DDECLUSAGE_TEXCOORD: + This->namedArrays = TRUE; + /* only 7 texture coords have been designed for, so run a quick sanity check */ + if ((usage & 0xF0000) >> 16 > 7) { + FIXME("(%p) : Program uses texture coordinate %d but only 0-7 have been implemented\n", This, (usage & 0xF0000) >> 16); + } else { + TRACE("Setting TEXCOORD %d to %d\n", ((usage & 0xF0000) >> 16), arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_TEXCOORD0 + ((usage & 0xF0000) >> 16)] = arrayNo; + } + break; + /* The following aren't supported by openGL, + if we get them then everything needs to be mapped to numbered attributes instead of named ones. + this should be caught in the first pass */ + case D3DDECLUSAGE_TANGENT: + TRACE("Setting TANGENT to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_TANGENT] = arrayNo; + This->declaredArrays = TRUE; + break; + case D3DDECLUSAGE_BINORMAL: + TRACE("Setting BINORMAL to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_BINORMAL] = arrayNo; + This->declaredArrays = TRUE; + break; + case D3DDECLUSAGE_TESSFACTOR: + TRACE("Setting TESSFACTOR to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_TESSFACTOR] = arrayNo; + This->declaredArrays = TRUE; + break; + case D3DDECLUSAGE_POSITIONT: + if((usage & 0xF0000) >> 16 == 0) { /* tween data */ + FIXME("Setting positiont to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_POSITIONT] = arrayNo; + This->namedArrays = TRUE; + } else { + FIXME("Setting positiont 2 to %d because usage = %d\n", arrayNo, (usage & 0xF0000) >> 16); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_POSITIONT2] = arrayNo; + This->declaredArrays = TRUE; + if ((usage & 0xF0000) >> 16 != 0) FIXME("Extended positiont\n"); + } + break; + case D3DDECLUSAGE_FOG: + /* supported by OpenGL */ + TRACE("Setting FOG to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_FOG] = arrayNo; + This->namedArrays = TRUE; + break; + case D3DDECLUSAGE_DEPTH: + TRACE("Setting DEPTH to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_DEPTH] = arrayNo; + This->declaredArrays = TRUE; + break; + case D3DDECLUSAGE_SAMPLE: + TRACE("Setting SAMPLE to %d\n", arrayNo); + This->arrayUsageMap[WINED3DSHADERDECLUSAGE_SAMPLE] = arrayNo; + This->declaredArrays = TRUE; + break; + default: + FIXME("Unrecognised dcl %08x", usage & 0xFFFF); + } + } else if(curOpcode->opcode == D3DSIO_DEF) { + This->constantsUsedBitmap[*pToken & 0xFF] = VS_CONSTANT_CONSTANT; + FIXME("Constant %ld\n", *pToken & 0xFF); + ++pToken; + ++pToken; + ++pToken; + ++pToken; + ++pToken; + + } else { + /* Check to see if and tmp or addressing redisters are used */ + if (curOpcode->num_params > 0) { + regtype = ((((*pToken) & D3DSP_REGTYPE_MASK) >> D3DSP_REGTYPE_SHIFT)); + reg = ((*pToken) & 0x00001FFF); + if (D3DSPR_ADDR == regtype && nUseAddressRegister <= reg) nUseAddressRegister = reg + 1; + if (D3DSPR_TEMP == regtype){ + tmpsUsed[reg] = TRUE; + if(nUseTempRegister <= reg) nUseTempRegister = reg + 1; + } + ++pToken; + for (i = 1; i < curOpcode->num_params; ++i) { + regtype = ((((*pToken) & D3DSP_REGTYPE_MASK) >> D3DSP_REGTYPE_SHIFT)); + reg = ((*pToken) & 0x00001FFF); + if (D3DSPR_ADDR == regtype && nUseAddressRegister <= reg) nUseAddressRegister = reg + 1; + if (D3DSPR_TEMP == regtype){ + tmpsUsed[reg] = TRUE; + if(nUseTempRegister <= reg) nUseTempRegister = reg + 1; + } + ++pToken; + } + } + } +#if 1 /* TODO: if the shaders uses calls or loops then we need to convert the shader into glsl */ + if (curOpcode->glname == GLNAME_REQUIRE_GLSL) { + FIXME("This shader requires gl shader language support\n"); +#if 0 + This->shaderLanguage = GLSHADER_GLSL; +#endif + } +#endif + } + } + } +#if 1 +#define VSHADER_ALWAYS_NUMBERED +#endif + +#ifdef VSHADER_ALWAYS_NUMBERED /* handy for debugging using numbered arrays instead of named arrays */ + /* TODO: using numbered arrays for software shaders makes things easier */ + This->declaredArrays = TRUE; +#endif + + /* named arrays and declared arrays are mutually exclusive */ + if (This->declaredArrays) { + This->namedArrays = FALSE; + } + /* TODO: validate + nUseAddressRegister < = GL_MAX_PROGRAM_ADDRESS_REGISTERS_AR + nUseTempRegister <= GL_MAX_PROGRAM_LOCAL_PARAMETERS_ARB + */ + + /** second pass, now generate */ + pToken = pFunction; + + if (NULL != pToken) { + while (1) { + tmpLine[0] = 0; + if ((nRemInstr >= 0) && (--nRemInstr == -1)) + /* Macro is finished, continue normal path */ + pToken = pSavedToken; + if (D3DVS_END() == *pToken) + break; + + if (vshader_is_version_token(*pToken)) { /** version */ + /* Extract version *10 into integer value (ie. 1.0 == 10, 1.1==11 etc */ + int version = (((*pToken >> 8) & 0x0F) * 10) + (*pToken & 0x0F); + int numTemps; + int numConstants; + + TRACE("found version token vs.%lu.%lu;\n", (*pToken >> 8) & 0x0F, (*pToken & 0x0F)); + + /* Each release of vertex shaders has had different numbers of temp registers */ + switch (version) { + case 10: + case 11: numTemps=12; + numConstants=96;/* min(GL_LIMITS(constants),96) */ + strcpy(tmpLine, "!!ARBvp1.0\n"); + TRACE("GL HW (%u) : %s", pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + break; + /* FIXME: if there are no calls or loops then use ARBvp1 otherwise use GLSL instead + TODO: see if there are any operations in vs2/3 that aren't supported by ARBvp + TODO: only map the maximum possible number of constants supported by openGL and not the maximum required by d3d (even better only map the used constants)*/ + case 20: numTemps=12; /* min(GL_LIMITS(temps),12) */ + numConstants=96; /* min(GL_LIMITS(constants),256) */ + strcpy(tmpLine, "!!ARBvp1.0\n"); + FIXME("No work done yet to support vs2.0 in hw\n"); + TRACE("GL HW (%u) : %s", pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + break; + case 21: numTemps=12; /* min(GL_LIMITS(temps),12) */ + numConstants=96; /* min(GL_LIMITS(constants),256) */ + strcpy(tmpLine, "!!ARBvp1.0\n"); + FIXME("No work done yet to support vs2.1 in hw\n"); + TRACE("GL HW (%u) : %s", pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + break; + case 30: numTemps=32; /* min(GL_LIMITS(temps),32) */ + numConstants=96;/* min(GL_LIMITS(constants),256) */ + strcpy(tmpLine, "!!ARBvp3.0\n"); + FIXME("No work done yet to support vs3.0 in hw\n"); + TRACE("GL HW (%u) : %s", pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + break; + default: + numTemps=12;/* min(GL_LIMITS(temps),12) */ + numConstants=96;/* min(GL_LIMITS(constants),96) */ + strcpy(tmpLine, "!!ARBvp1.0\n"); + FIXME("Unrecognized vertex shader version %d!\n", version); + } + PNSTRCAT(pgmStr, tmpLine); + + ++lineNum; + + /* This should be a bitmap so that only temp registers that are used are declared. */ + for (i = 0; i < nUseTempRegister /* we should check numTemps here */ ; i++) { + if (tmpsUsed[i]) { /* only write out the temps if they are actually in use */ + sprintf(tmpLine, "TEMP T%ld;\n", i); + ++lineNum; + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + } + } + /* TODO: loop register counts as an addres register */ + for (i = 0; i < nUseAddressRegister; i++) { + sprintf(tmpLine, "ADDRESS A%ld;\n", i); + ++lineNum; + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + } + /* Due to the dynamic constants binding mechanism, we need to declare + * all the constants for relative addressing. */ + /* Mesa supports only 95 constants for VS1.X although we should have at least 96. */ + if (GL_VEND(MESA) || GL_VEND(WINE)) { + numConstants = 95; + } + /* FIXME: We should be counting the number of constants in the first pass and then validating that many are supported + Looking at some of the shaders inuse by applications we'd need to create a list of all used env variables + */ + sprintf(tmpLine, "PARAM C[%d] = { program.env[0..%d] };\n", numConstants, numConstants - 1); + TRACE("GL HW (%u,%u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + ++lineNum; + + ++pToken; + continue; } if (vshader_is_comment_token(*pToken)) { /** comment */ DWORD comment_len = (*pToken & D3DSI_COMMENTSIZE_MASK) >> D3DSI_COMMENTSIZE_SHIFT; ++pToken; - /*TRACE("comment[%ld] ;%s\n", comment_len, (char*)pToken);*/ + FIXME("#%s\n", (char*)pToken); pToken += comment_len; - len += comment_len + 1; continue; - } - curOpcode = vshader_program_get_opcode(*pToken); + } + + curOpcode = vshader_program_get_opcode(*pToken); + ++pToken; + if (NULL == curOpcode) { + /* unkown current opcode ... (shouldn't be any!) */ + while (*pToken & 0x80000000) { + TRACE("unrecognized opcode: %08lx\n", *pToken); ++pToken; - ++len; - if (NULL == curOpcode) { - /* unkown current opcode ... */ - while (*pToken & 0x80000000) { - TRACE("unrecognized opcode: %08lx\n", *pToken); - ++pToken; - ++len; + } + } else if (GLNAME_REQUIRE_GLSL == curOpcode->glname) { + /* if the token isn't supported by this cross compiler then skip it and it's parameters */ + + FIXME("Token %s requires greater functionality than Vertex_Progarm_ARB supports\n", curOpcode->name); + pToken += curOpcode->num_params; + } else { + /* Build opcode for GL vertex_program */ + switch (curOpcode->opcode) { + case D3DSIO_NOP: + continue; + case D3DSIO_MOV: + /* Address registers must be loaded with the ARL instruction */ + if ((((*pToken) & D3DSP_REGTYPE_MASK) >> D3DSP_REGTYPE_SHIFT) == D3DSPR_ADDR) { + if (((*pToken) & 0x00001FFF) < nUseAddressRegister) { + strcpy(tmpLine, "ARL"); + break; + } else + FIXME("(%p) Try to load A%ld an undeclared address register!\n", This, ((*pToken) & 0x00001FFF)); + } + /* fall through */ + case D3DSIO_ADD: + case D3DSIO_SUB: + case D3DSIO_MAD: + case D3DSIO_MUL: + case D3DSIO_RCP: + case D3DSIO_RSQ: + case D3DSIO_DP3: + case D3DSIO_DP4: + case D3DSIO_MIN: + case D3DSIO_MAX: + case D3DSIO_SLT: + case D3DSIO_SGE: + case D3DSIO_LIT: + case D3DSIO_DST: + case D3DSIO_FRC: + case D3DSIO_EXPP: + case D3DSIO_LOGP: + case D3DSIO_EXP: + case D3DSIO_LOG: + strcpy(tmpLine, curOpcode->glname); + break; + case D3DSIO_M4x4: + case D3DSIO_M4x3: + case D3DSIO_M3x4: + case D3DSIO_M3x3: + case D3DSIO_M3x2: + /* Expand the macro and get nusprintf(tmpLine,mber of generated instruction */ + nRemInstr = ExpandMxMacro(curOpcode->opcode, pToken); + /* Save point to next instruction */ + pSavedToken = pToken + 3; + /* Execute expanded macro */ + pToken = MacroExpansion; + continue; + /* dcl and def are handeled in the first pass */ + case D3DSIO_DCL: + if (This->namedArrays) { + const char* attribName = "undefined"; + switch(*pToken & 0xFFFF) { + case D3DDECLUSAGE_POSITION: + attribName = "vertex.position"; + break; + case D3DDECLUSAGE_BLENDINDICES: + /* not supported by openGL */ + attribName = "vertex.blend"; + break; + case D3DDECLUSAGE_BLENDWEIGHT: + attribName = "vertex.weight"; + break; + case D3DDECLUSAGE_NORMAL: + attribName = "vertex.normal"; + break; + case D3DDECLUSAGE_PSIZE: + attribName = "vertex.psize"; + break; + case D3DDECLUSAGE_COLOR: + if((*pToken & 0xF0000) >> 16 == 0) { + attribName = "vertex.color"; + } else { + attribName = "vertex.color.secondary"; + } + break; + case D3DDECLUSAGE_TEXCOORD: + { + char tmpChar[100]; + tmpChar[0] = 0; + sprintf(tmpChar,"vertex.texcoord[%lu]",(*pToken & 0xF0000) >> 16); + attribName = tmpChar; + break; + } + /* The following aren't directly supported by openGL, so shouldn't come up using namedarrays. */ + case D3DDECLUSAGE_TANGENT: + attribName = "vertex.tangent"; + break; + case D3DDECLUSAGE_BINORMAL: + attribName = "vertex.binormal"; + break; + case D3DDECLUSAGE_TESSFACTOR: + attribName = "vertex.tessfactor"; + break; + case D3DDECLUSAGE_POSITIONT: + attribName = "vertex.possitionT"; + break; + case D3DDECLUSAGE_FOG: + attribName = "vertex.fogcoord"; + break; + case D3DDECLUSAGE_DEPTH: + attribName = "vertex.depth"; + break; + case D3DDECLUSAGE_SAMPLE: + attribName = "vertex.sample"; + break; + default: + FIXME("Unrecognised dcl %08lx", *pToken & 0xFFFF); } - } else { - TRACE("%s ", curOpcode->name); - if (curOpcode->num_params > 0) { - vshader_program_dump_param(*pToken, 0); + { + char tmpChar[80]; ++pToken; - ++len; - for (i = 1; i < curOpcode->num_params; ++i) { - TRACE(", "); - vshader_program_dump_param(*pToken, 1); - ++pToken; - ++len; + sprintf(tmpLine, "ATTRIB "); + vshader_program_add_param(*pToken, 0, tmpLine, This->namedArrays, This->constantsUsedBitmap); + sprintf(tmpChar," = %s", attribName); + strcat(tmpLine, tmpChar); + strcat(tmpLine,";\n"); + ++lineNum; + if (This->namedArrays) { + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); + PNSTRCAT(pgmStr, tmpLine); + + } else { + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); } } - TRACE("\n"); + } else { + /* eat the token so it doesn't generate a warning */ + ++pToken; + } + ++pToken; + continue; + case D3DSIO_DEF: + { + char tmpChar[80]; + sprintf(tmpLine, "PARAM const%lu = {", *pToken & 0xFF); + ++pToken; + sprintf(tmpChar,"%f ,", *(float *)pToken); + strcat(tmpLine, tmpChar); + ++pToken; + sprintf(tmpChar,"%f ,", *(float *)pToken); + strcat(tmpLine, tmpChar); + ++pToken; + sprintf(tmpChar,"%f ,", *(float *)pToken); + strcat(tmpLine, tmpChar); + ++pToken; + sprintf(tmpChar,"%f}", *(float *)pToken); + strcat(tmpLine, tmpChar); + + strcat(tmpLine,";\n"); + ++lineNum; + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + ++pToken; + continue; + } + default: + if (curOpcode->glname == GLNAME_REQUIRE_GLSL) { + FIXME("Opcode %s requires Gl Shader languange 1.0\n", curOpcode->name); + } else { + FIXME("Can't handle opcode %s in hwShader\n", curOpcode->name); } } - This->functionLength = (len + 1) * sizeof(DWORD); - } else { - This->functionLength = 1; /* no Function defined use fixed function vertex processing */ - } - /* copy the function ... because it will certainly be released by application */ + if (curOpcode->num_params > 0) { + vshader_program_add_param(*pToken, 0, tmpLine, This->namedArrays, This->constantsUsedBitmap); - if (NULL != pFunction) { - This->function = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, This->functionLength); - memcpy((void *)This->function, pFunction, This->functionLength); - } else { - This->function = NULL; + ++pToken; + for (i = 1; i < curOpcode->num_params; ++i) { + strcat(tmpLine, ","); + vshader_program_add_param(*pToken, 1, tmpLine, This->namedArrays, This->constantsUsedBitmap); + ++pToken; + } + } + strcat(tmpLine,";\n"); + ++lineNum; + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + } } - return D3D_OK; + strcpy(tmpLine, "END\n"); + ++lineNum; + TRACE("GL HW (%u, %u) : %s", lineNum, pgmLength, tmpLine); /* Don't add \n to this line as already in tmpLine */ + PNSTRCAT(pgmStr, tmpLine); + + } +/* finally null terminate the pgmStr*/ + pgmStr[pgmLength] = 0; + /* Create the hw shader */ + /* TODO: change to resource.glObjectHandel or something like that */ + GL_EXTCALL(glGenProgramsARB(1, &This->prgId)); + TRACE("Creating a hw vertex shader, prg=%d\n", This->prgId); + + GL_EXTCALL(glBindProgramARB(GL_VERTEX_PROGRAM_ARB, This->prgId)); + + + /* Create the program and check for errors */ + GL_EXTCALL(glProgramStringARB(GL_VERTEX_PROGRAM_ARB, GL_PROGRAM_FORMAT_ASCII_ARB, strlen(pgmStr)/*pgmLength*/, pgmStr)); + if (glGetError() == GL_INVALID_OPERATION) { + GLint errPos; + glGetIntegerv(GL_PROGRAM_ERROR_POSITION_ARB, &errPos); + FIXME("HW VertexShader Error at position: %d\n%s\n", errPos, glGetString(GL_PROGRAM_ERROR_STRING_ARB)); + This->prgId = -1; + } +#if 1 /* if were using the data buffer of device then we don't need to free it */ + HeapFree(GetProcessHeap(), 0, pgmStr); +#endif +#undef PNSTRCAT } BOOL IWineD3DVertexShaderImpl_ExecuteHAL(IWineD3DVertexShader* iface, WINEVSHADERINPUTDATA* input, WINEVSHADEROUTPUTDATA* output) { @@ -591,6 +1692,7 @@ HRESULT WINAPI IWineD3DVertexShaderImpl_ExecuteSW(IWineD3DVertexShader* iface, W #endif TRACE_VSVECTOR(vshader->data->C[64]); + /* TODO: Run through all the tokens and find and labels, if, endifs, loops etc...., and make a labels list */ /* the first dword is the version tag */ /* TODO: parse it */ @@ -610,7 +1712,8 @@ HRESULT WINAPI IWineD3DVertexShaderImpl_ExecuteSW(IWineD3DVertexShader* iface, W if (NULL == curOpcode) { i = 0; /* unkown current opcode ... */ - while (*pToken & 0x80000000) { + /* TODO: Think of a name for 0x80000000 and repalce it's use with a constant */ + while (*pToken & 0x80000000) { if (i == 0) { TRACE("unrecognized opcode: pos=%d token=%08lX\n", (pToken - 1) - This->function, *(pToken - 1)); } @@ -673,12 +1776,17 @@ HRESULT WINAPI IWineD3DVertexShaderImpl_ExecuteSW(IWineD3DVertexShader* iface, W /* TRACE("p[%d]=oT[%d]\n", i, reg); */ p[i] = &output->oT[reg]; break; + /* TODO Decls and defs */ +#if 0 + case D3DSPR_DCL: + case D3DSPR_DEF: +#endif default: break; } - + if (i > 0) { /* input reg */ - DWORD swizzle = (pToken[i] & D3DVS_SWIZZLE_MASK) >> D3DVS_SWIZZLE_SHIFT; + DWORD swizzle = (pToken[i] & D3DVS_SWIZZLE_MASK) >> D3DVS_SWIZZLE_SHIFT; UINT isNegative = ((pToken[i] & D3DSP_SRCMOD_MASK) == D3DSPSM_NEG); if (!isNegative && (D3DVS_NOSWIZZLE >> D3DVS_SWIZZLE_SHIFT) == swizzle) { @@ -726,6 +1834,9 @@ HRESULT WINAPI IWineD3DVertexShaderImpl_ExecuteSW(IWineD3DVertexShader* iface, W case 5: curOpcode->soft_fct(p_send[0], p_send[1], p_send[2], p_send[3], p_send[4]); break; + case 6: + curOpcode->soft_fct(p_send[0], p_send[1], p_send[2], p_send[3], p_send[4], p_send[5]); + break; default: ERR("%s too many params: %u\n", curOpcode->name, curOpcode->num_params); } @@ -918,7 +2029,156 @@ HRESULT WINAPI IWineD3DVertexShaderImpl_GetFunction(IWineD3DVertexShader* impl, return D3D_OK; } +HRESULT WINAPI IWineD3DVertexShaderImpl_SetFunction(IWineD3DVertexShader *iface, CONST DWORD *pFunction) { + IWineD3DVertexShaderImpl *This =(IWineD3DVertexShaderImpl *)iface; + const DWORD* pToken = pFunction; + const SHADER_OPCODE* curOpcode = NULL; + DWORD len = 0; + DWORD i; + TRACE("(%p) : Parsing programme\n", This); + if (NULL != pToken) { + while (D3DVS_END() != *pToken) { + if (vshader_is_version_token(*pToken)) { /** version */ + TRACE("vs_%lu_%lu\n", (*pToken >> 8) & 0x0F, (*pToken & 0x0F)); + ++pToken; + ++len; + continue; + } + if (vshader_is_comment_token(*pToken)) { /** comment */ + DWORD comment_len = (*pToken & D3DSI_COMMENTSIZE_MASK) >> D3DSI_COMMENTSIZE_SHIFT; + ++pToken; + TRACE("//%s\n", (char*)pToken); + pToken += comment_len; + len += comment_len + 1; + continue; + } + curOpcode = vshader_program_get_opcode(*pToken); + ++pToken; + ++len; + if (NULL == curOpcode) { + /* TODO: Think of a good name for 0x80000000 and replace it with a constant */ + while (*pToken & 0x80000000) { + /* unkown current opcode ... */ + TRACE("unrecognized opcode: %08lx", *pToken); + ++pToken; + ++len; + TRACE("\n"); + } + + } else { + if (curOpcode->opcode == D3DSIO_DCL) { + TRACE("dcl_"); + switch(*pToken & 0xFFFF) { + case D3DDECLUSAGE_POSITION: + TRACE("%s%ld ", "position",(*pToken & 0xF0000) >> 16); + break; + case D3DDECLUSAGE_BLENDINDICES: + TRACE("%s ", "blend"); + break; + case D3DDECLUSAGE_BLENDWEIGHT: + TRACE("%s ", "weight"); + break; + case D3DDECLUSAGE_NORMAL: + TRACE("%s%ld ", "normal",(*pToken & 0xF0000) >> 16); + break; + case D3DDECLUSAGE_PSIZE: + TRACE("%s ", "psize"); + break; + case D3DDECLUSAGE_COLOR: + if((*pToken & 0xF0000) >> 16 == 0) { + TRACE("%s ", "color"); + } else { + TRACE("%s ", "specular"); + } + break; + case D3DDECLUSAGE_TEXCOORD: + TRACE("%s%ld ", "texture", (*pToken & 0xF0000) >> 16); + break; + case D3DDECLUSAGE_TANGENT: + TRACE("%s ", "tangent"); + break; + case D3DDECLUSAGE_BINORMAL: + TRACE("%s ", "binormal"); + break; + case D3DDECLUSAGE_TESSFACTOR: + TRACE("%s ", "tessfactor"); + break; + case D3DDECLUSAGE_POSITIONT: + TRACE("%s%ld ", "positionT",(*pToken & 0xF0000) >> 16); + break; + case D3DDECLUSAGE_FOG: + TRACE("%s ", "fog"); + break; + case D3DDECLUSAGE_DEPTH: + TRACE("%s ", "depth"); + break; + case D3DDECLUSAGE_SAMPLE: + TRACE("%s ", "sample"); + break; + default: + FIXME("Unrecognised dcl %08lx", *pToken & 0xFFFF); + } + ++pToken; + ++len; + vshader_program_dump_vs_param(*pToken, 0); + ++pToken; + ++len; + } else + if (curOpcode->opcode == D3DSIO_DEF) { + TRACE("def c%lu = ", *pToken & 0xFF); + ++pToken; + ++len; + TRACE("%f ,", *(float *)pToken); + ++pToken; + ++len; + TRACE("%f ,", *(float *)pToken); + ++pToken; + ++len; + TRACE("%f ,", *(float *)pToken); + ++pToken; + ++len; + TRACE("%f", *(float *)pToken); + ++pToken; + ++len; + } else { + TRACE("%s ", curOpcode->name); + if (curOpcode->num_params > 0) { + vshader_program_dump_vs_param(*pToken, 0); + ++pToken; + ++len; + for (i = 1; i < curOpcode->num_params; ++i) { + TRACE(", "); + vshader_program_dump_vs_param(*pToken, 1); + ++pToken; + ++len; + } + } + } + TRACE("\n"); + } + } + This->functionLength = (len + 1) * sizeof(DWORD); + } else { + This->functionLength = 1; /* no Function defined use fixed function vertex processing */ + } + + /* Generate HW shader in needed */ + if (NULL != pFunction && wined3d_settings.vs_mode == VS_HW) { +#if 1 + IWineD3DVertexShaderImpl_GenerateProgramArbHW(iface, pFunction); +#endif + } + + /* copy the function ... because it will certainly be released by application */ + if (NULL != pFunction) { + This->function = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, This->functionLength); + memcpy((void *)This->function, pFunction, This->functionLength); + } else { + This->function = NULL; + } + return D3D_OK; +} const IWineD3DVertexShaderVtbl IWineD3DVertexShader_Vtbl = { @@ -929,5 +2189,6 @@ const IWineD3DVertexShaderVtbl IWineD3DVertexShader_Vtbl = /*** IWineD3DVertexShader methods ***/ IWineD3DVertexShaderImpl_GetParent, IWineD3DVertexShaderImpl_GetDevice, - IWineD3DVertexShaderImpl_GetFunction + IWineD3DVertexShaderImpl_GetFunction, + IWineD3DVertexShaderImpl_SetFunction }; diff --git a/dlls/wined3d/wined3d_private.h b/dlls/wined3d/wined3d_private.h index 6be07eef4be..cb7395e3fb2 100644 --- a/dlls/wined3d/wined3d_private.h +++ b/dlls/wined3d/wined3d_private.h @@ -155,6 +155,7 @@ extern int num_lock; #define GL_SUPPORT(ExtName) (GLINFO_LOCATION.supported[ExtName] != 0) #define GL_LIMITS(ExtName) (GLINFO_LOCATION.max_##ExtName) #define GL_EXTCALL(FuncName) (GLINFO_LOCATION.FuncName) +#define GL_VEND(_VendName) (GLINFO_LOCATION.gl_vendor == VENDOR_##_VendName ? TRUE : FALSE) #define D3DCOLOR_R(dw) (((float) (((dw) >> 16) & 0xFF)) / 255.0f) #define D3DCOLOR_G(dw) (((float) (((dw) >> 8) & 0xFF)) / 255.0f) @@ -888,9 +889,9 @@ struct IWineD3DStateBlockImpl /* Drawing - Vertex Shader or FVF related */ DWORD fvf; /* Vertex Shader Declaration */ - IWineD3DVertexDeclaration* vertexDecl; + IWineD3DVertexDeclaration *vertexDecl; - void *vertexShader; /* @TODO: Replace void * with IWineD3DVertexShader * */ + IWineD3DVertexShader *vertexShader; /* @TODO: Replace void * with IWineD3DVertexShader * */ /* Vertex Shader Constants */ BOOL vertexShaderConstantB[MAX_VSHADER_CONSTANTS]; @@ -1094,6 +1095,15 @@ int D3DFmtMakeGlCfg(D3DFORMAT BackBufferFormat, D3DFORMAT StencilBufferFormat, i /*** class static members ***/ void IWineD3DBaseTextureImpl_CleanUp(IWineD3DBaseTexture *iface); +/* an emul for the type of constants that are used... adressing causes problems with being able to work out what's used and what's not.. so maybe we'll have to rely on the server vertex shader const functions? */ +enum vsConstantsEnum { + VS_CONSTANT_NOT_USED = 0, + VS_CONSTANT_CONSTANT, + VS_CONSTANT_INTEGER, + VS_CONSTANT_BOOLEAN, + VS_CONSTANT_FLOAT +}; + /***************************************************************************** * IDirect3DVertexShader implementation structure */ @@ -1105,19 +1115,25 @@ typedef struct IWineD3DVertexShaderImpl { IUnknown *parent; IWineD3DDeviceImpl *wineD3DDevice; - /* IWineD3DVertexShaderImpl*/ + /* IWineD3DVertexShaderImpl */ CONST DWORD *function; UINT functionLength; DWORD usage; DWORD version; + + /* vertex declaration array mapping */ + BOOL namedArrays; /* don't map use named functions */ + BOOL declaredArrays; /* mapping requires */ + INT arrayUsageMap[WINED3DSHADERDECLUSAGE_MAX_USAGE]; /* lookup table for the maps */ + INT highestConstant; + CHAR constantsUsedBitmap[256]; + /* FIXME: This needs to be populated with some flags of VS_CONSTANT_NOT_USED, VS_CONSTANT_CONSTANT, VS_CONSTANT_INTEGER, VS_CONSTANT_BOOLEAN, VS_CONSTANT_FLOAT, a half byte bitmap will be the best option, but I'll keep it as chards for siplicity */ /* run time datas... */ VSHADERDATA* data; + GLint prgId; #if 0 /* needs reworking */ - DWORD usage; - DWORD version; /* run time datas */ - VSHADERDATA* data; VSHADERINPUTDATA input; VSHADEROUTPUTDATA output; #endif diff --git a/include/wine/wined3d_interface.h b/include/wine/wined3d_interface.h index 57c1c3edec9..70cf0e54be0 100644 --- a/include/wine/wined3d_interface.h +++ b/include/wine/wined3d_interface.h @@ -1250,8 +1250,9 @@ DECLARE_INTERFACE_(IWineD3DVertexShader,IUnknown) STDMETHOD_(ULONG,Release)(THIS) PURE; /*** IWineD3DVertexShader methods ***/ STDMETHOD(GetParent)(THIS_ IUnknown **pParent) PURE; - STDMETHOD(GetDevice)(THIS_ IWineD3DDevice** ppDevice) PURE; - STDMETHOD(GetFunction)(THIS_ VOID* pData, UINT* pSizeOfData) PURE; + STDMETHOD(GetDevice)(THIS_ IWineD3DDevice** ppDevice) PURE; + STDMETHOD(GetFunction)(THIS_ VOID *pData, UINT *pSizeOfData) PURE; + STDMETHOD(SetFunction)(THIS_ CONST DWORD *pFunction) PURE; STDMETHOD(SetConstantB)(THIS_ UINT StartRegister, CONST BOOL* pConstantData, UINT BoolCount) PURE; STDMETHOD(SetConstantI)(THIS_ UINT StartRegister, CONST INT* pConstantData, UINT Vector4iCount) PURE; STDMETHOD(SetConstantF)(THIS_ UINT StartRegister, CONST FLOAT* pConstantData, UINT Vector4fCount) PURE; @@ -1272,6 +1273,7 @@ DECLARE_INTERFACE_(IWineD3DVertexShader,IUnknown) #define IWineD3DVertexShader_GetParent(p,a) (p)->lpVtbl->GetParent(p,a) #define IWineD3DVertexShader_GetDevice(p,a) (p)->lpVtbl->GetDevice(p,a) #define IWineD3DVertexShader_GetFunction(p,a,b) (p)->lpVtbl->GetFunction(p,a,b) +#define IWineD3DVertexShader_SetFunction(p,a) (p)->lpVtbl->SetFunction(p,a) #define IWineD3DVertexShader_SetConstantB(p,a,b,c) (p)->lpVtbl->SetConstantB(p,a,b,c) #define IWineD3DVertexShader_SetConstantI(p,a,b,c) (p)->lpVtbl->SetConstantI(p,a,b,c) #define IWineD3DVertexShader_SetConstantF(p,a,b,c) (p)->lpVtbl->SetConstantF(p,a,b,c)