2005-08-25 21:24:21 +02:00
|
|
|
/*
|
|
|
|
* shaders implementation
|
|
|
|
*
|
2006-05-08 21:44:25 +02:00
|
|
|
* Copyright 2002-2003 Jason Edmeades
|
|
|
|
* Copyright 2002-2003 Raphael Junqueira
|
2006-07-17 20:35:14 +02:00
|
|
|
* Copyright 2004 Christian Costa
|
2006-05-08 21:44:25 +02:00
|
|
|
* Copyright 2005 Oliver Stieber
|
2006-05-17 08:04:30 +02:00
|
|
|
* Copyright 2006 Ivan Gyurdiev
|
2005-08-25 21:24:21 +02:00
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library; if not, write to the Free Software
|
2006-05-18 14:49:52 +02:00
|
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
|
2005-08-25 21:24:21 +02:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include "config.h"
|
|
|
|
|
|
|
|
#include <math.h>
|
2005-11-21 17:27:55 +01:00
|
|
|
#include <stdio.h>
|
2005-08-25 21:24:21 +02:00
|
|
|
|
|
|
|
#include "wined3d_private.h"
|
|
|
|
|
|
|
|
WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
|
|
|
|
|
2007-06-09 14:27:41 +02:00
|
|
|
#define GLINFO_LOCATION ((IWineD3DDeviceImpl *) This->baseShader.device)->adapter->gl_info
|
2005-08-25 21:24:21 +02:00
|
|
|
|
2005-11-21 17:27:55 +01:00
|
|
|
#if 0 /* Must not be 1 in cvs version */
|
|
|
|
# define PSTRACE(A) TRACE A
|
|
|
|
# define TRACE_VSVECTOR(name) TRACE( #name "=(%f, %f, %f, %f)\n", name.x, name.y, name.z, name.w)
|
|
|
|
#else
|
|
|
|
# define PSTRACE(A)
|
|
|
|
# define TRACE_VSVECTOR(name)
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define GLNAME_REQUIRE_GLSL ((const char *)1)
|
2005-08-25 21:24:21 +02:00
|
|
|
/* *******************************************
|
|
|
|
IWineD3DPixelShader IUnknown parts follow
|
|
|
|
******************************************* */
|
2006-06-10 13:15:32 +02:00
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_QueryInterface(IWineD3DPixelShader *iface, REFIID riid, LPVOID *ppobj)
|
2005-08-25 21:24:21 +02:00
|
|
|
{
|
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
|
|
|
TRACE("(%p)->(%s,%p)\n",This,debugstr_guid(riid),ppobj);
|
|
|
|
if (IsEqualGUID(riid, &IID_IUnknown)
|
2006-02-06 11:32:41 +01:00
|
|
|
|| IsEqualGUID(riid, &IID_IWineD3DBase)
|
2006-03-28 21:10:51 +02:00
|
|
|
|| IsEqualGUID(riid, &IID_IWineD3DBaseShader)
|
2005-08-25 21:24:21 +02:00
|
|
|
|| IsEqualGUID(riid, &IID_IWineD3DPixelShader)) {
|
|
|
|
IUnknown_AddRef(iface);
|
|
|
|
*ppobj = This;
|
2006-04-25 23:59:12 +02:00
|
|
|
return S_OK;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
2006-04-25 23:59:12 +02:00
|
|
|
*ppobj = NULL;
|
2005-08-25 21:24:21 +02:00
|
|
|
return E_NOINTERFACE;
|
|
|
|
}
|
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static ULONG WINAPI IWineD3DPixelShaderImpl_AddRef(IWineD3DPixelShader *iface) {
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
2006-10-01 05:20:10 +02:00
|
|
|
TRACE("(%p) : AddRef increasing from %d\n", This, This->ref);
|
2005-08-25 21:24:21 +02:00
|
|
|
return InterlockedIncrement(&This->ref);
|
|
|
|
}
|
|
|
|
|
2007-09-21 23:47:40 +02:00
|
|
|
static void destroy_glsl_pshader(IWineD3DPixelShaderImpl *This) {
|
|
|
|
struct list *linked_programs = &This->baseShader.linked_programs;
|
|
|
|
|
|
|
|
TRACE("Deleting linked programs\n");
|
|
|
|
if (linked_programs->next) {
|
|
|
|
struct glsl_shader_prog_link *entry, *entry2;
|
|
|
|
LIST_FOR_EACH_ENTRY_SAFE(entry, entry2, linked_programs, struct glsl_shader_prog_link, pshader_entry) {
|
|
|
|
delete_glsl_program_entry(This->baseShader.device, entry);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
TRACE("Deleting shader object %u\n", This->baseShader.prgId);
|
|
|
|
GL_EXTCALL(glDeleteObjectARB(This->baseShader.prgId));
|
|
|
|
checkGLcall("glDeleteObjectARB");
|
|
|
|
}
|
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static ULONG WINAPI IWineD3DPixelShaderImpl_Release(IWineD3DPixelShader *iface) {
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
|
|
|
ULONG ref;
|
2006-10-01 05:20:10 +02:00
|
|
|
TRACE("(%p) : Releasing from %d\n", This, This->ref);
|
2005-08-25 21:24:21 +02:00
|
|
|
ref = InterlockedDecrement(&This->ref);
|
|
|
|
if (ref == 0) {
|
wined3d: Rework shader mode selection.
- currently half the shader selection code (GLSL vs ARB) is in
fillGLcaps. The parts that check for software shaders are in
GetDeviceCaps. That placement, will work, but is definitely not optimal.
FillGLcaps should detect support - it should not make decision as to
what's used, because that's not what the purpose of the function is.
GetDeviceCaps should report support as it has already been selected.
Instead, select shader mode in its own function, called in the
appropriate places.
- unifying pixel and vertex shaders into a single selection is a
mistake. A software vertex shader can be coupled with a hardware arb or
glsl pixel shader, or no shader at all. Split them back into two and add
a SHADER_NONE variant.
- drawprim is doing support checks for ARB_PROGRAM, and making shader
decisions based on that - that's wrong, support has already been
checked, and decided upon, and shaders can be implemented via software,
ARB_PROGRAm or GLSL, so that support check isn't valid.
- Store the shader selected mode into the shader itself. Different types
of shaders can be combined, so this is an improvement. In fact, storing
the mode into the settings globally is a mistake as well - it should be
done per device, since different cards have different capabilities.
2006-07-04 09:21:53 +02:00
|
|
|
if (This->baseShader.shader_mode == SHADER_GLSL && This->baseShader.prgId != 0) {
|
2007-09-21 23:47:40 +02:00
|
|
|
destroy_glsl_pshader(This);
|
2006-06-09 09:35:49 +02:00
|
|
|
}
|
2006-07-10 06:51:03 +02:00
|
|
|
shader_delete_constant_list(&This->baseShader.constantsF);
|
|
|
|
shader_delete_constant_list(&This->baseShader.constantsB);
|
|
|
|
shader_delete_constant_list(&This->baseShader.constantsI);
|
|
|
|
HeapFree(GetProcessHeap(), 0, This);
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
|
|
|
return ref;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* *******************************************
|
|
|
|
IWineD3DPixelShader IWineD3DPixelShader parts follow
|
|
|
|
******************************************* */
|
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_GetParent(IWineD3DPixelShader *iface, IUnknown** parent){
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
|
|
|
|
2005-12-03 18:10:56 +01:00
|
|
|
*parent = This->parent;
|
2005-08-25 21:24:21 +02:00
|
|
|
IUnknown_AddRef(*parent);
|
|
|
|
TRACE("(%p) : returning %p\n", This, *parent);
|
2006-04-07 12:51:12 +02:00
|
|
|
return WINED3D_OK;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
2005-11-21 17:27:55 +01:00
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_GetDevice(IWineD3DPixelShader* iface, IWineD3DDevice **pDevice){
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
2006-09-27 13:14:46 +02:00
|
|
|
IWineD3DDevice_AddRef(This->baseShader.device);
|
|
|
|
*pDevice = This->baseShader.device;
|
2005-08-25 21:24:21 +02:00
|
|
|
TRACE("(%p) returning %p\n", This, *pDevice);
|
2006-04-07 12:51:12 +02:00
|
|
|
return WINED3D_OK;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_GetFunction(IWineD3DPixelShader* impl, VOID* pData, UINT* pSizeOfData) {
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)impl;
|
2006-06-09 23:46:38 +02:00
|
|
|
TRACE("(%p) : pData(%p), pSizeOfData(%p)\n", This, pData, pSizeOfData);
|
2005-08-25 21:24:21 +02:00
|
|
|
|
|
|
|
if (NULL == pData) {
|
2006-03-30 19:14:31 +02:00
|
|
|
*pSizeOfData = This->baseShader.functionLength;
|
2006-04-07 12:51:12 +02:00
|
|
|
return WINED3D_OK;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
2006-03-30 19:14:31 +02:00
|
|
|
if (*pSizeOfData < This->baseShader.functionLength) {
|
2007-03-08 01:16:09 +01:00
|
|
|
/* MSDN claims (for d3d8 at least) that if *pSizeOfData is smaller
|
|
|
|
* than the required size we should write the required size and
|
|
|
|
* return D3DERR_MOREDATA. That's not actually true. */
|
|
|
|
return WINED3DERR_INVALIDCALL;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
2006-03-30 19:14:31 +02:00
|
|
|
if (NULL == This->baseShader.function) { /* no function defined */
|
2005-08-25 21:24:21 +02:00
|
|
|
TRACE("(%p) : GetFunction no User Function defined using NULL to %p\n", This, pData);
|
|
|
|
(*(DWORD **) pData) = NULL;
|
|
|
|
} else {
|
2006-03-30 19:14:31 +02:00
|
|
|
if (This->baseShader.functionLength == 0) {
|
2005-08-25 21:24:21 +02:00
|
|
|
|
|
|
|
}
|
|
|
|
TRACE("(%p) : GetFunction copying to %p\n", This, pData);
|
2006-03-30 19:14:31 +02:00
|
|
|
memcpy(pData, This->baseShader.function, This->baseShader.functionLength);
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
2006-04-07 12:51:12 +02:00
|
|
|
return WINED3D_OK;
|
2005-08-25 21:24:21 +02:00
|
|
|
}
|
|
|
|
|
2006-03-28 21:10:44 +02:00
|
|
|
CONST SHADER_OPCODE IWineD3DPixelShaderImpl_shader_ins[] = {
|
2006-05-10 00:05:26 +02:00
|
|
|
/* Arithmethic */
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_NOP, "nop", "NOP", 0, 0, pshader_hw_map2gl, NULL, 0, 0},
|
|
|
|
{WINED3DSIO_MOV, "mov", "MOV", 1, 2, pshader_hw_map2gl, shader_glsl_mov, 0, 0},
|
|
|
|
{WINED3DSIO_ADD, "add", "ADD", 1, 3, pshader_hw_map2gl, shader_glsl_arith, 0, 0},
|
|
|
|
{WINED3DSIO_SUB, "sub", "SUB", 1, 3, pshader_hw_map2gl, shader_glsl_arith, 0, 0},
|
|
|
|
{WINED3DSIO_MAD, "mad", "MAD", 1, 4, pshader_hw_map2gl, shader_glsl_mad, 0, 0},
|
|
|
|
{WINED3DSIO_MUL, "mul", "MUL", 1, 3, pshader_hw_map2gl, shader_glsl_arith, 0, 0},
|
|
|
|
{WINED3DSIO_RCP, "rcp", "RCP", 1, 2, pshader_hw_map2gl, shader_glsl_rcp, 0, 0},
|
2007-07-02 22:40:06 +02:00
|
|
|
{WINED3DSIO_RSQ, "rsq", "RSQ", 1, 2, pshader_hw_map2gl, shader_glsl_rsq, 0, 0},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_DP3, "dp3", "DP3", 1, 3, pshader_hw_map2gl, shader_glsl_dot, 0, 0},
|
|
|
|
{WINED3DSIO_DP4, "dp4", "DP4", 1, 3, pshader_hw_map2gl, shader_glsl_dot, 0, 0},
|
|
|
|
{WINED3DSIO_MIN, "min", "MIN", 1, 3, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
|
|
|
{WINED3DSIO_MAX, "max", "MAX", 1, 3, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
|
|
|
{WINED3DSIO_SLT, "slt", "SLT", 1, 3, pshader_hw_map2gl, shader_glsl_compare, 0, 0},
|
|
|
|
{WINED3DSIO_SGE, "sge", "SGE", 1, 3, pshader_hw_map2gl, shader_glsl_compare, 0, 0},
|
|
|
|
{WINED3DSIO_ABS, "abs", "ABS", 1, 2, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
|
|
|
{WINED3DSIO_EXP, "exp", "EX2", 1, 2, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
2007-09-09 21:24:53 +02:00
|
|
|
{WINED3DSIO_LOG, "log", "LG2", 1, 2, pshader_hw_map2gl, shader_glsl_log, 0, 0},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_EXPP, "expp", "EXP", 1, 2, pshader_hw_map2gl, shader_glsl_expp, 0, 0},
|
|
|
|
{WINED3DSIO_LOGP, "logp", "LOG", 1, 2, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
|
|
|
{WINED3DSIO_DST, "dst", "DST", 1, 3, pshader_hw_map2gl, shader_glsl_dst, 0, 0},
|
|
|
|
{WINED3DSIO_LRP, "lrp", "LRP", 1, 4, pshader_hw_map2gl, shader_glsl_lrp, 0, 0},
|
|
|
|
{WINED3DSIO_FRC, "frc", "FRC", 1, 2, pshader_hw_map2gl, shader_glsl_map2gl, 0, 0},
|
2007-07-22 21:41:29 +02:00
|
|
|
{WINED3DSIO_CND, "cnd", NULL, 1, 4, pshader_hw_cnd, shader_glsl_cnd, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,4)},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_CMP, "cmp", NULL, 1, 4, pshader_hw_cmp, shader_glsl_cmp, WINED3DPS_VERSION(1,2), WINED3DPS_VERSION(3,0)},
|
2007-09-05 16:27:10 +02:00
|
|
|
{WINED3DSIO_POW, "pow", "POW", 1, 3, pshader_hw_map2gl, shader_glsl_pow, 0, 0},
|
|
|
|
{WINED3DSIO_CRS, "crs", "XPD", 1, 3, pshader_hw_map2gl, shader_glsl_cross, 0, 0},
|
2007-09-05 20:09:06 +02:00
|
|
|
{WINED3DSIO_NRM, "nrm", NULL, 1, 2, shader_hw_nrm, shader_glsl_map2gl, 0, 0},
|
2007-09-26 22:09:59 +02:00
|
|
|
{WINED3DSIO_SINCOS, "sincos", NULL, 1, 4, shader_hw_sincos, shader_glsl_sincos, WINED3DPS_VERSION(2,0), WINED3DPS_VERSION(2,1)},
|
|
|
|
{WINED3DSIO_SINCOS, "sincos", "SCS", 1, 2, shader_hw_sincos, shader_glsl_sincos, WINED3DPS_VERSION(3,0), -1},
|
2007-09-05 16:46:12 +02:00
|
|
|
{WINED3DSIO_DP2ADD, "dp2add", NULL, 1, 4, pshader_hw_dp2add, pshader_glsl_dp2add, WINED3DPS_VERSION(2,0), -1},
|
2006-05-10 00:05:26 +02:00
|
|
|
/* Matrix */
|
2007-09-05 20:01:53 +02:00
|
|
|
{WINED3DSIO_M4x4, "m4x4", "undefined", 1, 3, shader_hw_mnxn, shader_glsl_mnxn, 0, 0},
|
|
|
|
{WINED3DSIO_M4x3, "m4x3", "undefined", 1, 3, shader_hw_mnxn, shader_glsl_mnxn, 0, 0},
|
|
|
|
{WINED3DSIO_M3x4, "m3x4", "undefined", 1, 3, shader_hw_mnxn, shader_glsl_mnxn, 0, 0},
|
|
|
|
{WINED3DSIO_M3x3, "m3x3", "undefined", 1, 3, shader_hw_mnxn, shader_glsl_mnxn, 0, 0},
|
|
|
|
{WINED3DSIO_M3x2, "m3x2", "undefined", 1, 3, shader_hw_mnxn, shader_glsl_mnxn, 0, 0},
|
2006-05-10 00:05:26 +02:00
|
|
|
/* Register declarations */
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_DCL, "dcl", NULL, 0, 2, NULL, NULL, 0, 0},
|
2006-04-16 11:25:15 +02:00
|
|
|
/* Flow control - requires GLSL or software shaders */
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_REP , "rep", NULL, 0, 1, NULL, shader_glsl_rep, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_ENDREP, "endrep", NULL, 0, 0, NULL, shader_glsl_end, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_IF, "if", NULL, 0, 1, NULL, shader_glsl_if, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_IFC, "ifc", NULL, 0, 2, NULL, shader_glsl_ifc, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_ELSE, "else", NULL, 0, 0, NULL, shader_glsl_else, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_ENDIF, "endif", NULL, 0, 0, NULL, shader_glsl_end, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_BREAK, "break", NULL, 0, 0, NULL, shader_glsl_break, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_BREAKC, "breakc", NULL, 0, 2, NULL, shader_glsl_breakc, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_BREAKP, "breakp", GLNAME_REQUIRE_GLSL, 0, 1, NULL, NULL, 0, 0},
|
|
|
|
{WINED3DSIO_CALL, "call", NULL, 0, 1, NULL, shader_glsl_call, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_CALLNZ, "callnz", NULL, 0, 2, NULL, shader_glsl_callnz, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_LOOP, "loop", NULL, 0, 2, NULL, shader_glsl_loop, WINED3DPS_VERSION(3,0), -1},
|
|
|
|
{WINED3DSIO_RET, "ret", NULL, 0, 0, NULL, NULL, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_ENDLOOP, "endloop", NULL, 0, 0, NULL, shader_glsl_end, WINED3DPS_VERSION(3,0), -1},
|
|
|
|
{WINED3DSIO_LABEL, "label", NULL, 0, 1, NULL, shader_glsl_label, WINED3DPS_VERSION(2,1), -1},
|
2006-05-10 00:05:26 +02:00
|
|
|
/* Constant definitions */
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_DEF, "def", "undefined", 1, 5, NULL, NULL, 0, 0},
|
|
|
|
{WINED3DSIO_DEFB, "defb", GLNAME_REQUIRE_GLSL, 1, 2, NULL, NULL, 0, 0},
|
|
|
|
{WINED3DSIO_DEFI, "defi", GLNAME_REQUIRE_GLSL, 1, 5, NULL, NULL, 0, 0},
|
2006-05-10 00:05:26 +02:00
|
|
|
/* Texture */
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_TEXCOORD, "texcoord", "undefined", 1, 1, pshader_hw_texcoord, pshader_glsl_texcoord, 0, WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXCOORD, "texcrd", "undefined", 1, 2, pshader_hw_texcoord, pshader_glsl_texcoord, WINED3DPS_VERSION(1,4), WINED3DPS_VERSION(1,4)},
|
2007-08-30 23:35:50 +02:00
|
|
|
{WINED3DSIO_TEXKILL, "texkill", "KIL", 1, 1, pshader_hw_texkill, pshader_glsl_texkill, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(3,0)},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_TEX, "tex", "undefined", 1, 1, pshader_hw_tex, pshader_glsl_tex, 0, WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEX, "texld", "undefined", 1, 2, pshader_hw_tex, pshader_glsl_tex, WINED3DPS_VERSION(1,4), WINED3DPS_VERSION(1,4)},
|
|
|
|
{WINED3DSIO_TEX, "texld", "undefined", 1, 3, pshader_hw_tex, pshader_glsl_tex, WINED3DPS_VERSION(2,0), -1},
|
|
|
|
{WINED3DSIO_TEXBEM, "texbem", "undefined", 1, 2, pshader_hw_texbem, pshader_glsl_texbem, 0, WINED3DPS_VERSION(1,3)},
|
2007-09-01 20:11:17 +02:00
|
|
|
{WINED3DSIO_TEXBEML, "texbeml", GLNAME_REQUIRE_GLSL, 1, 2, pshader_hw_texbem, pshader_glsl_texbem, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
2007-07-22 21:41:29 +02:00
|
|
|
{WINED3DSIO_TEXREG2AR,"texreg2ar","undefined", 1, 2, pshader_hw_texreg2ar, pshader_glsl_texreg2ar, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXREG2GB,"texreg2gb","undefined", 1, 2, pshader_hw_texreg2gb, pshader_glsl_texreg2gb, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
2007-09-05 17:05:58 +02:00
|
|
|
{WINED3DSIO_TEXREG2RGB, "texreg2rgb", "undefined", 1, 2, pshader_hw_texreg2rgb, pshader_glsl_texreg2rgb, WINED3DPS_VERSION(1,2), WINED3DPS_VERSION(1,3)},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_TEXM3x2PAD, "texm3x2pad", "undefined", 1, 2, pshader_hw_texm3x2pad, pshader_glsl_texm3x2pad, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x2TEX, "texm3x2tex", "undefined", 1, 2, pshader_hw_texm3x2tex, pshader_glsl_texm3x2tex, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x3PAD, "texm3x3pad", "undefined", 1, 2, pshader_hw_texm3x3pad, pshader_glsl_texm3x3pad, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x3DIFF, "texm3x3diff", GLNAME_REQUIRE_GLSL, 1, 2, NULL, NULL, WINED3DPS_VERSION(0,0), WINED3DPS_VERSION(0,0)},
|
|
|
|
{WINED3DSIO_TEXM3x3SPEC, "texm3x3spec", "undefined", 1, 3, pshader_hw_texm3x3spec, pshader_glsl_texm3x3spec, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x3VSPEC, "texm3x3vspec", "undefined", 1, 2, pshader_hw_texm3x3vspec, pshader_glsl_texm3x3vspec, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x3TEX, "texm3x3tex", "undefined", 1, 2, pshader_hw_texm3x3tex, pshader_glsl_texm3x3tex, WINED3DPS_VERSION(1,0), WINED3DPS_VERSION(1,3)},
|
2007-09-25 01:00:27 +02:00
|
|
|
{WINED3DSIO_TEXDP3TEX, "texdp3tex", NULL, 1, 2, pshader_hw_texdp3tex, pshader_glsl_texdp3tex, WINED3DPS_VERSION(1,2), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x2DEPTH, "texm3x2depth", GLNAME_REQUIRE_GLSL, 1, 2, pshader_hw_texm3x2depth, pshader_glsl_texm3x2depth, WINED3DPS_VERSION(1,3), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXDP3, "texdp3", NULL, 1, 2, pshader_hw_texdp3, pshader_glsl_texdp3, WINED3DPS_VERSION(1,2), WINED3DPS_VERSION(1,3)},
|
|
|
|
{WINED3DSIO_TEXM3x3, "texm3x3", NULL, 1, 2, pshader_hw_texm3x3, pshader_glsl_texm3x3, WINED3DPS_VERSION(1,2), WINED3DPS_VERSION(1,3)},
|
2007-08-31 17:00:16 +02:00
|
|
|
{WINED3DSIO_TEXDEPTH, "texdepth", NULL, 1, 1, pshader_hw_texdepth, pshader_glsl_texdepth, WINED3DPS_VERSION(1,4), WINED3DPS_VERSION(1,4)},
|
2007-03-26 23:34:32 +02:00
|
|
|
{WINED3DSIO_BEM, "bem", "undefined", 1, 3, pshader_hw_bem, pshader_glsl_bem, WINED3DPS_VERSION(1,4), WINED3DPS_VERSION(1,4)},
|
2007-07-03 00:22:18 +02:00
|
|
|
{WINED3DSIO_DSX, "dsx", NULL, 1, 2, NULL, shader_glsl_map2gl, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_DSY, "dsy", NULL, 1, 2, NULL, shader_glsl_map2gl, WINED3DPS_VERSION(2,1), -1},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_TEXLDD, "texldd", GLNAME_REQUIRE_GLSL, 1, 5, NULL, NULL, WINED3DPS_VERSION(2,1), -1},
|
|
|
|
{WINED3DSIO_SETP, "setp", GLNAME_REQUIRE_GLSL, 1, 3, NULL, NULL, 0, 0},
|
2007-06-27 23:46:53 +02:00
|
|
|
{WINED3DSIO_TEXLDL, "texldl", NULL, 1, 3, NULL, shader_glsl_texldl, WINED3DPS_VERSION(3,0), -1},
|
2007-03-06 22:35:23 +01:00
|
|
|
{WINED3DSIO_PHASE, "phase", GLNAME_REQUIRE_GLSL, 0, 0, NULL, NULL, 0, 0},
|
2006-06-12 12:57:04 +02:00
|
|
|
{0, NULL, NULL, 0, 0, NULL, NULL, 0, 0}
|
2005-11-21 17:27:55 +01:00
|
|
|
};
|
|
|
|
|
2006-06-12 08:54:30 +02:00
|
|
|
static void pshader_set_limits(
|
|
|
|
IWineD3DPixelShaderImpl *This) {
|
2006-05-08 23:09:21 +02:00
|
|
|
|
2006-05-26 17:52:33 +02:00
|
|
|
This->baseShader.limits.attributes = 0;
|
2006-05-08 23:09:21 +02:00
|
|
|
This->baseShader.limits.address = 0;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_output = 0;
|
2006-05-08 23:09:21 +02:00
|
|
|
|
2006-06-12 08:54:30 +02:00
|
|
|
switch (This->baseShader.hex_version) {
|
2006-10-13 05:36:41 +02:00
|
|
|
case WINED3DPS_VERSION(1,0):
|
|
|
|
case WINED3DPS_VERSION(1,1):
|
|
|
|
case WINED3DPS_VERSION(1,2):
|
|
|
|
case WINED3DPS_VERSION(1,3):
|
2006-06-12 08:54:30 +02:00
|
|
|
This->baseShader.limits.temporary = 2;
|
2006-05-08 23:09:21 +02:00
|
|
|
This->baseShader.limits.constant_float = 8;
|
|
|
|
This->baseShader.limits.constant_int = 0;
|
|
|
|
This->baseShader.limits.constant_bool = 0;
|
2006-06-12 08:59:16 +02:00
|
|
|
This->baseShader.limits.texcoord = 4;
|
|
|
|
This->baseShader.limits.sampler = 4;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_input = 0;
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.label = 0;
|
2006-05-08 23:09:21 +02:00
|
|
|
break;
|
|
|
|
|
2006-10-13 05:36:41 +02:00
|
|
|
case WINED3DPS_VERSION(1,4):
|
2006-06-12 08:54:30 +02:00
|
|
|
This->baseShader.limits.temporary = 6;
|
2006-05-08 23:09:21 +02:00
|
|
|
This->baseShader.limits.constant_float = 8;
|
|
|
|
This->baseShader.limits.constant_int = 0;
|
|
|
|
This->baseShader.limits.constant_bool = 0;
|
2006-06-12 08:59:16 +02:00
|
|
|
This->baseShader.limits.texcoord = 6;
|
|
|
|
This->baseShader.limits.sampler = 6;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_input = 0;
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.label = 0;
|
2006-05-08 23:09:21 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
/* FIXME: temporaries must match D3DPSHADERCAPS2_0.NumTemps */
|
2006-10-13 05:36:41 +02:00
|
|
|
case WINED3DPS_VERSION(2,0):
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.temporary = 32;
|
|
|
|
This->baseShader.limits.constant_float = 32;
|
|
|
|
This->baseShader.limits.constant_int = 16;
|
|
|
|
This->baseShader.limits.constant_bool = 16;
|
|
|
|
This->baseShader.limits.texcoord = 8;
|
|
|
|
This->baseShader.limits.sampler = 16;
|
|
|
|
This->baseShader.limits.packed_input = 0;
|
|
|
|
break;
|
|
|
|
|
2006-10-13 05:36:41 +02:00
|
|
|
case WINED3DPS_VERSION(2,1):
|
2006-06-12 08:54:30 +02:00
|
|
|
This->baseShader.limits.temporary = 32;
|
2006-05-08 23:09:21 +02:00
|
|
|
This->baseShader.limits.constant_float = 32;
|
|
|
|
This->baseShader.limits.constant_int = 16;
|
|
|
|
This->baseShader.limits.constant_bool = 16;
|
2006-06-12 08:59:16 +02:00
|
|
|
This->baseShader.limits.texcoord = 8;
|
|
|
|
This->baseShader.limits.sampler = 16;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_input = 0;
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.label = 16;
|
2006-05-08 23:09:21 +02:00
|
|
|
break;
|
|
|
|
|
2006-10-13 05:36:41 +02:00
|
|
|
case WINED3DPS_VERSION(3,0):
|
2006-06-12 08:54:30 +02:00
|
|
|
This->baseShader.limits.temporary = 32;
|
2006-05-08 23:09:21 +02:00
|
|
|
This->baseShader.limits.constant_float = 224;
|
|
|
|
This->baseShader.limits.constant_int = 16;
|
|
|
|
This->baseShader.limits.constant_bool = 16;
|
2006-06-12 08:59:16 +02:00
|
|
|
This->baseShader.limits.texcoord = 0;
|
|
|
|
This->baseShader.limits.sampler = 16;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_input = 12;
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.label = 16; /* FIXME: 2048 */
|
2006-05-08 23:09:21 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
default: This->baseShader.limits.temporary = 32;
|
2006-06-12 08:59:16 +02:00
|
|
|
This->baseShader.limits.constant_float = 32;
|
|
|
|
This->baseShader.limits.constant_int = 16;
|
|
|
|
This->baseShader.limits.constant_bool = 16;
|
|
|
|
This->baseShader.limits.texcoord = 8;
|
|
|
|
This->baseShader.limits.sampler = 16;
|
2006-06-12 08:57:07 +02:00
|
|
|
This->baseShader.limits.packed_input = 0;
|
2006-07-10 12:35:15 +02:00
|
|
|
This->baseShader.limits.label = 0;
|
2006-10-01 05:20:10 +02:00
|
|
|
FIXME("Unrecognized pixel shader version %#x\n",
|
2006-06-12 08:54:30 +02:00
|
|
|
This->baseShader.hex_version);
|
2006-05-08 23:09:21 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-05-10 04:39:02 +02:00
|
|
|
/** Generate a pixel shader string using either GL_FRAGMENT_PROGRAM_ARB
|
|
|
|
or GLSL and send it to the card */
|
2007-03-17 11:39:40 +01:00
|
|
|
static inline VOID IWineD3DPixelShaderImpl_GenerateShader(
|
2006-05-10 04:39:02 +02:00
|
|
|
IWineD3DPixelShader *iface,
|
2006-07-04 10:01:46 +02:00
|
|
|
shader_reg_maps* reg_maps,
|
2006-05-10 04:39:02 +02:00
|
|
|
CONST DWORD *pFunction) {
|
|
|
|
|
|
|
|
IWineD3DPixelShaderImpl *This = (IWineD3DPixelShaderImpl *)iface;
|
|
|
|
SHADER_BUFFER buffer;
|
|
|
|
|
|
|
|
#if 0 /* FIXME: Use the buffer that is held by the device, this is ok since fixups will be skipped for software shaders
|
|
|
|
it also requires entering a critical section but cuts down the runtime footprint of wined3d and any memory fragmentation that may occur... */
|
|
|
|
if (This->device->fixupVertexBufferSize < SHADER_PGMSIZE) {
|
|
|
|
HeapFree(GetProcessHeap(), 0, This->fixupVertexBuffer);
|
|
|
|
This->fixupVertexBuffer = HeapAlloc(GetProcessHeap() , 0, SHADER_PGMSIZE);
|
|
|
|
This->fixupVertexBufferSize = PGMSIZE;
|
|
|
|
This->fixupVertexBuffer[0] = 0;
|
|
|
|
}
|
|
|
|
buffer.buffer = This->device->fixupVertexBuffer;
|
|
|
|
#else
|
|
|
|
buffer.buffer = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, SHADER_PGMSIZE);
|
|
|
|
#endif
|
|
|
|
buffer.bsize = 0;
|
|
|
|
buffer.lineNo = 0;
|
2007-01-15 19:30:41 +01:00
|
|
|
buffer.newline = TRUE;
|
2006-05-10 04:39:02 +02:00
|
|
|
|
wined3d: Rework shader mode selection.
- currently half the shader selection code (GLSL vs ARB) is in
fillGLcaps. The parts that check for software shaders are in
GetDeviceCaps. That placement, will work, but is definitely not optimal.
FillGLcaps should detect support - it should not make decision as to
what's used, because that's not what the purpose of the function is.
GetDeviceCaps should report support as it has already been selected.
Instead, select shader mode in its own function, called in the
appropriate places.
- unifying pixel and vertex shaders into a single selection is a
mistake. A software vertex shader can be coupled with a hardware arb or
glsl pixel shader, or no shader at all. Split them back into two and add
a SHADER_NONE variant.
- drawprim is doing support checks for ARB_PROGRAM, and making shader
decisions based on that - that's wrong, support has already been
checked, and decided upon, and shaders can be implemented via software,
ARB_PROGRAm or GLSL, so that support check isn't valid.
- Store the shader selected mode into the shader itself. Different types
of shaders can be combined, so this is an improvement. In fact, storing
the mode into the settings globally is a mistake as well - it should be
done per device, since different cards have different capabilities.
2006-07-04 09:21:53 +02:00
|
|
|
if (This->baseShader.shader_mode == SHADER_GLSL) {
|
2006-05-26 17:52:33 +02:00
|
|
|
|
|
|
|
/* Create the hw GLSL shader object and assign it as the baseShader.prgId */
|
|
|
|
GLhandleARB shader_obj = GL_EXTCALL(glCreateShaderObjectARB(GL_FRAGMENT_SHADER_ARB));
|
|
|
|
|
2006-10-02 20:06:38 +02:00
|
|
|
if (GL_SUPPORT(ARB_DRAW_BUFFERS)) {
|
|
|
|
shader_addline(&buffer, "#extension GL_ARB_draw_buffers : enable\n");
|
|
|
|
}
|
|
|
|
|
2006-06-12 08:55:30 +02:00
|
|
|
/* Base Declarations */
|
2006-07-19 06:06:07 +02:00
|
|
|
shader_generate_glsl_declarations( (IWineD3DBaseShader*) This, reg_maps, &buffer, &GLINFO_LOCATION);
|
2006-06-12 08:55:30 +02:00
|
|
|
|
2006-06-12 08:57:07 +02:00
|
|
|
/* Pack 3.0 inputs */
|
2007-11-08 23:41:59 +01:00
|
|
|
if (This->baseShader.hex_version >= WINED3DPS_VERSION(3,0)) {
|
2007-10-26 02:11:00 +02:00
|
|
|
|
|
|
|
if(((IWineD3DDeviceImpl *) This->baseShader.device)->strided_streams.u.s.position_transformed) {
|
|
|
|
This->vertexprocessing = pretransformed;
|
2007-11-08 23:41:59 +01:00
|
|
|
pshader_glsl_input_pack(&buffer, This->semantics_in, iface);
|
2007-10-26 02:11:00 +02:00
|
|
|
} else if(!use_vs((IWineD3DDeviceImpl *) This->baseShader.device)) {
|
|
|
|
This->vertexprocessing = fixedfunction;
|
2007-11-08 23:41:59 +01:00
|
|
|
pshader_glsl_input_pack(&buffer, This->semantics_in, iface);
|
2007-10-26 02:11:00 +02:00
|
|
|
} else {
|
|
|
|
This->vertexprocessing = vertexshader;
|
|
|
|
}
|
|
|
|
}
|
2006-06-12 08:57:07 +02:00
|
|
|
|
2006-06-12 08:53:32 +02:00
|
|
|
/* Base Shader Body */
|
2006-07-04 10:01:46 +02:00
|
|
|
shader_generate_main( (IWineD3DBaseShader*) This, &buffer, reg_maps, pFunction);
|
2006-05-26 17:52:33 +02:00
|
|
|
|
|
|
|
/* Pixel shaders < 2.0 place the resulting color in R0 implicitly */
|
2006-10-13 05:36:41 +02:00
|
|
|
if (This->baseShader.hex_version < WINED3DPS_VERSION(2,0)) {
|
2006-08-09 18:24:08 +02:00
|
|
|
/* Some older cards like GeforceFX ones don't support multiple buffers, so also not gl_FragData */
|
|
|
|
if(GL_SUPPORT(ARB_DRAW_BUFFERS))
|
|
|
|
shader_addline(&buffer, "gl_FragData[0] = R0;\n");
|
|
|
|
else
|
|
|
|
shader_addline(&buffer, "gl_FragColor = R0;\n");
|
|
|
|
}
|
2007-03-22 17:32:48 +01:00
|
|
|
|
|
|
|
/* Pixel shader < 3.0 do not replace the fog stage.
|
|
|
|
* This implements linear fog computation and blending.
|
|
|
|
* TODO: non linear fog
|
|
|
|
* NOTE: gl_Fog.start and gl_Fog.end don't hold fog start s and end e but
|
|
|
|
* -1/(e-s) and e/(e-s) respectively.
|
|
|
|
*/
|
|
|
|
if(This->baseShader.hex_version < WINED3DPS_VERSION(3,0)) {
|
|
|
|
shader_addline(&buffer, "float Fog = clamp(gl_FogFragCoord * gl_Fog.start + gl_Fog.end, 0.0, 1.0);\n");
|
|
|
|
if(GL_SUPPORT(ARB_DRAW_BUFFERS))
|
|
|
|
shader_addline(&buffer, "gl_FragData[0].xyz = mix(gl_Fog.color.xyz, gl_FragData[0].xyz, Fog);\n");
|
|
|
|
else
|
|
|
|
shader_addline(&buffer, "gl_FragColor.xyz = mix(gl_Fog.color.xyz, gl_FragColor.xyz, Fog);\n");
|
|
|
|
}
|
2007-09-14 13:02:59 +02:00
|
|
|
if(This->srgb_enabled) {
|
|
|
|
const char *fragcolor;
|
|
|
|
|
|
|
|
if(GL_SUPPORT(ARB_DRAW_BUFFERS)) {
|
|
|
|
fragcolor = "gl_FragData[0]";
|
|
|
|
} else {
|
|
|
|
fragcolor = "gl_FragColor";
|
|
|
|
}
|
|
|
|
shader_addline(&buffer, "tmp0.xyz = pow(%s.xyz, vec3(%f, %f, %f)) * vec3(%f, %f, %f) - vec3(%f, %f, %f);\n",
|
|
|
|
fragcolor, srgb_pow, srgb_pow, srgb_pow, srgb_mul_high, srgb_mul_high, srgb_mul_high,
|
|
|
|
srgb_sub_high, srgb_sub_high, srgb_sub_high);
|
|
|
|
shader_addline(&buffer, "tmp1.xyz = %s.xyz * srgb_mul_low.xyz;\n", fragcolor);
|
|
|
|
shader_addline(&buffer, "%s.x = %s.x < srgb_comparison.x ? tmp1.x : tmp0.x;\n", fragcolor, fragcolor);
|
|
|
|
shader_addline(&buffer, "%s.y = %s.y < srgb_comparison.y ? tmp1.y : tmp0.y;\n", fragcolor, fragcolor);
|
|
|
|
shader_addline(&buffer, "%s.z = %s.z < srgb_comparison.z ? tmp1.z : tmp0.z;\n", fragcolor, fragcolor);
|
|
|
|
shader_addline(&buffer, "%s = clamp(%s, 0.0, 1.0);\n", fragcolor, fragcolor);
|
|
|
|
}
|
2007-03-22 17:32:48 +01:00
|
|
|
|
2006-10-15 17:06:44 +02:00
|
|
|
shader_addline(&buffer, "}\n");
|
2006-05-26 17:52:33 +02:00
|
|
|
|
|
|
|
TRACE("Compiling shader object %u\n", shader_obj);
|
|
|
|
GL_EXTCALL(glShaderSourceARB(shader_obj, 1, (const char**)&buffer.buffer, NULL));
|
|
|
|
GL_EXTCALL(glCompileShaderARB(shader_obj));
|
|
|
|
print_glsl_info_log(&GLINFO_LOCATION, shader_obj);
|
|
|
|
|
|
|
|
/* Store the shader object */
|
|
|
|
This->baseShader.prgId = shader_obj;
|
|
|
|
|
2006-10-08 05:25:01 +02:00
|
|
|
} else if (This->baseShader.shader_mode == SHADER_ARB) {
|
2006-05-10 04:39:02 +02:00
|
|
|
/* Create the hw ARB shader */
|
|
|
|
shader_addline(&buffer, "!!ARBfp1.0\n");
|
|
|
|
|
|
|
|
shader_addline(&buffer, "TEMP TMP;\n"); /* Used in matrix ops */
|
|
|
|
shader_addline(&buffer, "TEMP TMP2;\n"); /* Used in matrix ops */
|
|
|
|
shader_addline(&buffer, "TEMP TA;\n"); /* Used for modifiers */
|
|
|
|
shader_addline(&buffer, "TEMP TB;\n"); /* Used for modifiers */
|
|
|
|
shader_addline(&buffer, "TEMP TC;\n"); /* Used for modifiers */
|
|
|
|
shader_addline(&buffer, "PARAM coefdiv = { 0.5, 0.25, 0.125, 0.0625 };\n");
|
|
|
|
shader_addline(&buffer, "PARAM coefmul = { 2, 4, 8, 16 };\n");
|
|
|
|
shader_addline(&buffer, "PARAM one = { 1.0, 1.0, 1.0, 1.0 };\n");
|
|
|
|
|
2006-06-12 08:55:30 +02:00
|
|
|
/* Base Declarations */
|
2006-07-19 06:06:07 +02:00
|
|
|
shader_generate_arb_declarations( (IWineD3DBaseShader*) This, reg_maps, &buffer, &GLINFO_LOCATION);
|
2006-06-12 08:55:30 +02:00
|
|
|
|
2007-03-22 17:32:48 +01:00
|
|
|
/* We need two variables for fog blending */
|
|
|
|
shader_addline(&buffer, "TEMP TMP_FOG;\n");
|
|
|
|
if (This->baseShader.hex_version >= WINED3DPS_VERSION(2,0)) {
|
|
|
|
shader_addline(&buffer, "TEMP TMP_COLOR;\n");
|
|
|
|
}
|
|
|
|
|
2006-06-12 08:53:32 +02:00
|
|
|
/* Base Shader Body */
|
2006-07-04 10:01:46 +02:00
|
|
|
shader_generate_main( (IWineD3DBaseShader*) This, &buffer, reg_maps, pFunction);
|
2006-05-10 04:39:02 +02:00
|
|
|
|
2007-03-22 17:32:48 +01:00
|
|
|
/* calculate fog and blend it
|
|
|
|
* NOTE: state.fog.params.y and state.fog.params.z don't hold fog start s and end e but
|
|
|
|
* -1/(e-s) and e/(e-s) respectively.
|
|
|
|
*/
|
|
|
|
shader_addline(&buffer, "MAD_SAT TMP_FOG, fragment.fogcoord, state.fog.params.y, state.fog.params.z;\n");
|
2007-09-14 13:02:59 +02:00
|
|
|
|
|
|
|
if(This->srgb_enabled) {
|
|
|
|
if (This->baseShader.hex_version < WINED3DPS_VERSION(2,0)) {
|
|
|
|
shader_addline(&buffer, "LRP TMP_COLOR.rgb, TMP_FOG.x, R0, state.fog.color;\n");
|
|
|
|
shader_addline(&buffer, "MOV result.color.a, R0.a;\n");
|
|
|
|
} else {
|
|
|
|
shader_addline(&buffer, "LRP TMP_COLOR.rgb, TMP_FOG.x, TMP_COLOR, state.fog.color;\n");
|
|
|
|
shader_addline(&buffer, "MOV result.color.a, TMP_COLOR.a;\n");
|
|
|
|
}
|
|
|
|
/* Perform sRGB write correction. See GLX_EXT_framebuffer_sRGB */
|
|
|
|
|
|
|
|
/* Calculate the > 0.0031308 case */
|
|
|
|
shader_addline(&buffer, "POW TMP.x, TMP_COLOR.x, srgb_pow.x;\n");
|
|
|
|
shader_addline(&buffer, "POW TMP.y, TMP_COLOR.y, srgb_pow.y;\n");
|
|
|
|
shader_addline(&buffer, "POW TMP.z, TMP_COLOR.z, srgb_pow.z;\n");
|
|
|
|
shader_addline(&buffer, "MUL TMP, TMP, srgb_mul_hi;\n");
|
|
|
|
shader_addline(&buffer, "SUB TMP, TMP, srgb_sub_hi;\n");
|
|
|
|
/* Calculate the < case */
|
|
|
|
shader_addline(&buffer, "MUL TMP2, srgb_mul_low, TMP_COLOR;\n");
|
|
|
|
/* Get 1.0 / 0.0 masks for > 0.0031308 and < 0.0031308 */
|
|
|
|
shader_addline(&buffer, "SLT TA, srgb_comparison, TMP_COLOR;\n");
|
|
|
|
shader_addline(&buffer, "SGE TB, srgb_comparison, TMP_COLOR;\n");
|
|
|
|
/* Store the components > 0.0031308 in the destination */
|
|
|
|
shader_addline(&buffer, "MUL TMP_COLOR, TMP, TA;\n");
|
|
|
|
/* Add the components that are < 0.0031308 */
|
|
|
|
shader_addline(&buffer, "MAD result.color.xyz, TMP2, TB, TMP_COLOR;\n");
|
|
|
|
/* [0.0;1.0] clamping. Not needed, this is done implicitly */
|
2007-03-22 17:32:48 +01:00
|
|
|
} else {
|
2007-09-14 13:02:59 +02:00
|
|
|
if (This->baseShader.hex_version < WINED3DPS_VERSION(2,0)) {
|
|
|
|
shader_addline(&buffer, "LRP result.color.rgb, TMP_FOG.x, R0, state.fog.color;\n");
|
|
|
|
shader_addline(&buffer, "MOV result.color.a, R0.a;\n");
|
|
|
|
} else {
|
|
|
|
shader_addline(&buffer, "LRP result.color.rgb, TMP_FOG.x, TMP_COLOR, state.fog.color;\n");
|
|
|
|
shader_addline(&buffer, "MOV result.color.a, TMP_COLOR.a;\n");
|
|
|
|
}
|
2007-03-22 17:32:48 +01:00
|
|
|
}
|
|
|
|
|
2006-10-15 17:06:44 +02:00
|
|
|
shader_addline(&buffer, "END\n");
|
2006-05-10 04:39:02 +02:00
|
|
|
|
|
|
|
/* TODO: change to resource.glObjectHandle or something like that */
|
|
|
|
GL_EXTCALL(glGenProgramsARB(1, &This->baseShader.prgId));
|
|
|
|
|
|
|
|
TRACE("Creating a hw pixel shader, prg=%d\n", This->baseShader.prgId);
|
|
|
|
GL_EXTCALL(glBindProgramARB(GL_FRAGMENT_PROGRAM_ARB, This->baseShader.prgId));
|
|
|
|
|
|
|
|
TRACE("Created hw pixel shader, prg=%d\n", This->baseShader.prgId);
|
|
|
|
/* Create the program and check for errors */
|
|
|
|
GL_EXTCALL(glProgramStringARB(GL_FRAGMENT_PROGRAM_ARB, GL_PROGRAM_FORMAT_ASCII_ARB,
|
|
|
|
buffer.bsize, buffer.buffer));
|
|
|
|
|
|
|
|
if (glGetError() == GL_INVALID_OPERATION) {
|
|
|
|
GLint errPos;
|
|
|
|
glGetIntegerv(GL_PROGRAM_ERROR_POSITION_ARB, &errPos);
|
|
|
|
FIXME("HW PixelShader Error at position %d: %s\n",
|
|
|
|
errPos, debugstr_a((const char *)glGetString(GL_PROGRAM_ERROR_STRING_ARB)));
|
|
|
|
This->baseShader.prgId = -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2007-02-15 03:05:17 +01:00
|
|
|
This->needsbumpmat = reg_maps->bumpmat;
|
|
|
|
|
2006-05-10 04:39:02 +02:00
|
|
|
#if 1 /* if were using the data buffer of device then we don't need to free it */
|
|
|
|
HeapFree(GetProcessHeap(), 0, buffer.buffer);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2006-06-10 13:15:32 +02:00
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_SetFunction(IWineD3DPixelShader *iface, CONST DWORD *pFunction) {
|
2006-06-12 08:54:30 +02:00
|
|
|
|
|
|
|
IWineD3DPixelShaderImpl *This =(IWineD3DPixelShaderImpl *)iface;
|
2006-10-08 05:25:01 +02:00
|
|
|
IWineD3DDeviceImpl *deviceImpl = (IWineD3DDeviceImpl *) This->baseShader.device;
|
2006-06-12 08:54:30 +02:00
|
|
|
|
2006-07-25 00:51:03 +02:00
|
|
|
TRACE("(%p) : pFunction %p\n", iface, pFunction);
|
|
|
|
|
2006-07-04 10:01:46 +02:00
|
|
|
/* First pass: trace shader */
|
2006-06-12 08:54:30 +02:00
|
|
|
shader_trace_init((IWineD3DBaseShader*) This, pFunction);
|
|
|
|
pshader_set_limits(This);
|
2005-11-21 17:27:55 +01:00
|
|
|
|
2006-07-10 06:51:03 +02:00
|
|
|
/* Initialize immediate constant lists */
|
|
|
|
list_init(&This->baseShader.constantsF);
|
|
|
|
list_init(&This->baseShader.constantsB);
|
|
|
|
list_init(&This->baseShader.constantsI);
|
|
|
|
|
2007-06-07 23:52:48 +02:00
|
|
|
if (WINED3DSHADER_VERSION_MAJOR(This->baseShader.hex_version) > 1) {
|
|
|
|
shader_reg_maps *reg_maps = &This->baseShader.reg_maps;
|
|
|
|
HRESULT hr;
|
2007-11-06 12:34:22 +01:00
|
|
|
unsigned int i, j, highest_reg_used = 0, num_regs_used = 0;
|
2007-06-07 23:52:48 +02:00
|
|
|
|
|
|
|
/* Second pass: figure out which registers are used, what the semantics are, etc.. */
|
|
|
|
memset(reg_maps, 0, sizeof(shader_reg_maps));
|
|
|
|
hr = shader_get_registers_used((IWineD3DBaseShader*) This, reg_maps,
|
|
|
|
This->semantics_in, NULL, pFunction, NULL);
|
|
|
|
if (FAILED(hr)) return hr;
|
|
|
|
/* FIXME: validate reg_maps against OpenGL */
|
2007-10-28 00:12:37 +02:00
|
|
|
|
|
|
|
for(i = 0; i < MAX_REG_INPUT; i++) {
|
2007-11-06 12:34:22 +01:00
|
|
|
if(This->input_reg_used[i]) {
|
|
|
|
num_regs_used++;
|
|
|
|
highest_reg_used = i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Don't do any register mapping magic if it is not needed, or if we can't
|
|
|
|
* achive anything anyway
|
|
|
|
*/
|
|
|
|
if(highest_reg_used < (GL_LIMITS(glsl_varyings) / 4) ||
|
2007-11-07 18:22:00 +01:00
|
|
|
num_regs_used > (GL_LIMITS(glsl_varyings) / 4) ) {
|
|
|
|
if(num_regs_used > (GL_LIMITS(glsl_varyings) / 4)) {
|
2007-11-06 12:34:22 +01:00
|
|
|
/* This happens with relative addressing. The input mapper function
|
|
|
|
* warns about this if the higher registers are declared too, so
|
|
|
|
* don't write a FIXME here
|
|
|
|
*/
|
|
|
|
WARN("More varying registers used than supported\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
for(i = 0; i < MAX_REG_INPUT; i++) {
|
|
|
|
This->input_reg_map[i] = i;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
j = 0;
|
|
|
|
for(i = 0; i < MAX_REG_INPUT; i++) {
|
|
|
|
if(This->input_reg_used[i]) {
|
|
|
|
This->input_reg_map[i] = j;
|
|
|
|
j++;
|
|
|
|
} else {
|
|
|
|
This->input_reg_map[i] = -1;
|
|
|
|
}
|
|
|
|
}
|
2007-10-28 00:12:37 +02:00
|
|
|
}
|
2007-06-07 23:52:48 +02:00
|
|
|
}
|
|
|
|
|
2006-10-08 05:25:01 +02:00
|
|
|
This->baseShader.shader_mode = deviceImpl->ps_selected_mode;
|
2005-11-21 17:27:55 +01:00
|
|
|
|
|
|
|
TRACE("(%p) : Copying the function\n", This);
|
|
|
|
if (NULL != pFunction) {
|
2006-11-24 15:15:16 +01:00
|
|
|
void *function;
|
|
|
|
|
|
|
|
function = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, This->baseShader.functionLength);
|
|
|
|
if (!function) return E_OUTOFMEMORY;
|
|
|
|
memcpy(function, pFunction, This->baseShader.functionLength);
|
|
|
|
This->baseShader.function = function;
|
2005-11-21 17:27:55 +01:00
|
|
|
} else {
|
2006-03-30 19:14:31 +02:00
|
|
|
This->baseShader.function = NULL;
|
2005-11-21 17:27:55 +01:00
|
|
|
}
|
|
|
|
|
2006-08-05 18:15:35 +02:00
|
|
|
return WINED3D_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
static HRESULT WINAPI IWineD3DPixelShaderImpl_CompileShader(IWineD3DPixelShader *iface) {
|
2006-09-27 13:14:46 +02:00
|
|
|
|
2006-08-05 18:15:35 +02:00
|
|
|
IWineD3DPixelShaderImpl *This =(IWineD3DPixelShaderImpl *)iface;
|
2006-09-27 13:14:46 +02:00
|
|
|
IWineD3DDeviceImpl *deviceImpl = (IWineD3DDeviceImpl*) This->baseShader.device;
|
2006-08-05 18:15:35 +02:00
|
|
|
CONST DWORD *function = This->baseShader.function;
|
2007-09-21 23:47:40 +02:00
|
|
|
UINT i, sampler;
|
|
|
|
IWineD3DBaseTextureImpl *texture;
|
2006-08-05 18:15:35 +02:00
|
|
|
|
|
|
|
TRACE("(%p) : function %p\n", iface, function);
|
|
|
|
|
2007-09-21 23:47:40 +02:00
|
|
|
/* We're already compiled, but check if any of the hardcoded stateblock assumptions
|
|
|
|
* changed.
|
|
|
|
*/
|
|
|
|
if (This->baseShader.is_compiled) {
|
2007-09-14 13:02:59 +02:00
|
|
|
char srgbenabled = deviceImpl->stateBlock->renderState[WINED3DRS_SRGBWRITEENABLE] ? 1 : 0;
|
2007-09-21 23:47:40 +02:00
|
|
|
for(i = 0; i < This->baseShader.num_sampled_samplers; i++) {
|
|
|
|
sampler = This->baseShader.sampled_samplers[i];
|
|
|
|
texture = (IWineD3DBaseTextureImpl *) deviceImpl->stateBlock->textures[sampler];
|
|
|
|
if(texture && texture->baseTexture.shader_conversion_group != This->baseShader.sampled_format[sampler]) {
|
|
|
|
WARN("Recompiling shader %p due to format change on sampler %d\n", This, sampler);
|
|
|
|
WARN("Old format group %s, new is %s\n",
|
|
|
|
debug_d3dformat(This->baseShader.sampled_format[sampler]),
|
|
|
|
debug_d3dformat(texture->baseTexture.shader_conversion_group));
|
|
|
|
goto recompile;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* TODO: Check projected textures */
|
|
|
|
/* TODO: Check texture types(2D, Cube, 3D) */
|
|
|
|
|
2007-09-14 13:02:59 +02:00
|
|
|
if(srgbenabled != This->srgb_enabled && This->srgb_mode_hardcoded) {
|
|
|
|
WARN("Recompiling shader because srgb correction is different and hardcoded\n");
|
|
|
|
goto recompile;
|
|
|
|
}
|
2007-09-14 13:11:00 +02:00
|
|
|
if(This->baseShader.reg_maps.vpos && !This->vpos_uniform) {
|
|
|
|
if(This->render_offscreen != deviceImpl->render_offscreen ||
|
|
|
|
This->height != ((IWineD3DSurfaceImpl *) deviceImpl->render_targets[0])->currentDesc.Height) {
|
|
|
|
WARN("Recompiling shader because vpos is used, hard compiled and changed\n");
|
|
|
|
goto recompile;
|
2007-10-13 13:03:56 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if(This->baseShader.reg_maps.usesdsy && !This->vpos_uniform) {
|
|
|
|
if(This->render_offscreen ? 0 : 1 != deviceImpl->render_offscreen ? 0 : 1) {
|
|
|
|
WARN("Recompiling shader because dsy is used, hard compiled and render_offscreen changed\n");
|
|
|
|
goto recompile;
|
2007-10-26 02:11:00 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if(This->baseShader.hex_version >= WINED3DPS_VERSION(3,0)) {
|
|
|
|
if(((IWineD3DDeviceImpl *) This->baseShader.device)->strided_streams.u.s.position_transformed &&
|
|
|
|
This->vertexprocessing != pretransformed) {
|
|
|
|
WARN("Recompiling shader because pretransformed vertices are provided, which wasn't the case before\n");
|
|
|
|
goto recompile;
|
|
|
|
} else if(!use_vs((IWineD3DDeviceImpl *) This->baseShader.device) &&
|
|
|
|
This->vertexprocessing != fixedfunction) {
|
|
|
|
WARN("Recompiling shader because fixed function vp is in use, which wasn't the case before\n");
|
|
|
|
goto recompile;
|
|
|
|
} else if(This->vertexprocessing != vertexshader) {
|
|
|
|
WARN("Recompiling shader because vertex shaders are in use, which wasn't the case before\n");
|
|
|
|
goto recompile;
|
2007-09-14 13:11:00 +02:00
|
|
|
}
|
|
|
|
}
|
2007-09-14 13:02:59 +02:00
|
|
|
|
2007-09-21 23:47:40 +02:00
|
|
|
return WINED3D_OK;
|
|
|
|
|
|
|
|
recompile:
|
|
|
|
if(This->baseShader.recompile_count > 50) {
|
|
|
|
FIXME("Shader %p recompiled more than 50 times\n", This);
|
|
|
|
} else {
|
|
|
|
This->baseShader.recompile_count++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (This->baseShader.shader_mode == SHADER_GLSL && This->baseShader.prgId != 0) {
|
|
|
|
destroy_glsl_pshader(This);
|
|
|
|
}
|
|
|
|
}
|
2006-08-05 18:15:35 +02:00
|
|
|
|
|
|
|
/* We don't need to compile */
|
2007-03-06 22:35:23 +01:00
|
|
|
if (!function) {
|
2006-08-05 18:15:35 +02:00
|
|
|
This->baseShader.is_compiled = TRUE;
|
|
|
|
return WINED3D_OK;
|
|
|
|
}
|
|
|
|
|
2007-06-07 23:52:48 +02:00
|
|
|
if (WINED3DSHADER_VERSION_MAJOR(This->baseShader.hex_version) == 1) {
|
|
|
|
shader_reg_maps *reg_maps = &This->baseShader.reg_maps;
|
|
|
|
HRESULT hr;
|
|
|
|
|
|
|
|
/* Second pass: figure out which registers are used, what the semantics are, etc.. */
|
|
|
|
memset(reg_maps, 0, sizeof(shader_reg_maps));
|
|
|
|
hr = shader_get_registers_used((IWineD3DBaseShader*)This, reg_maps,
|
|
|
|
This->semantics_in, NULL, This->baseShader.function, deviceImpl->stateBlock);
|
|
|
|
if (FAILED(hr)) return hr;
|
|
|
|
/* FIXME: validate reg_maps against OpenGL */
|
|
|
|
}
|
2006-08-27 19:16:01 +02:00
|
|
|
|
2007-10-11 18:31:26 +02:00
|
|
|
/* Reset fields tracking stateblock values being hardcoded in the shader */
|
2007-09-21 23:47:40 +02:00
|
|
|
This->baseShader.num_sampled_samplers = 0;
|
|
|
|
|
2006-08-05 18:15:35 +02:00
|
|
|
/* Generate the HW shader */
|
|
|
|
TRACE("(%p) : Generating hardware program\n", This);
|
|
|
|
IWineD3DPixelShaderImpl_GenerateShader(iface, &This->baseShader.reg_maps, function);
|
|
|
|
|
|
|
|
This->baseShader.is_compiled = TRUE;
|
|
|
|
|
2006-04-07 12:51:12 +02:00
|
|
|
return WINED3D_OK;
|
2005-11-21 17:27:55 +01:00
|
|
|
}
|
2005-08-25 21:24:21 +02:00
|
|
|
|
|
|
|
const IWineD3DPixelShaderVtbl IWineD3DPixelShader_Vtbl =
|
|
|
|
{
|
|
|
|
/*** IUnknown methods ***/
|
|
|
|
IWineD3DPixelShaderImpl_QueryInterface,
|
|
|
|
IWineD3DPixelShaderImpl_AddRef,
|
|
|
|
IWineD3DPixelShaderImpl_Release,
|
2006-03-28 21:10:51 +02:00
|
|
|
/*** IWineD3DBase methods ***/
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl_GetParent,
|
2006-03-28 21:10:51 +02:00
|
|
|
/*** IWineD3DBaseShader methods ***/
|
|
|
|
IWineD3DPixelShaderImpl_SetFunction,
|
2006-08-05 18:15:35 +02:00
|
|
|
IWineD3DPixelShaderImpl_CompileShader,
|
2006-03-28 21:10:51 +02:00
|
|
|
/*** IWineD3DPixelShader methods ***/
|
2005-08-25 21:24:21 +02:00
|
|
|
IWineD3DPixelShaderImpl_GetDevice,
|
2006-03-28 21:10:51 +02:00
|
|
|
IWineD3DPixelShaderImpl_GetFunction
|
2005-08-25 21:24:21 +02:00
|
|
|
};
|