ppsspp/GPU/Directx9/ShaderManagerDX9.cpp

699 lines
21 KiB
C++
Raw Normal View History

2013-08-17 11:23:51 +02:00
// Copyright (c) 2012- PPSSPP Project.
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, version 2.0 or later versions.
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License 2.0 for more details.
// A copy of the GPL 2.0 should have been included with the program.
// If not, see http://www.gnu.org/licenses/
// Official git repository and contact information can be found at
// https://github.com/hrydgard/ppsspp and http://www.ppsspp.org/.
#ifdef _WIN32
#define SHADERLOG
#endif
#include <cmath>
2013-08-17 11:23:51 +02:00
#include <map>
#include "gfx/d3d9_shader.h"
#include "Common/Data/Text/I18n.h"
2013-08-17 11:23:51 +02:00
#include "math/lin/matrix4x4.h"
#include "math/math_util.h"
#include "math/dataconv.h"
#include "thin3d/thin3d.h"
#include "Common/Data/Encoding/Utf8.h"
2013-08-17 11:23:51 +02:00
#include "Common/Common.h"
#include "Common/Log.h"
#include "Common/StringUtils.h"
#include "Core/Config.h"
#include "Core/Host.h"
2013-08-17 11:23:51 +02:00
#include "Core/Reporting.h"
#include "GPU/Math3D.h"
2013-08-17 11:23:51 +02:00
#include "GPU/GPUState.h"
#include "GPU/ge_constants.h"
#include "GPU/Common/ShaderUniforms.h"
#include "GPU/Directx9/ShaderManagerDX9.h"
2016-04-10 10:55:13 +02:00
#include "GPU/Directx9/DrawEngineDX9.h"
#include "GPU/Directx9/FramebufferManagerDX9.h"
2013-08-17 11:23:51 +02:00
using namespace Lin;
namespace DX9 {
PSShader::PSShader(LPDIRECT3DDEVICE9 device, FShaderID id, const char *code) : id_(id), shader(nullptr), failed_(false) {
2013-08-17 11:23:51 +02:00
source_ = code;
#ifdef SHADERLOG
OutputDebugString(ConvertUTF8ToWString(code).c_str());
2013-08-17 11:23:51 +02:00
#endif
bool success;
std::string errorMessage;
2013-08-17 11:23:51 +02:00
2017-02-05 20:46:26 +01:00
success = CompilePixelShader(device, code, &shader, NULL, errorMessage);
if (!errorMessage.empty()) {
if (success) {
ERROR_LOG(G3D, "Warnings in shader compilation!");
} else {
ERROR_LOG(G3D, "Error in shader compilation!");
}
ERROR_LOG(G3D, "Messages: %s", errorMessage.c_str());
ERROR_LOG(G3D, "Shader source:\n%s", LineNumberString(code).c_str());
OutputDebugStringUTF8("Messages:\n");
OutputDebugStringUTF8(errorMessage.c_str());
Reporting::ReportMessage("D3D error in shader compilation: info: %s / code: %s", errorMessage.c_str(), code);
}
2013-08-17 11:23:51 +02:00
if (!success) {
failed_ = true;
2014-09-07 10:38:49 -07:00
if (shader)
shader->Release();
2013-08-17 11:23:51 +02:00
shader = NULL;
return;
2013-08-17 11:23:51 +02:00
} else {
VERBOSE_LOG(G3D, "Compiled pixel shader:\n%s\n", (const char *)code);
2013-08-17 11:23:51 +02:00
}
}
PSShader::~PSShader() {
if (shader)
shader->Release();
}
std::string PSShader::GetShaderString(DebugShaderStringType type) const {
switch (type) {
case SHADER_STRING_SOURCE_CODE:
return source_;
case SHADER_STRING_SHORT_DESC:
return FragmentShaderDesc(id_);
default:
return "N/A";
}
}
VSShader::VSShader(LPDIRECT3DDEVICE9 device, VShaderID id, const char *code, bool useHWTransform) : id_(id), shader(nullptr), failed_(false), useHWTransform_(useHWTransform) {
2013-08-17 11:23:51 +02:00
source_ = code;
#ifdef SHADERLOG
OutputDebugString(ConvertUTF8ToWString(code).c_str());
2013-08-17 11:23:51 +02:00
#endif
bool success;
std::string errorMessage;
2013-08-17 11:23:51 +02:00
2017-02-05 20:46:26 +01:00
success = CompileVertexShader(device, code, &shader, NULL, errorMessage);
if (!errorMessage.empty()) {
if (success) {
ERROR_LOG(G3D, "Warnings in shader compilation!");
} else {
ERROR_LOG(G3D, "Error in shader compilation!");
}
ERROR_LOG(G3D, "Messages: %s", errorMessage.c_str());
ERROR_LOG(G3D, "Shader source:\n%s", code);
OutputDebugStringUTF8("Messages:\n");
OutputDebugStringUTF8(errorMessage.c_str());
Reporting::ReportMessage("D3D error in shader compilation: info: %s / code: %s", errorMessage.c_str(), code);
}
2013-08-17 11:23:51 +02:00
if (!success) {
failed_ = true;
2014-09-07 10:38:49 -07:00
if (shader)
shader->Release();
2013-08-17 11:23:51 +02:00
shader = NULL;
return;
2013-08-17 11:23:51 +02:00
} else {
VERBOSE_LOG(G3D, "Compiled vertex shader:\n%s\n", (const char *)code);
2013-08-17 11:23:51 +02:00
}
}
VSShader::~VSShader() {
if (shader)
shader->Release();
}
std::string VSShader::GetShaderString(DebugShaderStringType type) const {
switch (type) {
case SHADER_STRING_SOURCE_CODE:
return source_;
case SHADER_STRING_SHORT_DESC:
return VertexShaderDesc(id_);
default:
return "N/A";
}
}
void ShaderManagerDX9::PSSetColorUniform3(int creg, u32 color) {
float f[4];
Uint8x3ToFloat4(f, color);
device_->SetPixelShaderConstantF(creg, f, 1);
}
void ShaderManagerDX9::PSSetColorUniform3Alpha255(int creg, u32 color, u8 alpha) {
const float col[4] = {
(float)((color & 0xFF)),
(float)((color & 0xFF00) >> 8),
(float)((color & 0xFF0000) >> 16),
(float)alpha,
};
device_->SetPixelShaderConstantF(creg, col, 1);
2013-08-23 14:29:33 +02:00
}
void ShaderManagerDX9::PSSetFloat(int creg, float value) {
const float f[4] = { value, 0.0f, 0.0f, 0.0f };
device_->SetPixelShaderConstantF(creg, f, 1);
}
void ShaderManagerDX9::PSSetFloatArray(int creg, const float *value, int count) {
float f[4] = { 0.0f, 0.0f, 0.0f, 0.0f };
for (int i = 0; i < count; i++) {
f[i] = value[i];
}
device_->SetPixelShaderConstantF(creg, f, 1);
}
void ShaderManagerDX9::VSSetFloat(int creg, float value) {
const float f[4] = { value, 0.0f, 0.0f, 0.0f };
device_->SetVertexShaderConstantF(creg, f, 1);
}
void ShaderManagerDX9::VSSetFloatArray(int creg, const float *value, int count) {
float f[4] = { 0.0f, 0.0f, 0.0f, 0.0f };
for (int i = 0; i < count; i++) {
f[i] = value[i];
}
device_->SetVertexShaderConstantF(creg, f, 1);
2013-08-23 14:29:33 +02:00
}
2013-08-23 17:11:01 +02:00
// Utility
void ShaderManagerDX9::VSSetColorUniform3(int creg, u32 color) {
float f[4];
Uint8x3ToFloat4(f, color);
device_->SetVertexShaderConstantF(creg, f, 1);
}
2015-08-26 17:45:21 +02:00
void ShaderManagerDX9::VSSetFloatUniform4(int creg, float data[4]) {
device_->SetVertexShaderConstantF(creg, data, 1);
2015-08-26 17:45:21 +02:00
}
void ShaderManagerDX9::VSSetFloat24Uniform3(int creg, const u32 data[3]) {
float f[4];
ExpandFloat24x3ToFloat4(f, data);
device_->SetVertexShaderConstantF(creg, f, 1);
}
2013-08-17 11:23:51 +02:00
void ShaderManagerDX9::VSSetColorUniform3Alpha(int creg, u32 color, u8 alpha) {
float f[4];
Uint8x3ToFloat4_AlphaUint8(f, color, alpha);
device_->SetVertexShaderConstantF(creg, f, 1);
2013-08-23 14:29:33 +02:00
}
void ShaderManagerDX9::VSSetColorUniform3ExtraFloat(int creg, u32 color, float extra) {
2013-08-23 17:11:01 +02:00
const float col[4] = {
((color & 0xFF)) / 255.0f,
((color & 0xFF00) >> 8) / 255.0f,
((color & 0xFF0000) >> 16) / 255.0f,
extra
};
device_->SetVertexShaderConstantF(creg, col, 1);
2013-08-17 11:23:51 +02:00
}
2013-08-23 17:11:01 +02:00
// Utility
void ShaderManagerDX9::VSSetMatrix4x3(int creg, const float *m4x3) {
2013-08-23 17:11:01 +02:00
float m4x4[16];
ConvertMatrix4x3To4x4Transposed(m4x4, m4x3);
device_->SetVertexShaderConstantF(creg, m4x4, 4);
2013-08-17 11:23:51 +02:00
}
void ShaderManagerDX9::VSSetMatrix4x3_3(int creg, const float *m4x3) {
float m3x4[12];
ConvertMatrix4x3To3x4Transposed(m3x4, m4x3);
device_->SetVertexShaderConstantF(creg, m3x4, 3);
}
void ShaderManagerDX9::VSSetMatrix(int creg, const float* pMatrix) {
float transp[16];
Transpose4x4(transp, pMatrix);
device_->SetVertexShaderConstantF(creg, transp, 4);
2013-08-17 11:23:51 +02:00
}
// Depth in ogl is between -1;1 we need between 0;1 and optionally reverse it
static void ConvertProjMatrixToD3D(Matrix4x4 &in, bool invertedX, bool invertedY) {
// Half pixel offset hack
2017-05-23 23:45:55 -07:00
float xoff = 1.0f / gstate_c.curRTRenderWidth;
2020-01-26 16:34:46 +01:00
if (invertedX) {
xoff = -gstate_c.vpXOffset - xoff;
} else {
xoff = gstate_c.vpXOffset - xoff;
}
2020-01-26 16:34:46 +01:00
float yoff = -1.0f / gstate_c.curRTRenderHeight;
if (invertedY) {
yoff = -gstate_c.vpYOffset - yoff;
} else {
yoff = gstate_c.vpYOffset - yoff;
2020-01-26 16:34:46 +01:00
}
const Vec3 trans(xoff, yoff, gstate_c.vpZOffset * 0.5f + 0.5f);
const Vec3 scale(gstate_c.vpWidthScale, gstate_c.vpHeightScale, gstate_c.vpDepthScale * 0.5f);
in.translateAndScale(trans, scale);
}
static void ConvertProjMatrixToD3DThrough(Matrix4x4 &in) {
2017-05-23 23:45:55 -07:00
float xoff = -1.0f / gstate_c.curRTRenderWidth;
float yoff = 1.0f / gstate_c.curRTRenderHeight;
in.translateAndScale(Vec3(xoff, yoff, 0.5f), Vec3(1.0f, 1.0f, 0.5f));
2013-08-17 11:23:51 +02:00
}
2017-01-24 14:16:51 +01:00
const uint64_t psUniforms = DIRTY_TEXENV | DIRTY_ALPHACOLORREF | DIRTY_ALPHACOLORMASK | DIRTY_FOGCOLOR | DIRTY_STENCILREPLACEVALUE | DIRTY_SHADERBLEND | DIRTY_TEXCLAMP;
void ShaderManagerDX9::PSUpdateUniforms(u64 dirtyUniforms) {
if (dirtyUniforms & DIRTY_TEXENV) {
2014-09-10 13:48:55 +02:00
PSSetColorUniform3(CONST_PS_TEXENV, gstate.texenvcolor);
}
if (dirtyUniforms & DIRTY_ALPHACOLORREF) {
PSSetColorUniform3Alpha255(CONST_PS_ALPHACOLORREF, gstate.getColorTestRef(), gstate.getAlphaTestRef() & gstate.getAlphaTestMask());
}
if (dirtyUniforms & DIRTY_ALPHACOLORMASK) {
PSSetColorUniform3Alpha255(CONST_PS_ALPHACOLORMASK, gstate.colortestmask, gstate.getAlphaTestMask());
}
if (dirtyUniforms & DIRTY_FOGCOLOR) {
2014-09-10 13:48:55 +02:00
PSSetColorUniform3(CONST_PS_FOGCOLOR, gstate.fogcolor);
}
if (dirtyUniforms & DIRTY_STENCILREPLACEVALUE) {
PSSetFloat(CONST_PS_STENCILREPLACE, (float)gstate.getStencilTestRef() * (1.0f / 255.0f));
}
if (dirtyUniforms & DIRTY_SHADERBLEND) {
PSSetColorUniform3(CONST_PS_BLENDFIXA, gstate.getFixA());
PSSetColorUniform3(CONST_PS_BLENDFIXB, gstate.getFixB());
const float fbotexSize[2] = {
1.0f / (float)gstate_c.curRTRenderWidth,
1.0f / (float)gstate_c.curRTRenderHeight,
};
PSSetFloatArray(CONST_PS_FBOTEXSIZE, fbotexSize, 2);
}
if (dirtyUniforms & DIRTY_TEXCLAMP) {
const float invW = 1.0f / (float)gstate_c.curTextureWidth;
const float invH = 1.0f / (float)gstate_c.curTextureHeight;
const int w = gstate.getTextureWidth(0);
const int h = gstate.getTextureHeight(0);
const float widthFactor = (float)w * invW;
const float heightFactor = (float)h * invH;
// First wrap xy, then half texel xy (for clamp.)
const float texclamp[4] = {
widthFactor,
heightFactor,
invW * 0.5f,
invH * 0.5f,
};
const float texclampoff[2] = {
gstate_c.curTextureXOffset * invW,
gstate_c.curTextureYOffset * invH,
};
PSSetFloatArray(CONST_PS_TEXCLAMP, texclamp, 4);
PSSetFloatArray(CONST_PS_TEXCLAMPOFF, texclampoff, 2);
}
2013-08-23 17:11:01 +02:00
}
2017-01-24 14:16:51 +01:00
const uint64_t vsUniforms = DIRTY_PROJMATRIX | DIRTY_PROJTHROUGHMATRIX | DIRTY_WORLDMATRIX | DIRTY_VIEWMATRIX | DIRTY_TEXMATRIX |
2018-09-16 23:40:30 -07:00
DIRTY_FOGCOEF | DIRTY_BONE_UNIFORMS | DIRTY_UVSCALEOFFSET | DIRTY_DEPTHRANGE | DIRTY_CULLRANGE |
2017-01-24 14:16:51 +01:00
DIRTY_AMBIENT | DIRTY_MATAMBIENTALPHA | DIRTY_MATSPECULAR | DIRTY_MATDIFFUSE | DIRTY_MATEMISSIVE | DIRTY_LIGHT0 | DIRTY_LIGHT1 | DIRTY_LIGHT2 | DIRTY_LIGHT3;
void ShaderManagerDX9::VSUpdateUniforms(u64 dirtyUniforms) {
2013-08-17 11:23:51 +02:00
// Update any dirty uniforms before we draw
if (dirtyUniforms & DIRTY_PROJMATRIX) {
2013-08-17 11:23:51 +02:00
Matrix4x4 flippedMatrix;
memcpy(&flippedMatrix, gstate.projMatrix, 16 * sizeof(float));
const bool invertedY = gstate_c.vpHeight < 0;
2014-09-24 23:09:09 -07:00
if (!invertedY) {
flippedMatrix[1] = -flippedMatrix[1];
2013-08-17 11:23:51 +02:00
flippedMatrix[5] = -flippedMatrix[5];
flippedMatrix[9] = -flippedMatrix[9];
2013-08-17 11:23:51 +02:00
flippedMatrix[13] = -flippedMatrix[13];
}
const bool invertedX = gstate_c.vpWidth < 0;
if (invertedX) {
2013-08-17 11:23:51 +02:00
flippedMatrix[0] = -flippedMatrix[0];
flippedMatrix[4] = -flippedMatrix[4];
flippedMatrix[8] = -flippedMatrix[8];
2013-08-17 11:23:51 +02:00
flippedMatrix[12] = -flippedMatrix[12];
}
ConvertProjMatrixToD3D(flippedMatrix, invertedX, invertedY);
2013-08-17 11:23:51 +02:00
2014-09-10 13:48:55 +02:00
VSSetMatrix(CONST_VS_PROJ, flippedMatrix.getReadPtr());
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_PROJTHROUGHMATRIX) {
2013-08-17 11:23:51 +02:00
Matrix4x4 proj_through;
proj_through.setOrtho(0.0f, gstate_c.curRTWidth, gstate_c.curRTHeight, 0, 0, 1);
ConvertProjMatrixToD3DThrough(proj_through);
2013-08-17 11:23:51 +02:00
2014-09-10 13:48:55 +02:00
VSSetMatrix(CONST_VS_PROJ_THROUGH, proj_through.getReadPtr());
2013-08-17 11:23:51 +02:00
}
// Transform
if (dirtyUniforms & DIRTY_WORLDMATRIX) {
VSSetMatrix4x3_3(CONST_VS_WORLD, gstate.worldMatrix);
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_VIEWMATRIX) {
VSSetMatrix4x3_3(CONST_VS_VIEW, gstate.viewMatrix);
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_TEXMATRIX) {
VSSetMatrix4x3_3(CONST_VS_TEXMTX, gstate.tgenMatrix);
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_FOGCOEF) {
float fogcoef[2] = {
getFloat24(gstate.fog1),
getFloat24(gstate.fog2),
};
// The PSP just ignores infnan here (ignoring IEEE), so take it down to a valid float.
// Workaround for https://github.com/hrydgard/ppsspp/issues/5384#issuecomment-38365988
if (my_isnanorinf(fogcoef[0])) {
// Not really sure what a sensible value might be, but let's try 64k.
fogcoef[0] = std::signbit(fogcoef[0]) ? -65535.0f : 65535.0f;
}
if (my_isnanorinf(fogcoef[1])) {
fogcoef[1] = std::signbit(fogcoef[1]) ? -65535.0f : 65535.0f;
}
2014-09-10 13:48:55 +02:00
VSSetFloatArray(CONST_VS_FOGCOEF, fogcoef, 2);
}
// TODO: Could even set all bones in one go if they're all dirty.
#ifdef USE_BONE_ARRAY
if (u_bone != 0) {
float allBones[8 * 16];
bool allDirty = true;
for (int i = 0; i < numBones; i++) {
if (dirtyUniforms & (DIRTY_BONEMATRIX0 << i)) {
ConvertMatrix4x3To4x4(allBones + 16 * i, gstate.boneMatrix + 12 * i);
} else {
allDirty = false;
}
}
if (allDirty) {
// Set them all with one call
//glUniformMatrix4fv(u_bone, numBones, GL_FALSE, allBones);
} else {
// Set them one by one. Could try to coalesce two in a row etc but too lazy.
for (int i = 0; i < numBones; i++) {
if (dirtyUniforms & (DIRTY_BONEMATRIX0 << i)) {
//glUniformMatrix4fv(u_bone + i, 1, GL_FALSE, allBones + 16 * i);
}
}
}
}
#else
for (int i = 0; i < 8; i++) {
if (dirtyUniforms & (DIRTY_BONEMATRIX0 << i)) {
VSSetMatrix4x3_3(CONST_VS_BONE0 + 3 * i, gstate.boneMatrix + 12 * i);
}
}
#endif
2013-08-17 11:23:51 +02:00
// Texturing
if (dirtyUniforms & DIRTY_UVSCALEOFFSET) {
const float invW = 1.0f / (float)gstate_c.curTextureWidth;
const float invH = 1.0f / (float)gstate_c.curTextureHeight;
const int w = gstate.getTextureWidth(0);
const int h = gstate.getTextureHeight(0);
const float widthFactor = (float)w * invW;
const float heightFactor = (float)h * invH;
float uvscaleoff[4];
uvscaleoff[0] = widthFactor;
uvscaleoff[1] = heightFactor;
uvscaleoff[2] = 0.0f;
uvscaleoff[3] = 0.0f;
2014-09-10 13:48:55 +02:00
VSSetFloatArray(CONST_VS_UVSCALEOFFSET, uvscaleoff, 4);
}
2018-09-16 23:40:30 -07:00
if (dirtyUniforms & DIRTY_DEPTHRANGE) {
// Depth is [0, 1] mapping to [minz, maxz], not too hard.
float vpZScale = gstate.getViewportZScale();
float vpZCenter = gstate.getViewportZCenter();
// These are just the reverse of the formulas in GPUStateUtils.
float halfActualZRange = vpZScale / gstate_c.vpDepthScale;
float minz = -((gstate_c.vpZOffset * halfActualZRange) - vpZCenter) - halfActualZRange;
float viewZScale = halfActualZRange * 2.0f;
2016-01-20 22:53:47 -08:00
// Account for the half pixel offset.
float viewZCenter = minz + (DepthSliceFactor() / 256.0f) * 0.5f;
float viewZInvScale;
2015-08-27 18:01:00 +02:00
if (viewZScale != 0.0) {
viewZInvScale = 1.0f / viewZScale;
2015-08-27 18:01:00 +02:00
} else {
viewZInvScale = 0.0;
}
float data[4] = { viewZScale, viewZCenter, viewZCenter, viewZInvScale };
2015-08-26 17:45:21 +02:00
VSSetFloatUniform4(CONST_VS_DEPTHRANGE, data);
}
2018-09-16 23:40:30 -07:00
if (dirtyUniforms & DIRTY_CULLRANGE) {
float minValues[4], maxValues[4];
CalcCullRange(minValues, maxValues, false, false);
2018-09-16 23:40:30 -07:00
VSSetFloatUniform4(CONST_VS_CULLRANGEMIN, minValues);
VSSetFloatUniform4(CONST_VS_CULLRANGEMAX, maxValues);
}
2013-08-17 11:23:51 +02:00
// Lighting
if (dirtyUniforms & DIRTY_AMBIENT) {
2014-09-10 13:48:55 +02:00
VSSetColorUniform3Alpha(CONST_VS_AMBIENT, gstate.ambientcolor, gstate.getAmbientA());
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_MATAMBIENTALPHA) {
2014-09-10 13:48:55 +02:00
VSSetColorUniform3Alpha(CONST_VS_MATAMBIENTALPHA, gstate.materialambient, gstate.getMaterialAmbientA());
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_MATDIFFUSE) {
2014-09-10 13:48:55 +02:00
VSSetColorUniform3(CONST_VS_MATDIFFUSE, gstate.materialdiffuse);
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_MATEMISSIVE) {
2014-09-10 13:48:55 +02:00
VSSetColorUniform3(CONST_VS_MATEMISSIVE, gstate.materialemissive);
2013-08-17 11:23:51 +02:00
}
if (dirtyUniforms & DIRTY_MATSPECULAR) {
2014-09-10 13:48:55 +02:00
VSSetColorUniform3ExtraFloat(CONST_VS_MATSPECULAR, gstate.materialspecular, getFloat24(gstate.materialspecularcoef));
2013-08-17 11:23:51 +02:00
}
for (int i = 0; i < 4; i++) {
if (dirtyUniforms & (DIRTY_LIGHT0 << i)) {
if (gstate.isDirectionalLight(i)) {
// Prenormalize
float x = getFloat24(gstate.lpos[i * 3 + 0]);
float y = getFloat24(gstate.lpos[i * 3 + 1]);
float z = getFloat24(gstate.lpos[i * 3 + 2]);
float len = sqrtf(x*x + y*y + z*z);
if (len == 0.0f)
len = 1.0f;
else
len = 1.0f / len;
float vec[3] = { x * len, y * len, z * len };
VSSetFloatArray(CONST_VS_LIGHTPOS + i, vec, 3);
} else {
VSSetFloat24Uniform3(CONST_VS_LIGHTPOS + i, &gstate.lpos[i * 3]);
2013-08-17 11:23:51 +02:00
}
VSSetFloat24Uniform3(CONST_VS_LIGHTDIR + i, &gstate.ldir[i * 3]);
VSSetFloat24Uniform3(CONST_VS_LIGHTATT + i, &gstate.latt[i * 3]);
float angle_spotCoef[4] = { getFloat24(gstate.lcutoff[i]), getFloat24(gstate.lconv[i]) };
VSSetFloatUniform4(CONST_VS_LIGHTANGLE_SPOTCOEF + i, angle_spotCoef);
VSSetColorUniform3(CONST_VS_LIGHTAMBIENT + i, gstate.lcolor[i * 3]);
VSSetColorUniform3(CONST_VS_LIGHTDIFFUSE + i, gstate.lcolor[i * 3 + 1]);
VSSetColorUniform3(CONST_VS_LIGHTSPECULAR + i, gstate.lcolor[i * 3 + 2]);
2013-08-17 11:23:51 +02:00
}
}
}
ShaderManagerDX9::ShaderManagerDX9(Draw::DrawContext *draw, LPDIRECT3DDEVICE9 device)
: ShaderManagerCommon(draw), device_(device), lastVShader_(nullptr), lastPShader_(nullptr) {
2013-08-17 11:23:51 +02:00
codeBuffer_ = new char[16384];
}
ShaderManagerDX9::~ShaderManagerDX9() {
2013-08-17 11:23:51 +02:00
delete [] codeBuffer_;
}
void ShaderManagerDX9::Clear() {
2013-08-23 17:11:01 +02:00
for (auto iter = fsCache_.begin(); iter != fsCache_.end(); ++iter) {
2013-08-17 11:23:51 +02:00
delete iter->second;
}
2013-08-23 17:11:01 +02:00
for (auto iter = vsCache_.begin(); iter != vsCache_.end(); ++iter) {
2013-08-17 11:23:51 +02:00
delete iter->second;
}
2013-08-23 17:11:01 +02:00
fsCache_.clear();
vsCache_.clear();
2013-08-17 11:23:51 +02:00
DirtyShader();
}
void ShaderManagerDX9::ClearCache(bool deleteThem) {
2013-08-17 11:23:51 +02:00
Clear();
}
void ShaderManagerDX9::DirtyShader() {
2013-08-17 11:23:51 +02:00
// Forget the last shader ID
lastFSID_.set_invalid();
lastVSID_.set_invalid();
lastVShader_ = nullptr;
lastPShader_ = nullptr;
gstate_c.Dirty(DIRTY_ALL_UNIFORMS | DIRTY_VERTEXSHADER_STATE | DIRTY_FRAGMENTSHADER_STATE);
2013-08-17 11:23:51 +02:00
}
void ShaderManagerDX9::DirtyLastShader() { // disables vertex arrays
lastVShader_ = nullptr;
lastPShader_ = nullptr;
2013-08-17 11:23:51 +02:00
}
VSShader *ShaderManagerDX9::ApplyShader(bool useHWTransform, bool useHWTessellation, u32 vertType) {
// Always use software for flat shading to fix the provoking index.
bool tess = gstate_c.bezier || gstate_c.spline;
useHWTransform = useHWTransform && (tess || gstate.getShadeMode() != GE_SHADE_FLAT);
2013-08-17 11:23:51 +02:00
VShaderID VSID;
if (gstate_c.IsDirty(DIRTY_VERTEXSHADER_STATE)) {
gstate_c.Clean(DIRTY_VERTEXSHADER_STATE);
ComputeVertexShaderID(&VSID, vertType, useHWTransform, useHWTessellation);
} else {
VSID = lastVSID_;
}
FShaderID FSID;
2017-03-19 11:32:29 +01:00
if (gstate_c.IsDirty(DIRTY_FRAGMENTSHADER_STATE)) {
gstate_c.Clean(DIRTY_FRAGMENTSHADER_STATE);
ComputeFragmentShaderID(&FSID, draw_->GetBugs());
2017-03-19 11:32:29 +01:00
} else {
FSID = lastFSID_;
}
2013-08-17 11:23:51 +02:00
// Just update uniforms if this is the same shader as last time.
if (lastVShader_ != nullptr && lastPShader_ != nullptr && VSID == lastVSID_ && FSID == lastFSID_) {
uint64_t dirtyUniforms = gstate_c.GetDirtyUniforms();
if (dirtyUniforms) {
2017-01-24 14:16:51 +01:00
if (dirtyUniforms & psUniforms)
PSUpdateUniforms(dirtyUniforms);
if (dirtyUniforms & vsUniforms)
VSUpdateUniforms(dirtyUniforms);
gstate_c.CleanUniforms();
}
return lastVShader_; // Already all set.
2013-08-17 11:23:51 +02:00
}
2013-08-23 17:11:01 +02:00
VSCache::iterator vsIter = vsCache_.find(VSID);
2013-08-17 11:23:51 +02:00
VSShader *vs;
2013-08-23 17:11:01 +02:00
if (vsIter == vsCache_.end()) {
2013-08-17 11:23:51 +02:00
// Vertex shader not in cache. Let's compile it.
GenerateVertexShaderHLSL(VSID, codeBuffer_);
2017-02-05 20:46:26 +01:00
vs = new VSShader(device_, VSID, codeBuffer_, useHWTransform);
2013-08-17 11:23:51 +02:00
if (vs->Failed()) {
auto gr = GetI18NCategory("Graphics");
ERROR_LOG(G3D, "Shader compilation failed, falling back to software transform");
if (!g_Config.bHideSlowWarnings) {
host->NotifyUserMessage(gr->T("hardware transform error - falling back to software"), 2.5f, 0xFF3030FF);
}
2013-08-17 11:23:51 +02:00
delete vs;
ComputeVertexShaderID(&VSID, vertType, false, false);
2013-08-17 11:23:51 +02:00
// TODO: Look for existing shader with the appropriate ID, use that instead of generating a new one - however, need to make sure
// that that shader ID is not used when computing the linked shader ID below, because then IDs won't match
// next time and we'll do this over and over...
// Can still work with software transform.
GenerateVertexShaderHLSL(VSID, codeBuffer_);
2017-02-05 20:46:26 +01:00
vs = new VSShader(device_, VSID, codeBuffer_, false);
2013-08-17 11:23:51 +02:00
}
2013-08-23 17:11:01 +02:00
vsCache_[VSID] = vs;
2013-08-17 11:23:51 +02:00
} else {
vs = vsIter->second;
}
lastVSID_ = VSID;
2013-08-17 11:23:51 +02:00
2013-08-23 17:11:01 +02:00
FSCache::iterator fsIter = fsCache_.find(FSID);
2013-08-17 11:23:51 +02:00
PSShader *fs;
2013-08-23 17:11:01 +02:00
if (fsIter == fsCache_.end()) {
2013-08-17 11:23:51 +02:00
// Fragment shader not in cache. Let's compile it.
GenerateFragmentShaderHLSL(FSID, codeBuffer_);
2017-02-05 20:46:26 +01:00
fs = new PSShader(device_, FSID, codeBuffer_);
2013-08-23 17:11:01 +02:00
fsCache_[FSID] = fs;
2013-08-17 11:23:51 +02:00
} else {
fs = fsIter->second;
}
lastFSID_ = FSID;
uint64_t dirtyUniforms = gstate_c.GetDirtyUniforms();
if (dirtyUniforms) {
2017-01-24 14:16:51 +01:00
if (dirtyUniforms & psUniforms)
PSUpdateUniforms(dirtyUniforms);
if (dirtyUniforms & vsUniforms)
VSUpdateUniforms(dirtyUniforms);
gstate_c.CleanUniforms();
}
device_->SetPixelShader(fs->shader);
device_->SetVertexShader(vs->shader);
2013-08-17 11:23:51 +02:00
lastPShader_ = fs;
lastVShader_ = vs;
return vs;
2013-08-17 11:23:51 +02:00
}
std::vector<std::string> ShaderManagerDX9::DebugGetShaderIDs(DebugShaderType type) {
std::string id;
std::vector<std::string> ids;
switch (type) {
case SHADER_TYPE_VERTEX:
{
for (auto iter : vsCache_) {
iter.first.ToString(&id);
ids.push_back(id);
}
}
break;
case SHADER_TYPE_FRAGMENT:
{
for (auto iter : fsCache_) {
iter.first.ToString(&id);
ids.push_back(id);
}
}
break;
}
return ids;
}
std::string ShaderManagerDX9::DebugGetShaderString(std::string id, DebugShaderType type, DebugShaderStringType stringType) {
ShaderID shaderId;
shaderId.FromString(id);
switch (type) {
case SHADER_TYPE_VERTEX:
{
auto iter = vsCache_.find(VShaderID(shaderId));
if (iter == vsCache_.end()) {
return "";
}
return iter->second->GetShaderString(stringType);
}
case SHADER_TYPE_FRAGMENT:
{
auto iter = fsCache_.find(FShaderID(shaderId));
if (iter == fsCache_.end()) {
return "";
}
return iter->second->GetShaderString(stringType);
}
default:
return "N/A";
}
}
} // namespace