mirror of
https://github.com/wheremyfoodat/Panda3DS.git
synced 2025-04-07 06:35:40 +12:00
[Shader JIT] Add caching
This commit is contained in:
parent
364443d66f
commit
4064abfdeb
9 changed files with 77 additions and 5 deletions
|
@ -22,6 +22,7 @@ include_directories(third_party/gl3w/)
|
||||||
include_directories(third_party/imgui/)
|
include_directories(third_party/imgui/)
|
||||||
include_directories(third_party/dynarmic/src)
|
include_directories(third_party/dynarmic/src)
|
||||||
include_directories(third_party/cryptopp/)
|
include_directories(third_party/cryptopp/)
|
||||||
|
include_directories(third_party/cityhash/include)
|
||||||
include_directories(third_party/result/include/)
|
include_directories(third_party/result/include/)
|
||||||
|
|
||||||
add_compile_definitions(NOMINMAX)
|
add_compile_definitions(NOMINMAX)
|
||||||
|
|
|
@ -1,22 +1,35 @@
|
||||||
#pragma once
|
#pragma once
|
||||||
#include "PICA/shader.hpp"
|
#include "PICA/shader.hpp"
|
||||||
|
|
||||||
|
#if defined(PANDA3DS_DYNAPICA_SUPPORTED) && defined(PANDA3DS_X64_HOST)
|
||||||
|
#define PANDA3DS_SHADER_JIT_SUPPORTED
|
||||||
|
#include <unordered_map>
|
||||||
|
#endif
|
||||||
|
|
||||||
class ShaderJIT {
|
class ShaderJIT {
|
||||||
|
#ifdef PANDA3DS_SHADER_JIT_SUPPORTED
|
||||||
|
using Hash = PICAShader::Hash;
|
||||||
|
using ShaderCache = std::unordered_map<Hash, int>;
|
||||||
|
|
||||||
|
ShaderCache cache;
|
||||||
void compileShader(PICAShader& shaderUnit);
|
void compileShader(PICAShader& shaderUnit);
|
||||||
|
#endif
|
||||||
|
|
||||||
public:
|
public:
|
||||||
#if defined(PANDA3DS_DYNAPICA_SUPPORTED) && defined(PANDA3DS_X64_HOST)
|
#ifdef PANDA3DS_SHADER_JIT_SUPPORTED
|
||||||
#define PANDA3DS_SHADER_JIT_SUPPORTED
|
|
||||||
|
|
||||||
// Call this before starting to process a batch of vertices
|
// Call this before starting to process a batch of vertices
|
||||||
// This will read the PICA config (uploaded shader and shader operand descriptors) and search if we've already compiled this shader
|
// This will read the PICA config (uploaded shader and shader operand descriptors) and search if we've already compiled this shader
|
||||||
// If yes, it sets it as the active shader. if not, then it compiles it, adds it to the cache, and sets it as active,
|
// If yes, it sets it as the active shader. if not, then it compiles it, adds it to the cache, and sets it as active,
|
||||||
void prepare(PICAShader& shaderUnit);
|
void prepare(PICAShader& shaderUnit);
|
||||||
|
void reset();
|
||||||
|
|
||||||
static constexpr bool isAvailable() { return true; }
|
static constexpr bool isAvailable() { return true; }
|
||||||
#else
|
#else
|
||||||
void prepare(PICAShader& shaderUnit) {
|
void prepare(PICAShader& shaderUnit) {
|
||||||
Helpers::panic("Vertex Loader JIT: Tried to load vertices with JIT on platform that does not support vertex loader jit");
|
Helpers::panic("Vertex Loader JIT: Tried to load vertices with JIT on platform that does not support vertex loader jit");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void reset() {}
|
||||||
static constexpr bool isAvailable() { return false; }
|
static constexpr bool isAvailable() { return false; }
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|
|
@ -16,6 +16,8 @@ class GPU {
|
||||||
|
|
||||||
Memory& mem;
|
Memory& mem;
|
||||||
ShaderUnit shaderUnit;
|
ShaderUnit shaderUnit;
|
||||||
|
ShaderJIT shaderJIT; // Doesn't do anything if JIT is disabled or not supported
|
||||||
|
|
||||||
u8* vram = nullptr;
|
u8* vram = nullptr;
|
||||||
MAKE_LOG_FUNCTION(log, gpuLogger)
|
MAKE_LOG_FUNCTION(log, gpuLogger)
|
||||||
|
|
||||||
|
|
|
@ -89,6 +89,17 @@ protected:
|
||||||
std::array<CallInfo, 4> callInfo;
|
std::array<CallInfo, 4> callInfo;
|
||||||
ShaderType type;
|
ShaderType type;
|
||||||
|
|
||||||
|
// We use a hashmap for matching 3DS shaders to their equivalent compiled code in our shader cache in the shader JIT
|
||||||
|
// We choose our hash type to be a 64-bit integer by default, as the collision chance is very tiny and generating it is decently optimal
|
||||||
|
// Ideally we want to be able to support multiple different types of hash depending on compilation settings, but let's get this working first
|
||||||
|
using Hash = u64;
|
||||||
|
|
||||||
|
Hash lastCodeHash = 0; // Last hash computed for the shader code (Used for the JIT caching mechanism)
|
||||||
|
Hash lastOpdescHash = 0; // Last hash computed for the operand descriptors (Also used for the JIT)
|
||||||
|
|
||||||
|
bool codeHashDirty = false;
|
||||||
|
bool opdescHashDirty = false;
|
||||||
|
|
||||||
friend class ShaderJIT;
|
friend class ShaderJIT;
|
||||||
|
|
||||||
private:
|
private:
|
||||||
|
@ -204,11 +215,15 @@ public:
|
||||||
if (bufferIndex >= 4095) Helpers::panic("o no, shader upload overflew");
|
if (bufferIndex >= 4095) Helpers::panic("o no, shader upload overflew");
|
||||||
bufferedShader[bufferIndex++] = word;
|
bufferedShader[bufferIndex++] = word;
|
||||||
bufferIndex &= 0xfff;
|
bufferIndex &= 0xfff;
|
||||||
|
|
||||||
|
codeHashDirty = true; // Signal the JIT if necessary that the program hash has potentially changed
|
||||||
}
|
}
|
||||||
|
|
||||||
void uploadDescriptor(u32 word) {
|
void uploadDescriptor(u32 word) {
|
||||||
operandDescriptors[opDescriptorIndex++] = word;
|
operandDescriptors[opDescriptorIndex++] = word;
|
||||||
opDescriptorIndex &= 0x7f;
|
opDescriptorIndex &= 0x7f;
|
||||||
|
|
||||||
|
opdescHashDirty = true; // Signal the JIT if necessary that the program hash has potentially changed
|
||||||
}
|
}
|
||||||
|
|
||||||
void setFloatUniformIndex(u32 word) {
|
void setFloatUniformIndex(u32 word) {
|
||||||
|
@ -250,4 +265,7 @@ public:
|
||||||
|
|
||||||
void run();
|
void run();
|
||||||
void reset();
|
void reset();
|
||||||
|
|
||||||
|
Hash getCodeHash();
|
||||||
|
Hash getOpdescHash();
|
||||||
};
|
};
|
|
@ -1,7 +1,14 @@
|
||||||
#include "PICA/dynapica/shader_rec.hpp"
|
#include "PICA/dynapica/shader_rec.hpp"
|
||||||
|
#include "cityhash.hpp"
|
||||||
|
|
||||||
#ifdef PANDA3DS_SHADER_JIT_SUPPORTED
|
#ifdef PANDA3DS_SHADER_JIT_SUPPORTED
|
||||||
|
void ShaderJIT::reset() {
|
||||||
|
cache.clear();
|
||||||
|
}
|
||||||
|
|
||||||
void ShaderJIT::prepare(PICAShader& shaderUnit) {
|
void ShaderJIT::prepare(PICAShader& shaderUnit) {
|
||||||
printf("HAPPY HAPPY HAPPY\n");
|
// We construct a shader hash from both the code and operand descriptor hashes
|
||||||
|
// This is so that if only one of them changes, we still properly recompile the shader
|
||||||
|
Hash hash = shaderUnit.getCodeHash() ^ shaderUnit.getOpdescHash();
|
||||||
}
|
}
|
||||||
#endif // PANDA3DS_SHADER_JIT_SUPPORTED
|
#endif // PANDA3DS_SHADER_JIT_SUPPORTED
|
|
@ -12,6 +12,7 @@ GPU::GPU(Memory& mem) : mem(mem), renderer(*this, regs) {
|
||||||
void GPU::reset() {
|
void GPU::reset() {
|
||||||
regs.fill(0);
|
regs.fill(0);
|
||||||
shaderUnit.reset();
|
shaderUnit.reset();
|
||||||
|
shaderJIT.reset();
|
||||||
std::memset(vram, 0, vramSize);
|
std::memset(vram, 0, vramSize);
|
||||||
|
|
||||||
totalAttribCount = 0;
|
totalAttribCount = 0;
|
||||||
|
@ -84,6 +85,10 @@ void GPU::drawArrays() {
|
||||||
log("PICA::DrawElements(vertex count = %d, index buffer config = %08X)\n", vertexCount, indexBufferConfig);
|
log("PICA::DrawElements(vertex count = %d, index buffer config = %08X)\n", vertexCount, indexBufferConfig);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if constexpr (useShaderJIT) {
|
||||||
|
shaderJIT.prepare(shaderUnit.vs);
|
||||||
|
}
|
||||||
|
|
||||||
// Total number of input attributes to shader. Differs between GS and VS. Currently stubbed to the VS one, as we don't have geometry shaders.
|
// Total number of input attributes to shader. Differs between GS and VS. Currently stubbed to the VS one, as we don't have geometry shaders.
|
||||||
const u32 inputAttrCount = (regs[PICAInternalRegs::VertexShaderInputBufferCfg] & 0xf) + 1;
|
const u32 inputAttrCount = (regs[PICAInternalRegs::VertexShaderInputBufferCfg] & 0xf) + 1;
|
||||||
const u64 inputAttrCfg = getVertexShaderInputConfig();
|
const u64 inputAttrCfg = getVertexShaderInputConfig();
|
||||||
|
|
|
@ -1,4 +1,5 @@
|
||||||
#include "PICA/shader_unit.hpp"
|
#include "PICA/shader_unit.hpp"
|
||||||
|
#include "cityhash.hpp"
|
||||||
|
|
||||||
void ShaderUnit::reset() {
|
void ShaderUnit::reset() {
|
||||||
vs.reset();
|
vs.reset();
|
||||||
|
@ -30,4 +31,29 @@ void PICAShader::reset() {
|
||||||
addrRegister.x() = 0;
|
addrRegister.x() = 0;
|
||||||
addrRegister.y() = 0;
|
addrRegister.y() = 0;
|
||||||
loopCounter = 0;
|
loopCounter = 0;
|
||||||
|
|
||||||
|
codeHashDirty = true;
|
||||||
|
opdescHashDirty = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
PICAShader::Hash PICAShader::getCodeHash() {
|
||||||
|
// Hash the code again if the code changed
|
||||||
|
if (codeHashDirty) {
|
||||||
|
codeHashDirty = false;
|
||||||
|
lastCodeHash = CityHash::CityHash64((const char*)&loadedShader[0], loadedShader.size() * sizeof(loadedShader[0]));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Return the code hash
|
||||||
|
return lastCodeHash;
|
||||||
|
}
|
||||||
|
|
||||||
|
PICAShader::Hash PICAShader::getOpdescHash() {
|
||||||
|
// Hash the code again if the operand descriptors changed
|
||||||
|
if (opdescHashDirty) {
|
||||||
|
opdescHashDirty = false;
|
||||||
|
lastOpdescHash = CityHash::CityHash64((const char*)&operandDescriptors[0], operandDescriptors.size() * sizeof(operandDescriptors[0]));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Return the code hash
|
||||||
|
return lastOpdescHash;
|
||||||
}
|
}
|
2
third_party/cityhash/cityhash.cpp
vendored
2
third_party/cityhash/cityhash.cpp
vendored
|
@ -29,7 +29,7 @@
|
||||||
|
|
||||||
#include <algorithm>
|
#include <algorithm>
|
||||||
#include <string.h> // for memcpy and memset
|
#include <string.h> // for memcpy and memset
|
||||||
#include "cityhash.hpp"
|
#include "include/cityhash.hpp"
|
||||||
#include "swap.hpp"
|
#include "swap.hpp"
|
||||||
|
|
||||||
// #include "config.h"
|
// #include "config.h"
|
||||||
|
|
Loading…
Add table
Reference in a new issue