Merge pull request #708 from wheremyfoodat/icache

GPU: Add sw texture copies
This commit is contained in:
wheremyfoodat 2025-01-03 21:40:18 +02:00 committed by GitHub
commit b559725920
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
4 changed files with 42 additions and 1 deletions

View file

@ -53,6 +53,7 @@ class Renderer {
EmulatorConfig* emulatorConfig = nullptr;
void doSoftwareTextureCopy(u32 inputAddr, u32 outputAddr, u32 copySize, u32 inputWidth, u32 inputGap, u32 outputWidth, u32 outputGap);
public:
Renderer(GPU& gpu, const std::array<u32, regNum>& internalRegs, const std::array<u32, extRegNum>& externalRegs);
virtual ~Renderer();

View file

@ -792,6 +792,8 @@ void RendererGL::textureCopy(u32 inputAddr, u32 outputAddr, u32 totalBytes, u32
shutUpCounter++;
printf("RendererGL::TextureCopy failed to locate src framebuffer!\n");
}
doSoftwareTextureCopy(inputAddr, outputAddr, copySize, inputWidth, inputGap, outputWidth, outputGap);
return;
}

View file

@ -426,7 +426,7 @@ void RendererMTL::textureCopy(u32 inputAddr, u32 outputAddr, u32 totalBytes, u32
// Find the source surface.
auto srcFramebuffer = getColorRenderTarget(inputAddr, PICA::ColorFmt::RGBA8, copyStride, copyHeight, false);
if (!srcFramebuffer) {
Helpers::warn("RendererMTL::TextureCopy failed to locate src framebuffer!\n");
doSoftwareTextureCopy(inputAddr, outputAddr, copySize, inputWidth, inputGap, outputWidth, outputGap);
return;
}
nextRenderPassName = "Clear before texture copy";

View file

@ -3,6 +3,8 @@
#include <algorithm>
#include <unordered_map>
#include "PICA/gpu.hpp"
Renderer::Renderer(GPU& gpu, const std::array<u32, regNum>& internalRegs, const std::array<u32, extRegNum>& externalRegs)
: gpu(gpu), regs(internalRegs), externalRegs(externalRegs) {}
Renderer::~Renderer() {}
@ -39,3 +41,39 @@ const char* Renderer::typeToString(RendererType rendererType) {
default: return "Invalid";
}
}
void Renderer::doSoftwareTextureCopy(u32 inputAddr, u32 outputAddr, u32 copySize, u32 inputWidth, u32 inputGap, u32 outputWidth, u32 outputGap) {
u8* inputPointer = gpu.getPointerPhys<u8>(inputAddr);
u8* outputPointer = gpu.getPointerPhys<u8>(outputAddr);
if (inputPointer == nullptr || outputPointer == nullptr) {
return;
}
u32 inputBytesLeft = inputWidth;
u32 outputBytesLeft = outputWidth;
u32 copyBytesLeft = copySize;
while (copyBytesLeft > 0) {
const u32 bytes = std::min<u32>({inputBytesLeft, outputBytesLeft, copyBytesLeft});
std::memcpy(outputPointer, inputPointer, bytes);
inputPointer += bytes;
outputPointer += bytes;
inputBytesLeft -= bytes;
outputBytesLeft -= bytes;
copyBytesLeft -= bytes;
// Apply input and output gap when an input or output line ends
if (inputBytesLeft == 0) {
inputBytesLeft = inputWidth;
inputPointer += inputGap;
}
if (outputBytesLeft == 0) {
outputBytesLeft = outputWidth;
outputPointer += outputGap;
}
}
}