mirror of
https://github.com/wheremyfoodat/Panda3DS.git
synced 2025-04-06 22:25:41 +12:00
First Metal cleanup & formatting pass
This commit is contained in:
parent
4cc62d4870
commit
49b65242b9
17 changed files with 1084 additions and 1115 deletions
|
@ -19,8 +19,6 @@ template <typename SurfaceType, size_t capacity, bool evictOnOverflow = false>
|
|||
class SurfaceCache {
|
||||
// Vanilla std::optional can't hold actual references
|
||||
using OptionalRef = std::optional<std::reference_wrapper<SurfaceType>>;
|
||||
//static_assert(std::is_same<SurfaceType, ColourBuffer>() || std::is_same<SurfaceType, DepthBuffer>() ||
|
||||
// std::is_same<SurfaceType, Texture>(), "Invalid surface type");
|
||||
|
||||
size_t size;
|
||||
size_t evictionIndex;
|
||||
|
|
|
@ -7,16 +7,15 @@
|
|||
using namespace PICA;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct BlitPipelineHash {
|
||||
struct BlitPipelineHash {
|
||||
// Formats
|
||||
ColorFmt colorFmt;
|
||||
DepthFmt depthFmt;
|
||||
};
|
||||
};
|
||||
|
||||
// This pipeline only caches the pipeline with all of its color and depth attachment variations
|
||||
class BlitPipelineCache {
|
||||
public:
|
||||
// This cache stores the blit pipeline state once per combination of color and depth attachment formats
|
||||
class BlitPipelineCache {
|
||||
public:
|
||||
BlitPipelineCache() = default;
|
||||
|
||||
~BlitPipelineCache() {
|
||||
|
@ -64,12 +63,11 @@ public:
|
|||
pipelineCache.clear();
|
||||
}
|
||||
|
||||
private:
|
||||
private:
|
||||
std::map<u8, MTL::RenderPipelineState*> pipelineCache;
|
||||
|
||||
MTL::Device* device;
|
||||
MTL::Function* vertexFunction;
|
||||
MTL::Function* fragmentFunction;
|
||||
};
|
||||
|
||||
};
|
||||
} // namespace Metal
|
||||
|
|
|
@ -3,16 +3,15 @@
|
|||
#include <Metal/Metal.hpp>
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct RenderState {
|
||||
struct RenderState {
|
||||
MTL::RenderPipelineState* renderPipelineState = nullptr;
|
||||
MTL::DepthStencilState* depthStencilState = nullptr;
|
||||
MTL::Texture* textures[3] = {nullptr};
|
||||
MTL::SamplerState* samplerStates[3] = {nullptr};
|
||||
};
|
||||
};
|
||||
|
||||
class CommandEncoder {
|
||||
public:
|
||||
class CommandEncoder {
|
||||
public:
|
||||
void newRenderCommandEncoder(MTL::RenderCommandEncoder* rce) {
|
||||
renderCommandEncoder = rce;
|
||||
|
||||
|
@ -49,10 +48,9 @@ public:
|
|||
}
|
||||
}
|
||||
|
||||
private:
|
||||
private:
|
||||
MTL::RenderCommandEncoder* renderCommandEncoder = nullptr;
|
||||
|
||||
RenderState renderState;
|
||||
};
|
||||
|
||||
};
|
||||
} // namespace Metal
|
||||
|
|
|
@ -7,28 +7,24 @@
|
|||
using namespace PICA;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct DepthStencilHash {
|
||||
bool depthStencilWrite;
|
||||
u8 depthFunc;
|
||||
struct DepthStencilHash {
|
||||
u32 stencilConfig;
|
||||
u16 stencilOpConfig;
|
||||
};
|
||||
bool depthStencilWrite;
|
||||
u8 depthFunc;
|
||||
};
|
||||
|
||||
class DepthStencilCache {
|
||||
public:
|
||||
class DepthStencilCache {
|
||||
public:
|
||||
DepthStencilCache() = default;
|
||||
|
||||
~DepthStencilCache() {
|
||||
reset();
|
||||
}
|
||||
~DepthStencilCache() { reset(); }
|
||||
|
||||
void set(MTL::Device* dev) {
|
||||
device = dev;
|
||||
}
|
||||
void set(MTL::Device* dev) { device = dev; }
|
||||
|
||||
MTL::DepthStencilState* get(DepthStencilHash hash) {
|
||||
u64 intHash = ((u64)hash.depthStencilWrite << 56) | ((u64)hash.depthFunc << 48) | ((u64)hash.stencilConfig << 16) | (u64)hash.stencilOpConfig;
|
||||
u64 intHash =
|
||||
((u64)hash.depthStencilWrite << 56) | ((u64)hash.depthFunc << 48) | ((u64)hash.stencilConfig << 16) | (u64)hash.stencilOpConfig;
|
||||
auto& depthStencilState = depthStencilCache[intHash];
|
||||
if (!depthStencilState) {
|
||||
MTL::DepthStencilDescriptor* desc = MTL::DepthStencilDescriptor::alloc()->init();
|
||||
|
@ -77,10 +73,8 @@ public:
|
|||
depthStencilCache.clear();
|
||||
}
|
||||
|
||||
private:
|
||||
private:
|
||||
std::map<u64, MTL::DepthStencilState*> depthStencilCache;
|
||||
|
||||
MTL::Device* device;
|
||||
};
|
||||
|
||||
};
|
||||
} // namespace Metal
|
||||
|
|
|
@ -7,30 +7,24 @@
|
|||
using namespace PICA;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct DrawFragmentFunctionHash {
|
||||
struct DrawFragmentFunctionHash {
|
||||
bool lightingEnabled; // 1 bit
|
||||
u8 lightingNumLights; // 3 bits
|
||||
u32 lightingConfig1; // 32 bits (TODO: check this)
|
||||
// | ref | func | on |
|
||||
u16 alphaControl; // 12 bits (mask: 11111111 0111 0001)
|
||||
};
|
||||
};
|
||||
|
||||
//bool operator==(const DrawFragmentFunctionHash& l, const DrawFragmentFunctionHash& r) {
|
||||
// return ((l.lightingEnabled == r.lightingEnabled) && (l.lightingNumLights == r.lightingNumLights) &&
|
||||
// (l.lightingConfig1 == r.lightingConfig1) && (l.alphaControl == r.alphaControl));
|
||||
//}
|
||||
|
||||
// Ordering for DrawFragmentFunctionHash so that it can be used as a std::map key.
//
// Fields are compared lexicographically in the order lightingEnabled, lightingNumLights,
// lightingConfig1, alphaControl: a later field is only consulted when every earlier field is equal.
// Testing each field independently (returning true as soon as any one field of l is smaller) allows
// both l < r and r < l to be true for the same pair, which is not a strict weak ordering and makes
// lookups in an ordered container unreliable.
inline bool operator<(const DrawFragmentFunctionHash& l, const DrawFragmentFunctionHash& r) {
	// false sorts before true
	if (l.lightingEnabled != r.lightingEnabled) return !l.lightingEnabled;
	if (l.lightingNumLights != r.lightingNumLights) return l.lightingNumLights < r.lightingNumLights;
	if (l.lightingConfig1 != r.lightingConfig1) return l.lightingConfig1 < r.lightingConfig1;

	return l.alphaControl < r.alphaControl;
}
|
||||
|
||||
struct DrawPipelineHash { // 56 bits
|
||||
struct DrawPipelineHash { // 56 bits
|
||||
// Formats
|
||||
ColorFmt colorFmt; // 3 bits
|
||||
DepthFmt depthFmt; // 3 bits
|
||||
|
@ -42,15 +36,9 @@ struct DrawPipelineHash { // 56 bits
|
|||
u8 colorWriteMask; // 4 bits
|
||||
|
||||
DrawFragmentFunctionHash fragHash;
|
||||
};
|
||||
};
|
||||
|
||||
//bool operator==(const DrawPipelineHash& l, const DrawPipelineHash& r) {
|
||||
// return (((u32)l.colorFmt == (u32)r.colorFmt) && ((u32)l.depthFmt == (u32)r.depthFmt) &&
|
||||
// (l.blendEnabled == r.blendEnabled) && (l.blendControl == r.blendControl) &&
|
||||
// (l.colorWriteMask == r.colorWriteMask) && (l.fragHash == r.fragHash));
|
||||
//}
|
||||
|
||||
inline bool operator<(const DrawPipelineHash& l, const DrawPipelineHash& r) {
|
||||
inline bool operator<(const DrawPipelineHash& l, const DrawPipelineHash& r) {
|
||||
if ((u32)l.colorFmt < (u32)r.colorFmt) return true;
|
||||
if ((u32)l.depthFmt < (u32)r.depthFmt) return true;
|
||||
if (!l.blendEnabled && r.blendEnabled) return true;
|
||||
|
@ -59,14 +47,11 @@ inline bool operator<(const DrawPipelineHash& l, const DrawPipelineHash& r) {
|
|||
if (l.fragHash < r.fragHash) return true;
|
||||
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
// Bind the vertex buffer to binding 30 so that it doesn't occupy the lower indices
|
||||
#define VERTEX_BUFFER_BINDING_INDEX 30
|
||||
|
||||
// This pipeline only caches the pipeline with all of its color and depth attachment variations
|
||||
class DrawPipelineCache {
|
||||
public:
|
||||
// This cache stores one draw pipeline state per DrawPipelineHash (attachment formats, blend state, color write mask and fragment function variant)
|
||||
class DrawPipelineCache {
|
||||
public:
|
||||
DrawPipelineCache() = default;
|
||||
|
||||
~DrawPipelineCache() {
|
||||
|
@ -83,9 +68,8 @@ public:
|
|||
}
|
||||
|
||||
MTL::RenderPipelineState* get(DrawPipelineHash hash) {
|
||||
//u32 fragmentFunctionHash = ((u32)hash.lightingEnabled << 22) | ((u32)hash.lightingNumLights << 19) | ((u32)hash.lightingConfig1 << 12) | ((((u32)hash.alphaControl & 0b1111111100000000) >> 8) << 4) | ((((u32)hash.alphaControl & 0b01110000) >> 4) << 1) | ((u32)hash.alphaControl & 0b0001);
|
||||
//u64 pipelineHash = ((u64)hash.colorFmt << 53) | ((u64)hash.depthFmt << 50) | ((u64)hash.blendEnabled << 49) | ((u64)hash.colorWriteMask << 45) | ((((u64)hash.blendControl & 0b11111111111111110000000000000000) >> 16) << 29) | ((((u64)hash.blendControl & 0b0000011100000000) >> 8) << 26) | (((u64)hash.blendControl & 0b00000111) << 23) | fragmentFunctionHash;
|
||||
auto& pipeline = pipelineCache[hash];
|
||||
|
||||
if (!pipeline) {
|
||||
auto& fragmentFunction = fragmentFunctionCache[hash.fragHash];
|
||||
if (!fragmentFunction) {
|
||||
|
@ -137,8 +121,7 @@ public:
|
|||
|
||||
MTL::PixelFormat depthFormat = toMTLPixelFormatDepth(hash.depthFmt);
|
||||
desc->setDepthAttachmentPixelFormat(depthFormat);
|
||||
if (hash.depthFmt == DepthFmt::Depth24Stencil8)
|
||||
desc->setStencilAttachmentPixelFormat(depthFormat);
|
||||
if (hash.depthFmt == DepthFmt::Depth24Stencil8) desc->setStencilAttachmentPixelFormat(depthFormat);
|
||||
|
||||
NS::Error* error = nullptr;
|
||||
desc->setLabel(toNSString("Draw pipeline"));
|
||||
|
@ -158,13 +141,14 @@ public:
|
|||
pair.second->release();
|
||||
}
|
||||
pipelineCache.clear();
|
||||
|
||||
for (auto& pair : fragmentFunctionCache) {
|
||||
pair.second->release();
|
||||
}
|
||||
fragmentFunctionCache.clear();
|
||||
}
|
||||
|
||||
private:
|
||||
private:
|
||||
std::map<DrawPipelineHash, MTL::RenderPipelineState*> pipelineCache;
|
||||
std::map<DrawFragmentFunctionHash, MTL::Function*> fragmentFunctionCache;
|
||||
|
||||
|
@ -172,6 +156,6 @@ private:
|
|||
MTL::Library* library;
|
||||
MTL::Function* vertexFunction;
|
||||
MTL::VertexDescriptor* vertexDescriptor;
|
||||
};
|
||||
};
|
||||
|
||||
} // namespace Metal
|
||||
|
|
|
@ -8,17 +8,12 @@ class LutTexture {
|
|||
public:
|
||||
LutTexture(MTL::Device* device, MTL::TextureType type, MTL::PixelFormat pixelFormat, u32 width, u32 height, const char* name);
|
||||
~LutTexture();
|
||||
|
||||
u32 getNextIndex();
|
||||
|
||||
// Getters
|
||||
MTL::Texture* getTexture() { return texture; }
|
||||
|
||||
u32 getCurrentIndex() { return currentIndex; }
|
||||
|
||||
private:
|
||||
MTL::Texture* texture;
|
||||
|
||||
u32 currentIndex = 0;
|
||||
};
|
||||
|
||||
|
|
|
@ -1,21 +1,21 @@
|
|||
#pragma once
|
||||
#include <Metal/Metal.hpp>
|
||||
#include <array>
|
||||
#include <string>
|
||||
#include <Metal/Metal.hpp>
|
||||
|
||||
#include "boost/icl/interval.hpp"
|
||||
#include "helpers.hpp"
|
||||
#include "math_util.hpp"
|
||||
#include "objc_helper.hpp"
|
||||
#include "opengl.hpp"
|
||||
#include "pica_to_mtl.hpp"
|
||||
#include "objc_helper.hpp"
|
||||
|
||||
template <typename T>
|
||||
using Interval = boost::icl::right_open_interval<T>;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
template <typename Format_t>
|
||||
struct RenderTarget {
|
||||
template <typename Format_t>
|
||||
struct RenderTarget {
|
||||
MTL::Device* device;
|
||||
|
||||
u32 location;
|
||||
|
@ -47,8 +47,7 @@ struct RenderTarget {
|
|||
// For 2 textures to "match" we only care about their locations, formats, and dimensions to match
|
||||
// For other things, such as filtering mode, etc, we can just switch the attributes of the cached texture
|
||||
bool matches(RenderTarget& other) {
|
||||
return location == other.location && format == other.format &&
|
||||
size.x() == other.size.x() && size.y() == other.size.y();
|
||||
return location == other.location && format == other.format && size.x() == other.size.x() && size.y() == other.size.y();
|
||||
}
|
||||
|
||||
void allocate() {
|
||||
|
@ -69,7 +68,10 @@ struct RenderTarget {
|
|||
descriptor->setUsage(MTL::TextureUsageRenderTarget | MTL::TextureUsageShaderRead);
|
||||
descriptor->setStorageMode(MTL::StorageModePrivate);
|
||||
texture = device->newTexture(descriptor);
|
||||
texture->setLabel(toNSString(std::string(std::is_same<Format_t, PICA::ColorFmt>::value ? "Color" : "Depth") + " render target " + std::to_string(size.u()) + "x" + std::to_string(size.v())));
|
||||
texture->setLabel(toNSString(
|
||||
std::string(std::is_same<Format_t, PICA::ColorFmt>::value ? "Color" : "Depth") + " render target " + std::to_string(size.u()) + "x" +
|
||||
std::to_string(size.v())
|
||||
));
|
||||
descriptor->release();
|
||||
}
|
||||
|
||||
|
@ -81,12 +83,9 @@ struct RenderTarget {
|
|||
}
|
||||
}
|
||||
|
||||
u64 sizeInBytes() {
|
||||
return (size_t)size.x() * (size_t)size.y() * PICA::sizePerPixel(format);
|
||||
}
|
||||
};
|
||||
|
||||
typedef RenderTarget<PICA::ColorFmt> ColorRenderTarget;
|
||||
typedef RenderTarget<PICA::DepthFmt> DepthStencilRenderTarget;
|
||||
u64 sizeInBytes() { return (size_t)size.x() * (size_t)size.y() * PICA::sizePerPixel(format); }
|
||||
};
|
||||
|
||||
using ColorRenderTarget = RenderTarget<PICA::ColorFmt>;
|
||||
using DepthStencilRenderTarget = RenderTarget<PICA::DepthFmt>;
|
||||
} // namespace Metal
|
||||
|
|
|
@ -1,8 +1,9 @@
|
|||
#pragma once
|
||||
|
||||
#include <Metal/Metal.hpp>
|
||||
#include <array>
|
||||
#include <string>
|
||||
#include <Metal/Metal.hpp>
|
||||
|
||||
#include "PICA/regs.hpp"
|
||||
#include "boost/icl/interval.hpp"
|
||||
#include "helpers.hpp"
|
||||
|
@ -10,12 +11,12 @@
|
|||
#include "opengl.hpp"
|
||||
#include "renderer_mtl/pica_to_mtl.hpp"
|
||||
|
||||
|
||||
template <typename T>
|
||||
using Interval = boost::icl::right_open_interval<T>;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct Texture {
|
||||
struct Texture {
|
||||
MTL::Device* device;
|
||||
|
||||
u32 location;
|
||||
|
@ -35,7 +36,6 @@ struct Texture {
|
|||
|
||||
Texture(MTL::Device* dev, u32 loc, PICA::TextureFmt format, u32 x, u32 y, u32 config, bool valid = true)
|
||||
: device(dev), location(loc), format(format), size({x, y}), config(config), valid(valid) {
|
||||
|
||||
u64 endLoc = (u64)loc + sizeInBytes();
|
||||
// Check if start and end are valid here
|
||||
range = Interval<u32>(loc, (u32)endLoc);
|
||||
|
@ -44,8 +44,7 @@ struct Texture {
|
|||
// For 2 textures to "match" we only care about their locations, formats, and dimensions to match
|
||||
// For other things, such as filtering mode, etc, we can just switch the attributes of the cached texture
|
||||
bool matches(Texture& other) {
|
||||
return location == other.location && format == other.format &&
|
||||
size.x() == other.size.x() && size.y() == other.size.y();
|
||||
return location == other.location && format == other.format && size.x() == other.size.x() && size.y() == other.size.y();
|
||||
}
|
||||
|
||||
void allocate();
|
||||
|
@ -65,14 +64,11 @@ struct Texture {
|
|||
static u32 getSwizzledOffset_4bpp(u32 u, u32 v, u32 width);
|
||||
|
||||
// Returns the format of this texture as a string
|
||||
std::string_view formatToString() {
|
||||
return PICA::textureFormatToString(format);
|
||||
}
|
||||
std::string_view formatToString() { return PICA::textureFormatToString(format); }
|
||||
|
||||
// Returns the texel at coordinates (u, v) of an ETC1(A4) texture
|
||||
// TODO: Make hasAlpha a template parameter
|
||||
u32 getTexelETC(bool hasAlpha, u32 u, u32 v, u32 width, std::span<const u8> data);
|
||||
u32 decodeETC(u32 alpha, u32 u, u32 v, u64 colourData);
|
||||
};
|
||||
|
||||
};
|
||||
} // namespace Metal
|
||||
|
|
|
@ -5,17 +5,16 @@
|
|||
using namespace PICA;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
struct BufferHandle {
|
||||
struct BufferHandle {
|
||||
MTL::Buffer* buffer;
|
||||
size_t offset;
|
||||
};
|
||||
};
|
||||
|
||||
// 128MB buffer for caching vertex data
|
||||
#define CACHE_BUFFER_SIZE 128 * 1024 * 1024
|
||||
class VertexBufferCache {
|
||||
// 128MB buffer for caching vertex data
|
||||
static constexpr usize CACHE_BUFFER_SIZE = 128 * 1024 * 1024;
|
||||
|
||||
class VertexBufferCache {
|
||||
public:
|
||||
public:
|
||||
VertexBufferCache() = default;
|
||||
|
||||
~VertexBufferCache() {
|
||||
|
@ -64,7 +63,7 @@ public:
|
|||
}
|
||||
}
|
||||
|
||||
private:
|
||||
private:
|
||||
MTL::Buffer* buffer = nullptr;
|
||||
size_t ptr = 0;
|
||||
std::vector<MTL::Buffer*> additionalAllocations;
|
||||
|
@ -75,6 +74,5 @@ private:
|
|||
buffer = device->newBuffer(CACHE_BUFFER_SIZE, MTL::ResourceStorageModeShared);
|
||||
buffer->setLabel(toNSString("Shared vertex buffer"));
|
||||
}
|
||||
};
|
||||
|
||||
};
|
||||
} // namespace Metal
|
||||
|
|
|
@ -5,12 +5,8 @@
|
|||
#include "mtl_common.hpp"
|
||||
|
||||
namespace Metal {
|
||||
|
||||
dispatch_data_t createDispatchData(const void* data, size_t size);
|
||||
|
||||
dispatch_data_t createDispatchData(const void* data, size_t size);
|
||||
} // namespace Metal
|
||||
|
||||
// Cast from std::string to NS::String*
|
||||
inline NS::String* toNSString(const std::string& str) {
|
||||
return NS::String::string(str.c_str(), NS::ASCIIStringEncoding);
|
||||
}
|
||||
inline NS::String* toNSString(const std::string& str) { return NS::String::string(str.c_str(), NS::ASCIIStringEncoding); }
|
|
@ -1,16 +1,17 @@
|
|||
#pragma once
|
||||
|
||||
#include <Metal/Metal.hpp>
|
||||
|
||||
#include "PICA/regs.hpp"
|
||||
|
||||
namespace PICA {
|
||||
|
||||
struct PixelFormatInfo {
|
||||
namespace PICA {
|
||||
struct PixelFormatInfo {
|
||||
MTL::PixelFormat pixelFormat;
|
||||
size_t bytesPerTexel;
|
||||
};
|
||||
};
|
||||
|
||||
constexpr PixelFormatInfo pixelFormatInfos[14] = {
|
||||
constexpr PixelFormatInfo pixelFormatInfos[14] = {
|
||||
{MTL::PixelFormatRGBA8Unorm, 4}, // RGBA8
|
||||
{MTL::PixelFormatRGBA8Unorm, 4}, // RGB8
|
||||
{MTL::PixelFormatBGR5A1Unorm, 2}, // RGBA5551
|
||||
|
@ -25,13 +26,11 @@ constexpr PixelFormatInfo pixelFormatInfos[14] = {
|
|||
{MTL::PixelFormatA8Unorm, 1}, // A4
|
||||
{MTL::PixelFormatRGBA8Unorm, 4}, // ETC1
|
||||
{MTL::PixelFormatRGBA8Unorm, 4}, // ETC1A4
|
||||
};
|
||||
};
|
||||
|
||||
inline PixelFormatInfo getPixelFormatInfo(TextureFmt format) {
|
||||
return pixelFormatInfos[static_cast<int>(format)];
|
||||
}
|
||||
inline PixelFormatInfo getPixelFormatInfo(TextureFmt format) { return pixelFormatInfos[static_cast<int>(format)]; }
|
||||
|
||||
inline MTL::PixelFormat toMTLPixelFormatColor(ColorFmt format) {
|
||||
inline MTL::PixelFormat toMTLPixelFormatColor(ColorFmt format) {
|
||||
switch (format) {
|
||||
case ColorFmt::RGBA8: return MTL::PixelFormatRGBA8Unorm;
|
||||
case ColorFmt::RGB8: return MTL::PixelFormatRGBA8Unorm;
|
||||
|
@ -39,19 +38,20 @@ inline MTL::PixelFormat toMTLPixelFormatColor(ColorFmt format) {
|
|||
case ColorFmt::RGB565: return MTL::PixelFormatRGBA8Unorm; // TODO: use MTL::PixelFormatB5G6R5Unorm?
|
||||
case ColorFmt::RGBA4: return MTL::PixelFormatABGR4Unorm;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Maps a PICA depth buffer format to the Metal pixel format used to back it.
// Returns MTL::PixelFormatInvalid for DepthFmt::Unknown1 and for any value not listed below.
inline MTL::PixelFormat toMTLPixelFormatDepth(DepthFmt format) {
	switch (format) {
		case DepthFmt::Depth16: return MTL::PixelFormatDepth16Unorm;
		case DepthFmt::Unknown1: return MTL::PixelFormatInvalid;
		// Metal does not support 24-bit depth formats
		case DepthFmt::Depth24: return MTL::PixelFormatDepth32Float;
		// Apple silicon doesn't support 24-bit depth buffers, so we use 32-bit instead
		case DepthFmt::Depth24Stencil8: return MTL::PixelFormatDepth32Float_Stencil8;
	}

	// Not reached for the enumerators handled above. Without this return, control would flow off the end
	// of a non-void function if `format` ever held any other value.
	return MTL::PixelFormatInvalid;
}
|
||||
|
||||
inline MTL::CompareFunction toMTLCompareFunc(u8 func) {
|
||||
inline MTL::CompareFunction toMTLCompareFunc(u8 func) {
|
||||
switch (func) {
|
||||
case 0: return MTL::CompareFunctionNever;
|
||||
case 1: return MTL::CompareFunctionAlways;
|
||||
|
@ -65,9 +65,9 @@ inline MTL::CompareFunction toMTLCompareFunc(u8 func) {
|
|||
}
|
||||
|
||||
return MTL::CompareFunctionAlways;
|
||||
}
|
||||
}
|
||||
|
||||
inline MTL::BlendOperation toMTLBlendOperation(u8 op) {
|
||||
inline MTL::BlendOperation toMTLBlendOperation(u8 op) {
|
||||
switch (op) {
|
||||
case 0: return MTL::BlendOperationAdd;
|
||||
case 1: return MTL::BlendOperationSubtract;
|
||||
|
@ -81,9 +81,9 @@ inline MTL::BlendOperation toMTLBlendOperation(u8 op) {
|
|||
}
|
||||
|
||||
return MTL::BlendOperationAdd;
|
||||
}
|
||||
}
|
||||
|
||||
inline MTL::BlendFactor toMTLBlendFactor(u8 factor) {
|
||||
inline MTL::BlendFactor toMTLBlendFactor(u8 factor) {
|
||||
switch (factor) {
|
||||
case 0: return MTL::BlendFactorZero;
|
||||
case 1: return MTL::BlendFactorOne;
|
||||
|
@ -105,9 +105,9 @@ inline MTL::BlendFactor toMTLBlendFactor(u8 factor) {
|
|||
}
|
||||
|
||||
return MTL::BlendFactorOne;
|
||||
}
|
||||
}
|
||||
|
||||
inline MTL::StencilOperation toMTLStencilOperation(u8 op) {
|
||||
inline MTL::StencilOperation toMTLStencilOperation(u8 op) {
|
||||
switch (op) {
|
||||
case 0: return MTL::StencilOperationKeep;
|
||||
case 1: return MTL::StencilOperationZero;
|
||||
|
@ -121,9 +121,9 @@ inline MTL::StencilOperation toMTLStencilOperation(u8 op) {
|
|||
}
|
||||
|
||||
return MTL::StencilOperationKeep;
|
||||
}
|
||||
}
|
||||
|
||||
inline MTL::PrimitiveType toMTLPrimitiveType(PrimType primType) {
|
||||
inline MTL::PrimitiveType toMTLPrimitiveType(PrimType primType) {
|
||||
switch (primType) {
|
||||
case PrimType::TriangleList: return MTL::PrimitiveTypeTriangle;
|
||||
case PrimType::TriangleStrip: return MTL::PrimitiveTypeTriangleStrip;
|
||||
|
@ -131,12 +131,12 @@ inline MTL::PrimitiveType toMTLPrimitiveType(PrimType primType) {
|
|||
Helpers::warn("Triangle fans are not supported on Metal, using triangles instead");
|
||||
return MTL::PrimitiveTypeTriangle;
|
||||
case PrimType::GeometryPrimitive:
|
||||
//Helpers::warn("Geometry primitives are not yet, using triangles instead");
|
||||
// Helpers::warn("Geometry primitives are not yet supported, using triangles instead");
|
||||
return MTL::PrimitiveTypeTriangle;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
inline MTL::SamplerAddressMode toMTLSamplerAddressMode(u8 addrMode) {
|
||||
inline MTL::SamplerAddressMode toMTLSamplerAddressMode(u8 addrMode) {
|
||||
switch (addrMode) {
|
||||
case 0: return MTL::SamplerAddressModeClampToEdge;
|
||||
case 1: return MTL::SamplerAddressModeClampToBorderColor;
|
||||
|
@ -150,6 +150,5 @@ inline MTL::SamplerAddressMode toMTLSamplerAddressMode(u8 addrMode) {
|
|||
}
|
||||
|
||||
return MTL::SamplerAddressModeClampToEdge;
|
||||
}
|
||||
|
||||
}
|
||||
} // namespace PICA
|
||||
|
|
|
@ -3,15 +3,16 @@
|
|||
#include <Metal/Metal.hpp>
|
||||
#include <QuartzCore/QuartzCore.hpp>
|
||||
|
||||
#include "renderer.hpp"
|
||||
#include "mtl_texture.hpp"
|
||||
#include "mtl_render_target.hpp"
|
||||
#include "mtl_blit_pipeline_cache.hpp"
|
||||
#include "mtl_draw_pipeline_cache.hpp"
|
||||
#include "mtl_depth_stencil_cache.hpp"
|
||||
#include "mtl_vertex_buffer_cache.hpp"
|
||||
#include "mtl_lut_texture.hpp"
|
||||
#include "mtl_command_encoder.hpp"
|
||||
#include "mtl_depth_stencil_cache.hpp"
|
||||
#include "mtl_draw_pipeline_cache.hpp"
|
||||
#include "mtl_lut_texture.hpp"
|
||||
#include "mtl_render_target.hpp"
|
||||
#include "mtl_texture.hpp"
|
||||
#include "mtl_vertex_buffer_cache.hpp"
|
||||
#include "renderer.hpp"
|
||||
|
||||
|
||||
// HACK: use the OpenGL cache
|
||||
#include "../renderer_gl/surface_cache.hpp"
|
||||
|
@ -72,7 +73,7 @@ class RendererMTL final : public Renderer {
|
|||
|
||||
// Pipelines
|
||||
MTL::RenderPipelineState* displayPipeline;
|
||||
//MTL::RenderPipelineState* copyToLutTexturePipeline;
|
||||
// MTL::RenderPipelineState* copyToLutTexturePipeline;
|
||||
|
||||
// Clears
|
||||
std::map<MTL::Texture*, Color4> colorClearOps;
|
||||
|
@ -101,7 +102,9 @@ class RendererMTL final : public Renderer {
|
|||
}
|
||||
}
|
||||
|
||||
void beginRenderPassIfNeeded(MTL::RenderPassDescriptor* renderPassDescriptor, bool doesClears, MTL::Texture* colorTexture, MTL::Texture* depthTexture = nullptr);
|
||||
void beginRenderPassIfNeeded(
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor, bool doesClears, MTL::Texture* colorTexture, MTL::Texture* depthTexture = nullptr
|
||||
);
|
||||
|
||||
void commitCommandBuffer() {
|
||||
if (renderCommandEncoder) {
|
||||
|
@ -118,8 +121,11 @@ class RendererMTL final : public Renderer {
|
|||
}
|
||||
}
|
||||
|
||||
template<typename AttachmentT, typename ClearDataT, typename GetAttachmentT, typename SetClearDataT>
|
||||
inline void clearAttachment(MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture, ClearDataT clearData, GetAttachmentT getAttachment, SetClearDataT setClearData) {
|
||||
template <typename AttachmentT, typename ClearDataT, typename GetAttachmentT, typename SetClearDataT>
|
||||
inline void clearAttachment(
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture, ClearDataT clearData, GetAttachmentT getAttachment,
|
||||
SetClearDataT setClearData
|
||||
) {
|
||||
bool beginRenderPass = (renderPassDescriptor == nullptr);
|
||||
if (!renderPassDescriptor) {
|
||||
renderPassDescriptor = MTL::RenderPassDescriptor::alloc()->init();
|
||||
|
@ -139,8 +145,11 @@ class RendererMTL final : public Renderer {
|
|||
}
|
||||
}
|
||||
|
||||
template<typename AttachmentT, typename ClearDataT, typename GetAttachmentT, typename SetClearDataT>
|
||||
inline bool clearAttachment(MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture, std::map<MTL::Texture*, ClearDataT>& clearOps, GetAttachmentT getAttachment, SetClearDataT setClearData) {
|
||||
template <typename AttachmentT, typename ClearDataT, typename GetAttachmentT, typename SetClearDataT>
|
||||
inline bool clearAttachment(
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture, std::map<MTL::Texture*, ClearDataT>& clearOps,
|
||||
GetAttachmentT getAttachment, SetClearDataT setClearData
|
||||
) {
|
||||
auto it = clearOps.find(texture);
|
||||
if (it != clearOps.end()) {
|
||||
clearAttachment<AttachmentT>(renderPassDescriptor, texture, it->second, getAttachment, setClearData);
|
||||
|
@ -159,29 +168,40 @@ class RendererMTL final : public Renderer {
|
|||
}
|
||||
|
||||
bool clearColor(MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture) {
|
||||
return clearAttachment<MTL::RenderPassColorAttachmentDescriptor, Color4>(renderPassDescriptor, texture, colorClearOps, [](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->colorAttachments()->object(0); }, [](auto attachment, auto& color) {
|
||||
attachment->setClearColor(MTL::ClearColor(color.r, color.g, color.b, color.a));
|
||||
});
|
||||
return clearAttachment<MTL::RenderPassColorAttachmentDescriptor, Color4>(
|
||||
renderPassDescriptor, texture, colorClearOps,
|
||||
[](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->colorAttachments()->object(0); },
|
||||
[](auto attachment, auto& color) { attachment->setClearColor(MTL::ClearColor(color.r, color.g, color.b, color.a)); }
|
||||
);
|
||||
}
|
||||
|
||||
bool clearDepth(MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture) {
|
||||
return clearAttachment<MTL::RenderPassDepthAttachmentDescriptor, float>(renderPassDescriptor, texture, depthClearOps, [](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->depthAttachment(); }, [](auto attachment, auto& depth) {
|
||||
attachment->setClearDepth(depth);
|
||||
});
|
||||
return clearAttachment<MTL::RenderPassDepthAttachmentDescriptor, float>(
|
||||
renderPassDescriptor, texture, depthClearOps,
|
||||
[](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->depthAttachment(); },
|
||||
[](auto attachment, auto& depth) { attachment->setClearDepth(depth); }
|
||||
);
|
||||
}
|
||||
|
||||
bool clearStencil(MTL::RenderPassDescriptor* renderPassDescriptor, MTL::Texture* texture) {
|
||||
return clearAttachment<MTL::RenderPassStencilAttachmentDescriptor, u8>(renderPassDescriptor, texture, stencilClearOps, [](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->stencilAttachment(); }, [](auto attachment, auto& stencil) {
|
||||
attachment->setClearStencil(stencil);
|
||||
});
|
||||
return clearAttachment<MTL::RenderPassStencilAttachmentDescriptor, u8>(
|
||||
renderPassDescriptor, texture, stencilClearOps,
|
||||
[](MTL::RenderPassDescriptor* renderPassDescriptor) { return renderPassDescriptor->stencilAttachment(); },
|
||||
[](auto attachment, auto& stencil) { attachment->setClearStencil(stencil); }
|
||||
);
|
||||
}
|
||||
|
||||
std::optional<Metal::ColorRenderTarget> getColorRenderTarget(u32 addr, PICA::ColorFmt format, u32 width, u32 height, bool createIfnotFound = true);
|
||||
std::optional<Metal::ColorRenderTarget> getColorRenderTarget(
|
||||
u32 addr, PICA::ColorFmt format, u32 width, u32 height, bool createIfnotFound = true
|
||||
);
|
||||
Metal::DepthStencilRenderTarget& getDepthRenderTarget();
|
||||
Metal::Texture& getTexture(Metal::Texture& tex);
|
||||
void setupTextureEnvState(MTL::RenderCommandEncoder* encoder);
|
||||
void bindTexturesToSlots();
|
||||
void updateLightingLUT(MTL::RenderCommandEncoder* encoder);
|
||||
void updateFogLUT(MTL::RenderCommandEncoder* encoder);
|
||||
void textureCopyImpl(Metal::ColorRenderTarget& srcFramebuffer, Metal::ColorRenderTarget& destFramebuffer, const Math::Rect<u32>& srcRect, const Math::Rect<u32>& destRect);
|
||||
void textureCopyImpl(
|
||||
Metal::ColorRenderTarget& srcFramebuffer, Metal::ColorRenderTarget& destFramebuffer, const Math::Rect<u32>& srcRect,
|
||||
const Math::Rect<u32>& destRect
|
||||
);
|
||||
};
|
||||
|
|
|
@ -12,8 +12,9 @@ static constexpr u32 signExtend3To32(u32 val) {
|
|||
u32 Texture::getTexelETC(bool hasAlpha, u32 u, u32 v, u32 width, std::span<const u8> data) {
|
||||
// Pixel offset of the 8x8 tile based on u, v and the width of the texture
|
||||
u32 offs = ((u & ~7) * 8) + ((v & ~7) * width);
|
||||
if (!hasAlpha)
|
||||
if (!hasAlpha) {
|
||||
offs >>= 1;
|
||||
}
|
||||
|
||||
// In-tile offsets for u/v
|
||||
u &= 7;
|
||||
|
|
|
@ -1,21 +1,23 @@
|
|||
#include <algorithm>
|
||||
|
||||
#include "colour.hpp"
|
||||
#include "renderer_mtl/renderer_mtl.hpp"
|
||||
#include "renderer_mtl/mtl_texture.hpp"
|
||||
#include "renderer_mtl/renderer_mtl.hpp"
|
||||
|
||||
|
||||
using namespace Helpers;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
// Sign-extends the low 3 bits of val to 32 bits: bit 2 acts as the sign bit and bits 3 and above are discarded.
// Example: 0b011 -> 3, 0b100 -> 0xFFFFFFFC (-4), 0b111 -> 0xFFFFFFFF (-1).
static constexpr u32 signExtend3To32(u32 val) {
	// The left shift is done on the unsigned value so that inputs with bits above bit 2 set cannot overflow
	// a signed shift. Only then is the value reinterpreted as signed, so that the right shift copies the
	// sign bit back down (this relies on arithmetic right shift of negative values, as the original did).
	return (u32)(s32(val << 29) >> 29);
}
|
||||
|
||||
u32 Texture::getTexelETC(bool hasAlpha, u32 u, u32 v, u32 width, std::span<const u8> data) {
|
||||
u32 Texture::getTexelETC(bool hasAlpha, u32 u, u32 v, u32 width, std::span<const u8> data) {
|
||||
// Pixel offset of the 8x8 tile based on u, v and the width of the texture
|
||||
u32 offs = ((u & ~7) * 8) + ((v & ~7) * width);
|
||||
if (!hasAlpha)
|
||||
if (!hasAlpha) {
|
||||
offs >>= 1;
|
||||
}
|
||||
|
||||
// In-tile offsets for u/v
|
||||
u &= 7;
|
||||
|
@ -38,26 +40,18 @@ u32 Texture::getTexelETC(bool hasAlpha, u32 u, u32 v, u32 width, std::span<const
|
|||
// First 64 bits of the 4x4 subtile are alpha data
|
||||
const u64 alphaData = *ptr++;
|
||||
alpha = Colour::convert4To8Bit((alphaData >> (4 * (u * 4 + v))) & 0xf);
|
||||
}
|
||||
else {
|
||||
} else {
|
||||
alpha = 0xff; // ETC1 without alpha uses ff for every pixel
|
||||
}
|
||||
|
||||
// Next 64 bits of the subtile are colour data
|
||||
u64 colourData = *ptr;
|
||||
return decodeETC(alpha, u, v, colourData);
|
||||
}
|
||||
}
|
||||
|
||||
u32 Texture::decodeETC(u32 alpha, u32 u, u32 v, u64 colourData) {
|
||||
u32 Texture::decodeETC(u32 alpha, u32 u, u32 v, u64 colourData) {
|
||||
static constexpr u32 modifiers[8][2] = {
|
||||
{ 2, 8 },
|
||||
{ 5, 17 },
|
||||
{ 9, 29 },
|
||||
{ 13, 42 },
|
||||
{ 18, 60 },
|
||||
{ 24, 80 },
|
||||
{ 33, 106 },
|
||||
{ 47, 183 },
|
||||
{2, 8}, {5, 17}, {9, 29}, {13, 42}, {18, 60}, {24, 80}, {33, 106}, {47, 183},
|
||||
};
|
||||
|
||||
// Parse colour data for 4x4 block
|
||||
|
@ -71,8 +65,7 @@ u32 Texture::decodeETC(u32 alpha, u32 u, u32 v, u64 colourData) {
|
|||
const u32 tableIndex2 = getBits<34, 3, u32>(colourData);
|
||||
const u32 texelIndex = u * 4 + v; // Index of the texel in the block
|
||||
|
||||
if (flip)
|
||||
std::swap(u, v);
|
||||
if (flip) std::swap(u, v);
|
||||
|
||||
s32 r, g, b;
|
||||
if (diffMode) {
|
||||
|
@ -119,6 +112,5 @@ u32 Texture::decodeETC(u32 alpha, u32 u, u32 v, u64 colourData) {
|
|||
b = std::clamp(b + modifier, 0, 255);
|
||||
|
||||
return (alpha << 24) | (u32(b) << 16) | (u32(g) << 8) | u32(r);
|
||||
}
|
||||
|
||||
}
|
||||
} // namespace Metal
|
||||
|
|
|
@ -1,32 +1,27 @@
|
|||
#include "renderer_mtl/renderer_mtl.hpp"
|
||||
|
||||
namespace Metal {
|
||||
static constexpr u32 LAYER_COUNT = 1024;
|
||||
|
||||
constexpr u32 LAYER_COUNT = 1024;
|
||||
|
||||
LutTexture::LutTexture(MTL::Device* device, MTL::TextureType type, MTL::PixelFormat pixelFormat, u32 width, u32 height, const char* name) {
|
||||
LutTexture::LutTexture(MTL::Device* device, MTL::TextureType type, MTL::PixelFormat pixelFormat, u32 width, u32 height, const char* name) {
|
||||
MTL::TextureDescriptor* desc = MTL::TextureDescriptor::alloc()->init();
|
||||
desc->setTextureType(type);
|
||||
desc->setPixelFormat(pixelFormat);
|
||||
desc->setWidth(width);
|
||||
desc->setHeight(height);
|
||||
desc->setArrayLength(LAYER_COUNT);
|
||||
desc->setUsage(MTL::TextureUsageShaderRead/* | MTL::TextureUsageShaderWrite*/);
|
||||
desc->setUsage(MTL::TextureUsageShaderRead /* | MTL::TextureUsageShaderWrite*/);
|
||||
desc->setStorageMode(MTL::StorageModeShared);
|
||||
|
||||
texture = device->newTexture(desc);
|
||||
texture->setLabel(toNSString(name));
|
||||
desc->release();
|
||||
}
|
||||
}
|
||||
|
||||
LutTexture::~LutTexture() {
|
||||
texture->release();
|
||||
}
|
||||
LutTexture::~LutTexture() { texture->release(); }
|
||||
|
||||
u32 LutTexture::getNextIndex() {
|
||||
u32 LutTexture::getNextIndex() {
|
||||
currentIndex = (currentIndex + 1) % LAYER_COUNT;
|
||||
|
||||
return currentIndex;
|
||||
}
|
||||
|
||||
}
|
||||
} // namespace Metal
|
||||
|
|
|
@ -1,13 +1,15 @@
|
|||
#include "renderer_mtl/mtl_texture.hpp"
|
||||
#include "renderer_mtl/objc_helper.hpp"
|
||||
#include "colour.hpp"
|
||||
|
||||
#include <array>
|
||||
|
||||
#include "colour.hpp"
|
||||
#include "renderer_mtl/objc_helper.hpp"
|
||||
|
||||
|
||||
using namespace Helpers;
|
||||
|
||||
namespace Metal {
|
||||
|
||||
void Texture::allocate() {
|
||||
void Texture::allocate() {
|
||||
formatInfo = PICA::getPixelFormatInfo(format);
|
||||
|
||||
MTL::TextureDescriptor* descriptor = MTL::TextureDescriptor::alloc()->init();
|
||||
|
@ -18,14 +20,16 @@ void Texture::allocate() {
|
|||
descriptor->setUsage(MTL::TextureUsageShaderRead);
|
||||
descriptor->setStorageMode(MTL::StorageModeShared); // TODO: use private + staging buffers?
|
||||
texture = device->newTexture(descriptor);
|
||||
texture->setLabel(toNSString("Texture " + std::string(PICA::textureFormatToString(format)) + " " + std::to_string(size.u()) + "x" + std::to_string(size.v())));
|
||||
texture->setLabel(toNSString(
|
||||
"Texture " + std::string(PICA::textureFormatToString(format)) + " " + std::to_string(size.u()) + "x" + std::to_string(size.v())
|
||||
));
|
||||
descriptor->release();
|
||||
|
||||
setNewConfig(config);
|
||||
}
|
||||
}
|
||||
|
||||
// Set the texture's configuration, which includes min/mag filters, wrapping S/T modes, and so on
|
||||
void Texture::setNewConfig(u32 cfg) {
|
||||
// Set the texture's configuration, which includes min/mag filters, wrapping S/T modes, and so on
|
||||
void Texture::setNewConfig(u32 cfg) {
|
||||
config = cfg;
|
||||
|
||||
if (sampler) {
|
||||
|
@ -46,9 +50,9 @@ void Texture::setNewConfig(u32 cfg) {
|
|||
samplerDescriptor->setLabel(toNSString("Sampler"));
|
||||
sampler = device->newSamplerState(samplerDescriptor);
|
||||
samplerDescriptor->release();
|
||||
}
|
||||
}
|
||||
|
||||
void Texture::free() {
|
||||
void Texture::free() {
|
||||
valid = false;
|
||||
|
||||
if (texture) {
|
||||
|
@ -57,9 +61,9 @@ void Texture::free() {
|
|||
if (sampler) {
|
||||
sampler->release();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
u64 Texture::sizeInBytes() {
|
||||
u64 Texture::sizeInBytes() {
|
||||
u64 pixelCount = u64(size.x()) * u64(size.y());
|
||||
|
||||
switch (format) {
|
||||
|
@ -73,17 +77,14 @@ u64 Texture::sizeInBytes() {
|
|||
case PICA::TextureFmt::RGB565:
|
||||
case PICA::TextureFmt::RGBA4:
|
||||
case PICA::TextureFmt::RG8:
|
||||
case PICA::TextureFmt::IA8:
|
||||
return pixelCount * 2;
|
||||
case PICA::TextureFmt::IA8: return pixelCount * 2;
|
||||
|
||||
case PICA::TextureFmt::A8: // 1 byte per pixel
|
||||
case PICA::TextureFmt::I8:
|
||||
case PICA::TextureFmt::IA4:
|
||||
return pixelCount;
|
||||
case PICA::TextureFmt::IA4: return pixelCount;
|
||||
|
||||
case PICA::TextureFmt::I4: // 4 bits per pixel
|
||||
case PICA::TextureFmt::A4:
|
||||
return pixelCount / 2;
|
||||
case PICA::TextureFmt::A4: return pixelCount / 2;
|
||||
|
||||
case PICA::TextureFmt::ETC1: // Compressed formats
|
||||
case PICA::TextureFmt::ETC1A4: {
|
||||
|
@ -94,41 +95,40 @@ u64 Texture::sizeInBytes() {
|
|||
return tileCount * tileSize;
|
||||
}
|
||||
|
||||
default:
|
||||
Helpers::panic("[PICA] Attempted to get size of invalid texture type");
|
||||
default: Helpers::panic("[PICA] Attempted to get size of invalid texture type");
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// u and v are the UVs of the relevant texel
|
||||
// Texture data is stored interleaved in Morton order, ie in a Z - order curve as shown here
|
||||
// https://en.wikipedia.org/wiki/Z-order_curve
|
||||
// Textures are split into 8x8 tiles.This function returns the in - tile offset depending on the u & v of the texel
|
||||
// The in - tile offset is the sum of 2 offsets, one depending on the value of u % 8 and the other on the value of y % 8
|
||||
// As documented in this picture https ://en.wikipedia.org/wiki/File:Moser%E2%80%93de_Bruijn_addition.svg
|
||||
u32 Texture::mortonInterleave(u32 u, u32 v) {
|
||||
static constexpr u32 xOffsets[] = { 0, 1, 4, 5, 16, 17, 20, 21 };
|
||||
static constexpr u32 yOffsets[] = { 0, 2, 8, 10, 32, 34, 40, 42 };
|
||||
// u and v are the UVs of the relevant texel
|
||||
// Texture data is stored interleaved in Morton order, ie in a Z - order curve as shown here
|
||||
// https://en.wikipedia.org/wiki/Z-order_curve
|
||||
// Textures are split into 8x8 tiles.This function returns the in - tile offset depending on the u & v of the texel
|
||||
// The in - tile offset is the sum of 2 offsets, one depending on the value of u % 8 and the other on the value of y % 8
|
||||
// As documented in this picture https ://en.wikipedia.org/wiki/File:Moser%E2%80%93de_Bruijn_addition.svg
|
||||
u32 Texture::mortonInterleave(u32 u, u32 v) {
|
||||
static constexpr u32 xOffsets[] = {0, 1, 4, 5, 16, 17, 20, 21};
|
||||
static constexpr u32 yOffsets[] = {0, 2, 8, 10, 32, 34, 40, 42};
|
||||
|
||||
return xOffsets[u & 7] + yOffsets[v & 7];
|
||||
}
|
||||
}
|
||||
|
||||
// Get the byte offset of texel (u, v) in the texture
|
||||
u32 Texture::getSwizzledOffset(u32 u, u32 v, u32 width, u32 bytesPerPixel) {
|
||||
// Get the byte offset of texel (u, v) in the texture
|
||||
u32 Texture::getSwizzledOffset(u32 u, u32 v, u32 width, u32 bytesPerPixel) {
|
||||
u32 offset = ((u & ~7) * 8) + ((v & ~7) * width); // Offset of the 8x8 tile the texel belongs to
|
||||
offset += mortonInterleave(u, v); // Add the in-tile offset of the texel
|
||||
|
||||
return offset * bytesPerPixel;
|
||||
}
|
||||
}
|
||||
|
||||
// Same as the above code except we need to divide by 2 because 4 bits is smaller than a byte
|
||||
u32 Texture::getSwizzledOffset_4bpp(u32 u, u32 v, u32 width) {
|
||||
// Same as the above code except we need to divide by 2 because 4 bits is smaller than a byte
|
||||
u32 Texture::getSwizzledOffset_4bpp(u32 u, u32 v, u32 width) {
|
||||
u32 offset = ((u & ~7) * 8) + ((v & ~7) * width); // Offset of the 8x8 tile the texel belongs to
|
||||
offset += mortonInterleave(u, v); // Add the in-tile offset of the texel
|
||||
|
||||
return offset / 2;
|
||||
}
|
||||
}
|
||||
|
||||
u8 Texture::decodeTexelU8(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
u8 Texture::decodeTexelU8(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
switch (fmt) {
|
||||
case PICA::TextureFmt::A4: {
|
||||
const u32 offset = getSwizzledOffset_4bpp(u, v, size.u());
|
||||
|
@ -149,12 +149,11 @@ u8 Texture::decodeTexelU8(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8
|
|||
return alpha;
|
||||
}
|
||||
|
||||
default:
|
||||
Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
default: Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
u16 Texture::decodeTexelU16(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
u16 Texture::decodeTexelU16(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
switch (fmt) {
|
||||
case PICA::TextureFmt::RG8: {
|
||||
u32 offset = getSwizzledOffset(u, v, size.u(), 2);
|
||||
|
@ -225,12 +224,11 @@ u16 Texture::decodeTexelU16(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const
|
|||
return (intensity << 12) | (intensity << 8) | (intensity << 4) | 0xff;
|
||||
}
|
||||
|
||||
default:
|
||||
Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
default: Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
u32 Texture::decodeTexelU32(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
u32 Texture::decodeTexelU32(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const u8> data) {
|
||||
switch (fmt) {
|
||||
case PICA::TextureFmt::RGB8: {
|
||||
const u32 offset = getSwizzledOffset(u, v, size.u(), 3);
|
||||
|
@ -275,12 +273,11 @@ u32 Texture::decodeTexelU32(u32 u, u32 v, PICA::TextureFmt fmt, std::span<const
|
|||
case PICA::TextureFmt::ETC1: return getTexelETC(false, u, v, size.u(), data);
|
||||
case PICA::TextureFmt::ETC1A4: return getTexelETC(true, u, v, size.u(), data);
|
||||
|
||||
default:
|
||||
Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
default: Helpers::panic("[Texture::DecodeTexel] Unimplemented format = %d", static_cast<int>(fmt));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void Texture::decodeTexture(std::span<const u8> data) {
|
||||
void Texture::decodeTexture(std::span<const u8> data) {
|
||||
std::vector<u8> decoded;
|
||||
decoded.reserve(u64(size.u()) * u64(size.v()) * formatInfo.bytesPerTexel);
|
||||
|
||||
|
@ -307,6 +304,5 @@ void Texture::decodeTexture(std::span<const u8> data) {
|
|||
}
|
||||
|
||||
texture->replaceRegion(MTL::Region(0, 0, size.u(), size.v()), 0, 0, decoded.data(), formatInfo.bytesPerTexel * size.u(), 0);
|
||||
}
|
||||
|
||||
}
|
||||
} // namespace Metal
|
||||
|
|
|
@ -2,9 +2,10 @@
|
|||
|
||||
#include <cmrc/cmrc.hpp>
|
||||
#include <cstddef>
|
||||
|
||||
#include "renderer_mtl/mtl_lut_texture.hpp"
|
||||
|
||||
// HACK
|
||||
// Hack: Apple annoyingly defines a global "NO" macro which ends up conflicting with our own code...
|
||||
#undef NO
|
||||
|
||||
#include "PICA/gpu.hpp"
|
||||
|
@ -14,8 +15,10 @@ using namespace PICA;
|
|||
|
||||
CMRC_DECLARE(RendererMTL);
|
||||
|
||||
const u16 LIGHTING_LUT_TEXTURE_WIDTH = 256;
|
||||
const u32 FOG_LUT_TEXTURE_WIDTH = 128;
|
||||
static constexpr u16 LIGHTING_LUT_TEXTURE_WIDTH = 256;
|
||||
static constexpr u32 FOG_LUT_TEXTURE_WIDTH = 128;
|
||||
// Bind the vertex buffer to binding 30 so that it doesn't occupy the lower indices
|
||||
static constexpr uint VERTEX_BUFFER_BINDING_INDEX = 30;
|
||||
|
||||
// HACK: redefinition...
|
||||
PICA::ColorFmt ToColorFormat(u32 format) {
|
||||
|
@ -40,6 +43,7 @@ MTL::Library* loadLibrary(MTL::Device* device, const cmrc::file& shaderSource) {
|
|||
|
||||
RendererMTL::RendererMTL(GPU& gpu, const std::array<u32, regNum>& internalRegs, const std::array<u32, extRegNum>& externalRegs)
|
||||
: Renderer(gpu, internalRegs, externalRegs) {}
|
||||
|
||||
RendererMTL::~RendererMTL() {}
|
||||
|
||||
void RendererMTL::reset() {
|
||||
|
@ -78,7 +82,7 @@ void RendererMTL::display() {
|
|||
clearColor(nullptr, bottomScreen->get().texture);
|
||||
}
|
||||
|
||||
// -------- Draw --------
|
||||
// Draw
|
||||
commandBuffer->pushDebugGroup(toNSString("Display"));
|
||||
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor = MTL::RenderPassDescriptor::alloc()->init();
|
||||
|
@ -130,8 +134,6 @@ void RendererMTL::initGraphicsContext(SDL_Window* window) {
|
|||
metalLayer->setDevice(device);
|
||||
commandQueue = device->newCommandQueue();
|
||||
|
||||
// -------- Objects --------
|
||||
|
||||
// Textures
|
||||
MTL::TextureDescriptor* textureDescriptor = MTL::TextureDescriptor::alloc()->init();
|
||||
textureDescriptor->setTextureType(MTL::TextureType2D);
|
||||
|
@ -157,7 +159,9 @@ void RendererMTL::initGraphicsContext(SDL_Window* window) {
|
|||
|
||||
samplerDescriptor->release();
|
||||
|
||||
lutLightingTexture = new Metal::LutTexture(device, MTL::TextureType2DArray, MTL::PixelFormatR16Unorm, LIGHTING_LUT_TEXTURE_WIDTH, Lights::LUT_Count, "Lighting LUT texture");
|
||||
lutLightingTexture = new Metal::LutTexture(
|
||||
device, MTL::TextureType2DArray, MTL::PixelFormatR16Unorm, LIGHTING_LUT_TEXTURE_WIDTH, Lights::LUT_Count, "Lighting LUT texture"
|
||||
);
|
||||
lutFogTexture = new Metal::LutTexture(device, MTL::TextureType1DArray, MTL::PixelFormatRG32Float, FOG_LUT_TEXTURE_WIDTH, 1, "Fog LUT texture");
|
||||
|
||||
// -------- Pipelines --------
|
||||
|
@ -166,7 +170,7 @@ void RendererMTL::initGraphicsContext(SDL_Window* window) {
|
|||
auto mtlResources = cmrc::RendererMTL::get_filesystem();
|
||||
library = loadLibrary(device, mtlResources.open("metal_shaders.metallib"));
|
||||
MTL::Library* blitLibrary = loadLibrary(device, mtlResources.open("metal_blit.metallib"));
|
||||
//MTL::Library* copyToLutTextureLibrary = loadLibrary(device, mtlResources.open("metal_copy_to_lut_texture.metallib"));
|
||||
// MTL::Library* copyToLutTextureLibrary = loadLibrary(device, mtlResources.open("metal_copy_to_lut_texture.metallib"));
|
||||
|
||||
// Display
|
||||
MTL::Function* vertexDisplayFunction = library->newFunction(NS::String::string("vertexDisplay", NS::ASCIIStringEncoding));
|
||||
|
@ -295,9 +299,8 @@ void RendererMTL::initGraphicsContext(SDL_Window* window) {
|
|||
defaultDepthStencilState = device->newDepthStencilState(depthStencilDescriptor);
|
||||
depthStencilDescriptor->release();
|
||||
|
||||
// Release
|
||||
blitLibrary->release();
|
||||
//copyToLutTextureLibrary->release();
|
||||
// copyToLutTextureLibrary->release();
|
||||
}
|
||||
|
||||
void RendererMTL::clearBuffer(u32 startAddress, u32 endAddress, u32 value, u32 control) {
|
||||
|
@ -592,8 +595,7 @@ void RendererMTL::deinitGraphicsContext() {
|
|||
delete lutLightingTexture;
|
||||
delete lutFogTexture;
|
||||
|
||||
// Release
|
||||
//copyToLutTexturePipeline->release();
|
||||
// copyToLutTexturePipeline->release();
|
||||
displayPipeline->release();
|
||||
defaultDepthStencilState->release();
|
||||
nullTexture->release();
|
||||
|
@ -736,7 +738,9 @@ void RendererMTL::updateLightingLUT(MTL::RenderCommandEncoder* encoder) {
|
|||
}
|
||||
|
||||
u32 index = lutLightingTexture->getNextIndex();
|
||||
lutLightingTexture->getTexture()->replaceRegion(MTL::Region(0, 0, LIGHTING_LUT_TEXTURE_WIDTH, Lights::LUT_Count), 0, index, lightingLut.data(), LIGHTING_LUT_TEXTURE_WIDTH * 2, 0);
|
||||
lutLightingTexture->getTexture()->replaceRegion(
|
||||
MTL::Region(0, 0, LIGHTING_LUT_TEXTURE_WIDTH, Lights::LUT_Count), 0, index, lightingLut.data(), LIGHTING_LUT_TEXTURE_WIDTH * 2, 0
|
||||
);
|
||||
|
||||
/*
|
||||
endRenderPass();
|
||||
|
@ -768,7 +772,7 @@ void RendererMTL::updateLightingLUT(MTL::RenderCommandEncoder* encoder) {
|
|||
void RendererMTL::updateFogLUT(MTL::RenderCommandEncoder* encoder) {
|
||||
gpu.fogLUTDirty = false;
|
||||
|
||||
std::array<float, FOG_LUT_TEXTURE_WIDTH * 2> fogLut = {0.0f};
|
||||
std::array<float, FOG_LUT_TEXTURE_WIDTH* 2> fogLut = {0.0f};
|
||||
|
||||
for (int i = 0; i < fogLut.size(); i += 2) {
|
||||
const uint32_t value = gpu.fogLUT[i >> 1];
|
||||
|
@ -807,7 +811,8 @@ void RendererMTL::textureCopyImpl(
|
|||
) {
|
||||
nextRenderPassName = "Texture copy";
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor = MTL::RenderPassDescriptor::alloc()->init();
|
||||
// TODO: clearColor sets the load action to load if it didn't find any clear, but that is unnecessary if we are doing a copy to the whole texture
|
||||
// TODO: clearColor sets the load action to load if it didn't find any clear, but that is unnecessary if we are doing a copy to the whole
|
||||
// texture
|
||||
bool doesClear = clearColor(renderPassDescriptor, destFramebuffer.texture);
|
||||
beginRenderPassIfNeeded(renderPassDescriptor, doesClear, destFramebuffer.texture);
|
||||
|
||||
|
@ -819,11 +824,13 @@ void RendererMTL::textureCopyImpl(
|
|||
|
||||
// Viewport
|
||||
renderCommandEncoder->setViewport(MTL::Viewport{
|
||||
double(destRect.left), double(destRect.bottom), double(destRect.right - destRect.left), double(destRect.top - destRect.bottom), 0.0, 1.0
|
||||
});
|
||||
double(destRect.left), double(destRect.bottom), double(destRect.right - destRect.left), double(destRect.top - destRect.bottom), 0.0, 1.0});
|
||||
|
||||
float srcRectNDC[4] = {
|
||||
srcRect.left / (float)srcFramebuffer.size.u(), srcRect.bottom / (float)srcFramebuffer.size.v(),
|
||||
(srcRect.right - srcRect.left) / (float)srcFramebuffer.size.u(), (srcRect.top - srcRect.bottom) / (float)srcFramebuffer.size.v()
|
||||
srcRect.left / (float)srcFramebuffer.size.u(),
|
||||
srcRect.bottom / (float)srcFramebuffer.size.v(),
|
||||
(srcRect.right - srcRect.left) / (float)srcFramebuffer.size.u(),
|
||||
(srcRect.top - srcRect.bottom) / (float)srcFramebuffer.size.v(),
|
||||
};
|
||||
|
||||
// Bind resources
|
||||
|
@ -834,10 +841,13 @@ void RendererMTL::textureCopyImpl(
|
|||
renderCommandEncoder->drawPrimitives(MTL::PrimitiveTypeTriangleStrip, NS::UInteger(0), NS::UInteger(4));
|
||||
}
|
||||
|
||||
void RendererMTL::beginRenderPassIfNeeded(MTL::RenderPassDescriptor* renderPassDescriptor, bool doesClears, MTL::Texture* colorTexture, MTL::Texture* depthTexture) {
|
||||
void RendererMTL::beginRenderPassIfNeeded(
|
||||
MTL::RenderPassDescriptor* renderPassDescriptor, bool doesClears, MTL::Texture* colorTexture, MTL::Texture* depthTexture
|
||||
) {
|
||||
createCommandBufferIfNeeded();
|
||||
|
||||
if (doesClears || !renderCommandEncoder || colorTexture != lastColorTexture || (depthTexture != lastDepthTexture && !(lastDepthTexture && !depthTexture))) {
|
||||
if (doesClears || !renderCommandEncoder || colorTexture != lastColorTexture ||
|
||||
(depthTexture != lastDepthTexture && !(lastDepthTexture && !depthTexture))) {
|
||||
endRenderPass();
|
||||
|
||||
renderCommandEncoder = commandBuffer->renderCommandEncoder(renderPassDescriptor);
|
||||
|
|
Loading…
Add table
Reference in a new issue