#include #include #include "math_util.hpp" #include "renderer.hpp" #include "vk_api.hpp" #include "vk_descriptor_heap.hpp" #include "vk_descriptor_update_batch.hpp" #include "vk_sampler_cache.hpp" class GPU; class RendererVK final : public Renderer { SDL_Window* targetWindow; // The order of these `Unique*` members is important, they will be destroyed in RAII order vk::UniqueInstance instance = {}; vk::UniqueDebugUtilsMessengerEXT debugMessenger = {}; vk::SurfaceKHR swapchainSurface = {}; vk::PhysicalDevice physicalDevice = {}; vk::UniqueDevice device = {}; vk::Queue presentQueue = {}; u32 presentQueueFamily = ~0u; vk::Queue graphicsQueue = {}; u32 graphicsQueueFamily = ~0u; vk::Queue computeQueue = {}; u32 computeQueueFamily = ~0u; vk::Queue transferQueue = {}; u32 transferQueueFamily = ~0u; vk::UniqueCommandPool commandPool = {}; vk::UniqueSwapchainKHR swapchain = {}; u32 swapchainImageCount = ~0u; std::vector swapchainImages = {}; std::vector swapchainImageViews = {}; // This value is the degree of parallelism to allow multiple frames to be in-flight // aka: "double-buffer"/"triple-buffering" // Todo: make this a configuration option static constexpr usize frameBufferingCount = 3; // Frame-buffering data // Each vector is `frameBufferingCount` in size std::vector swapImageFreeSemaphore = {}; std::vector renderFinishedSemaphore = {}; std::vector frameFinishedFences = {}; std::vector> frameFramebuffers = {}; std::vector frameCommandBuffers = {}; const vk::CommandBuffer& getCurrentCommandBuffer() const { return frameCommandBuffers[frameBufferingIndex].get(); } // Todo: // Use `{colourBuffer,depthBuffer}Loc` to maintain an std::map-cache of framebuffers struct Texture { u32 loc = 0; u32 sizePerPixel = 0; std::array size = {}; vk::Format format; vk::UniqueImage image; vk::UniqueDeviceMemory imageMemory; vk::UniqueImageView imageView; Math::Rect getSubRect(u32 inputAddress, u32 width, u32 height) { // PICA textures have top-left origin, same as Vulkan const u32 startOffset = (inputAddress - loc) / sizePerPixel; const u32 x0 = (startOffset % (size[0] * 8)) / 8; const u32 y0 = (startOffset / (size[0] * 8)) * 8; return Math::Rect{x0, y0, x0 + width, y0 + height}; } }; // Hash(loc, size, format) -> Texture std::map textureCache; Texture* findRenderTexture(u32 addr); Texture& getColorRenderTexture(u32 addr, PICA::ColorFmt format, u32 width, u32 height); Texture& getDepthRenderTexture(u32 addr, PICA::DepthFmt format, u32 width, u32 height); // Framebuffer for the top/bottom image std::vector screenTexture = {}; std::vector screenTextureViews = {}; std::vector screenTextureFramebuffers = {}; vk::UniqueDeviceMemory framebufferMemory = {}; std::map renderPassCache; vk::RenderPass getRenderPass(vk::Format colorFormat, std::optional depthFormat); vk::RenderPass getRenderPass(PICA::ColorFmt colorFormat, std::optional depthFormat); std::unique_ptr descriptorUpdateBatch; std::unique_ptr samplerCache; // Display pipeline data std::unique_ptr displayDescriptorHeap; vk::UniquePipeline displayPipeline; vk::UniquePipelineLayout displayPipelineLayout; std::vector topDisplayPipelineDescriptorSet; std::vector bottomDisplayPipelineDescriptorSet; // Recreate the swapchain, possibly re-using the old one in the case of a resize vk::Result recreateSwapchain(vk::SurfaceKHR surface, vk::Extent2D swapchainExtent); u64 frameBufferingIndex = 0; public: RendererVK(GPU& gpu, const std::array& internalRegs, const std::array& externalRegs); ~RendererVK() override; void reset() override; void display() override; void initGraphicsContext(SDL_Window* window) override; void clearBuffer(u32 startAddress, u32 endAddress, u32 value, u32 control) override; void displayTransfer(u32 inputAddr, u32 outputAddr, u32 inputSize, u32 outputSize, u32 flags) override; void textureCopy(u32 inputAddr, u32 outputAddr, u32 totalBytes, u32 inputSize, u32 outputSize, u32 flags) override; void drawVertices(PICA::PrimType primType, std::span vertices) override; void screenshot(const std::string& name) override; void deinitGraphicsContext() override; };