summaryrefslogtreecommitdiffstats
path: root/drivers/vulkan
diff options
context:
space:
mode:
author: Rémi Verschelde <rverschelde@gmail.com>, 2023-06-01 00:40:33 +0200
committer: Rémi Verschelde <rverschelde@gmail.com>, 2023-06-01 00:40:33 +0200
commit: 3dd0307f3fd8efd45057b62dfa14b45e6db0ce49 (patch)
tree: 0e9cc470880939297d845b3c59933eefbfc7ad35 /drivers/vulkan
parent: bb58eb6a9463ca7c07e5d4e36f32fe9641bb21d2 (diff)
parent: dded713dc0b808561da8754c384af826a749539e (diff)
download: redot-engine-3dd0307f3fd8efd45057b62dfa14b45e6db0ce49.tar.gz
Merge pull request #76348 from warriormaster12/pipeline-cache
Implement Vulkan pipeline caching
Diffstat (limited to 'drivers/vulkan')
-rw-r--r-- drivers/vulkan/rendering_device_vulkan.cpp | 138
-rw-r--r-- drivers/vulkan/rendering_device_vulkan.h | 26
2 files changed, 162 insertions, 2 deletions
diff --git a/drivers/vulkan/rendering_device_vulkan.cpp b/drivers/vulkan/rendering_device_vulkan.cpp
index a72252b3e1..4e43c14476 100644
--- a/drivers/vulkan/rendering_device_vulkan.cpp
+++ b/drivers/vulkan/rendering_device_vulkan.cpp
@@ -32,6 +32,7 @@
#include "core/config/project_settings.h"
#include "core/io/compression.h"
+#include "core/io/dir_access.h"
#include "core/io/file_access.h"
#include "core/io/marshalls.h"
#include "core/os/os.h"
@@ -6398,9 +6399,13 @@ RID RenderingDeviceVulkan::render_pipeline_create(RID p_shader, FramebufferForma
graphics_pipeline_create_info.basePipelineIndex = 0;
RenderPipeline pipeline;
- VkResult err = vkCreateGraphicsPipelines(device, VK_NULL_HANDLE, 1, &graphics_pipeline_create_info, nullptr, &pipeline.pipeline);
+ VkResult err = vkCreateGraphicsPipelines(device, pipelines_cache.cache_object, 1, &graphics_pipeline_create_info, nullptr, &pipeline.pipeline);
ERR_FAIL_COND_V_MSG(err, RID(), "vkCreateGraphicsPipelines failed with error " + itos(err) + " for shader '" + shader->name + "'.");
+ if (pipelines_cache.cache_object != VK_NULL_HANDLE) {
+ _update_pipeline_cache();
+ }
+
pipeline.set_formats = shader->set_formats;
pipeline.push_constant_stages_mask = shader->push_constant.vk_stages_mask;
pipeline.pipeline_layout = shader->pipeline_layout;
@@ -6513,9 +6518,13 @@ RID RenderingDeviceVulkan::compute_pipeline_create(RID p_shader, const Vector<Pi
}
ComputePipeline pipeline;
- VkResult err = vkCreateComputePipelines(device, VK_NULL_HANDLE, 1, &compute_pipeline_create_info, nullptr, &pipeline.pipeline);
+ VkResult err = vkCreateComputePipelines(device, pipelines_cache.cache_object, 1, &compute_pipeline_create_info, nullptr, &pipeline.pipeline);
ERR_FAIL_COND_V_MSG(err, RID(), "vkCreateComputePipelines failed with error " + itos(err) + ".");
+ if (pipelines_cache.cache_object != VK_NULL_HANDLE) {
+ _update_pipeline_cache();
+ }
+
pipeline.set_formats = shader->set_formats;
pipeline.push_constant_stages_mask = shader->push_constant.vk_stages_mask;
pipeline.pipeline_layout = shader->pipeline_layout;
@@ -8965,6 +8974,128 @@ void RenderingDeviceVulkan::initialize(VulkanContext *p_context, bool p_local_de
draw_list_split = false;
compute_list = nullptr;
+ _load_pipeline_cache();
+ print_verbose(vformat("Startup PSO cache (%.1f MiB)", pipelines_cache.buffer.size() / (1024.0f * 1024.0f)));
+ VkPipelineCacheCreateInfo cache_info = {};
+ cache_info.sType = VK_STRUCTURE_TYPE_PIPELINE_CACHE_CREATE_INFO;
+ cache_info.pNext = nullptr;
+ cache_info.flags = 0;
+ cache_info.initialDataSize = pipelines_cache.buffer.size();
+ cache_info.pInitialData = pipelines_cache.buffer.ptr();
+ VkResult err = vkCreatePipelineCache(device, &cache_info, nullptr, &pipelines_cache.cache_object);
+
+ if (err != VK_SUCCESS) {
+ WARN_PRINT("vkCreatePipelinecache failed with error " + itos(err) + ".");
+ }
+}
+
+// Loads the on-disk pipeline cache ("user://vulkan/pipelines.cache") into
+// `pipelines_cache.buffer`, creating the "user://vulkan/" directory first when
+// it does not exist yet.
+//
+// The file is a PipelineCacheHeader followed by the raw cache payload. A file
+// that cannot be read, is not larger than the header, or carries the wrong
+// magic number is ignored with a warning. A payload whose header does not
+// match the payload hash/size or the current physical device is discarded
+// (buffer cleared, `current_size` reset to 0).
+void RenderingDeviceVulkan::_load_pipeline_cache() {
+	// Make sure the directory that holds the cache file exists.
+	if (!DirAccess::exists("user://vulkan/")) {
+		Ref<DirAccess> user_dir = DirAccess::create(DirAccess::ACCESS_USERDATA);
+		if (user_dir.is_valid()) {
+			user_dir->make_dir_recursive("user://vulkan/");
+		}
+	}
+
+	// Nothing to load on a first run.
+	if (!FileAccess::exists("user://vulkan/pipelines.cache")) {
+		return;
+	}
+
+	Error read_error;
+	Vector<uint8_t> raw_file = FileAccess::get_file_as_bytes("user://vulkan/pipelines.cache", &read_error);
+	if (read_error != OK || raw_file.size() <= (int)sizeof(PipelineCacheHeader)) {
+		WARN_PRINT("Invalid/corrupt pipelines cache.");
+		return;
+	}
+
+	// The header sits at the very start of the file.
+	PipelineCacheHeader header = {};
+	memcpy((char *)&header, raw_file.ptr(), sizeof(PipelineCacheHeader));
+	if (header.magic != 868 + VK_PIPELINE_CACHE_HEADER_VERSION_ONE) {
+		WARN_PRINT("Invalid pipelines cache magic number.");
+		return;
+	}
+
+	// Everything after the header is the cache payload.
+	pipelines_cache.buffer.resize(raw_file.size() - sizeof(PipelineCacheHeader));
+	memcpy(pipelines_cache.buffer.ptrw(), raw_file.ptr() + sizeof(PipelineCacheHeader), pipelines_cache.buffer.size());
+
+	VkPhysicalDeviceProperties props;
+	vkGetPhysicalDeviceProperties(context->get_physical_device(), &props);
+
+	// The stored UUID has to match the device's pipeline cache UUID byte for byte.
+	bool uuid_matches = true;
+	for (size_t i = 0; uuid_matches && i < VK_UUID_SIZE; i++) {
+		uuid_matches = header.uuid[i] == props.pipelineCacheUUID[i];
+	}
+
+	const bool header_matches = header.data_hash == hash_murmur3_buffer(pipelines_cache.buffer.ptr(), pipelines_cache.buffer.size()) && header.data_size == (uint32_t)pipelines_cache.buffer.size() && header.vendor_id == props.vendorID && header.device_id == props.deviceID && header.driver_abi == sizeof(void *) && uuid_matches;
+	if (header_matches) {
+		pipelines_cache.current_size = pipelines_cache.buffer.size();
+	} else {
+		WARN_PRINT("Invalid pipelines cache header.");
+		pipelines_cache.current_size = 0;
+		pipelines_cache.buffer.clear();
+	}
+}
+
+// Decides whether the Vulkan pipeline cache needs to be written to disk and,
+// if so, schedules `_save_pipeline_cache_threaded` on the WorkerThreadPool.
+//
+// p_closing: true when called from finalize(). The save-chunk-size threshold
+// is then ignored and the save is waited on before returning. When false, a
+// save is only scheduled once the cache has grown by at least the
+// "save_chunk_size_mb" project setting and no earlier save is still running.
+void RenderingDeviceVulkan::_update_pipeline_cache(bool p_closing) {
+	if (p_closing && pipelines_cache_save_task != WorkerThreadPool::INVALID_TASK_ID) {
+		// Settle any earlier save before going further: it writes the same file
+		// and `pipelines_cache` fields that are read below, and the cache
+		// object is destroyed right after this call during finalize().
+		WorkerThreadPool::get_singleton()->wait_for_task_completion(pipelines_cache_save_task);
+		pipelines_cache_save_task = WorkerThreadPool::INVALID_TASK_ID;
+	}
+
+	size_t pso_blob_size = 0;
+	float save_interval = GLOBAL_GET("rendering/rendering_device/pipeline_cache/save_chunk_size_mb");
+	// With a null data pointer this only queries the current blob size.
+	VkResult vr = vkGetPipelineCacheData(device, pipelines_cache.cache_object, &pso_blob_size, nullptr);
+	ERR_FAIL_COND(vr);
+	// Growth since the last load/save, in whole MiB.
+	// NOTE(review): this is an unsigned subtraction; if `current_size` is ever
+	// larger than the blob size it wraps around and the threshold check below
+	// passes. Confirm whether that is intended.
+	size_t difference = (pso_blob_size - pipelines_cache.current_size) / (1024 * 1024);
+
+	if (p_closing && Engine::get_singleton()->is_editor_hint()) {
+		// This is mostly for the editor to check if after playing the game, game's pipeline cache size still matches with editor's cache.
+		_load_pipeline_cache();
+		if (pipelines_cache.current_size > pso_blob_size) {
+			pso_blob_size = pipelines_cache.current_size;
+		}
+	}
+
+	if (pso_blob_size == pipelines_cache.current_size) {
+		// Nothing new to persist.
+		return;
+	}
+	if (difference < save_interval && !p_closing) {
+		// Not enough growth yet to justify a write.
+		return;
+	}
+
+	if (p_closing) {
+		// Final save: run it and block until it is on disk.
+		pipelines_cache_save_task = WorkerThreadPool::get_singleton()->add_template_task(this, &RenderingDeviceVulkan::_save_pipeline_cache_threaded, pso_blob_size, false, "PipelineCacheSave");
+		WorkerThreadPool::get_singleton()->wait_for_task_completion(pipelines_cache_save_task);
+		pipelines_cache_save_task = WorkerThreadPool::INVALID_TASK_ID;
+	} else if (pipelines_cache_save_task == WorkerThreadPool::INVALID_TASK_ID || WorkerThreadPool::get_singleton()->is_task_completed(pipelines_cache_save_task)) {
+		// Background save; skipped while a previous one is still running.
+		pipelines_cache_save_task = WorkerThreadPool::get_singleton()->add_template_task(this, &RenderingDeviceVulkan::_save_pipeline_cache_threaded, pso_blob_size, false, "PipelineCacheSave");
+	}
+}
+
+// Fetches the pipeline cache blob from the driver and writes it, preceded by a
+// PipelineCacheHeader, to "user://vulkan/pipelines.cache". Scheduled as a
+// WorkerThreadPool task by `_update_pipeline_cache`.
+//
+// p_pso_blob_size: number of bytes to request from the driver.
+void RenderingDeviceVulkan::_save_pipeline_cache_threaded(size_t p_pso_blob_size) {
+	pipelines_cache.buffer.clear();
+	pipelines_cache.buffer.resize(p_pso_blob_size);
+	// On input the size is the buffer capacity; on return the driver overwrites
+	// it with the number of bytes it actually wrote.
+	VkResult vr = vkGetPipelineCacheData(device, pipelines_cache.cache_object, &p_pso_blob_size, pipelines_cache.buffer.ptrw());
+	ERR_FAIL_COND(vr);
+	// Keep only the bytes the driver produced, and record the new size only
+	// now that the fetch succeeded, so a failed fetch does not make later
+	// updates believe the cache is already saved.
+	pipelines_cache.buffer.resize(p_pso_blob_size);
+	pipelines_cache.current_size = p_pso_blob_size;
+	print_verbose(vformat("Updated PSO cache (%.1f MiB)", p_pso_blob_size / (1024.0f * 1024.0f)));
+
+	// Describe the payload and the device it belongs to, so that
+	// `_load_pipeline_cache` can reject a stale or foreign file.
+	VkPhysicalDeviceProperties props;
+	vkGetPhysicalDeviceProperties(context->get_physical_device(), &props);
+	PipelineCacheHeader header = {};
+	header.magic = 868 + VK_PIPELINE_CACHE_HEADER_VERSION_ONE;
+	header.data_size = pipelines_cache.buffer.size();
+	header.data_hash = hash_murmur3_buffer(pipelines_cache.buffer.ptr(), pipelines_cache.buffer.size());
+	header.device_id = props.deviceID;
+	header.vendor_id = props.vendorID;
+	header.driver_version = props.driverVersion;
+	for (size_t i = 0; i < VK_UUID_SIZE; i++) {
+		header.uuid[i] = props.pipelineCacheUUID[i];
+	}
+	header.driver_abi = sizeof(void *);
+
+	Ref<FileAccess> f = FileAccess::open("user://vulkan/pipelines.cache", FileAccess::WRITE, nullptr);
+	// Report a cache file that cannot be opened instead of silently skipping the write.
+	ERR_FAIL_COND(!f.is_valid());
+	f->store_buffer((const uint8_t *)&header, sizeof(PipelineCacheHeader));
+	f->store_buffer(pipelines_cache.buffer);
}
template <class T>
@@ -9340,6 +9471,9 @@ void RenderingDeviceVulkan::finalize() {
vkDestroyCommandPool(device, frames[i].command_pool, nullptr);
vkDestroyQueryPool(device, frames[i].timestamp_pool, nullptr);
}
+ _update_pipeline_cache(true);
+
+ vkDestroyPipelineCache(device, pipelines_cache.cache_object, nullptr);
for (int i = 0; i < split_draw_list_allocators.size(); i++) {
vkDestroyCommandPool(device, split_draw_list_allocators[i].command_pool, nullptr);
diff --git a/drivers/vulkan/rendering_device_vulkan.h b/drivers/vulkan/rendering_device_vulkan.h
index 4150e0a8e6..6e61ee890d 100644
--- a/drivers/vulkan/rendering_device_vulkan.h
+++ b/drivers/vulkan/rendering_device_vulkan.h
@@ -31,6 +31,7 @@
#ifndef RENDERING_DEVICE_VULKAN_H
#define RENDERING_DEVICE_VULKAN_H
+#include "core/object/worker_thread_pool.h"
#include "core/os/thread_safe.h"
#include "core/templates/local_vector.h"
#include "core/templates/oa_hash_map.h"
@@ -792,6 +793,31 @@ class RenderingDeviceVulkan : public RenderingDevice {
RID_Owner<RenderPipeline, true> render_pipeline_owner;
+ // Header stored at the start of "user://vulkan/pipelines.cache", directly
+ // followed by the pipeline cache payload. It is written and read back as raw
+ // bytes (sizeof(PipelineCacheHeader)), so changing the field order, types or
+ // count changes the file format.
+ struct PipelineCacheHeader {
+ // Format tag; set to 868 + VK_PIPELINE_CACHE_HEADER_VERSION_ONE on save.
+ uint32_t magic;
+ // Size in bytes of the payload that follows the header.
+ uint32_t data_size;
+ // hash_murmur3_buffer() of the payload.
+ uint64_t data_hash;
+ // vendorID / deviceID / driverVersion from VkPhysicalDeviceProperties.
+ // driver_version is stored but not compared when the file is loaded.
+ uint32_t vendor_id;
+ uint32_t device_id;
+ uint32_t driver_version;
+ // Copy of VkPhysicalDeviceProperties::pipelineCacheUUID.
+ uint8_t uuid[VK_UUID_SIZE];
+ // sizeof(void *) of the build that wrote the file.
+ uint8_t driver_abi;
+ };
+
+ // In-memory state of the Vulkan pipeline cache.
+ struct PipelineCache {
+ // Payload size in bytes as of the last load or save; compared against the
+ // driver-reported blob size to decide whether a new save is needed.
+ size_t current_size = 0;
+ // Raw cache payload (without the file header): filled from disk on load
+ // and from vkGetPipelineCacheData() on save.
+ Vector<uint8_t> buffer;
+ // Vulkan handle passed to pipeline creation; VK_NULL_HANDLE until created.
+ VkPipelineCache cache_object = VK_NULL_HANDLE;
+ };
+
+ // The device's pipeline cache state.
+ PipelineCache pipelines_cache;
+
+ // WorkerThreadPool task of the most recently scheduled cache save, or
+ // INVALID_TASK_ID when none has been scheduled.
+ WorkerThreadPool::TaskID pipelines_cache_save_task = WorkerThreadPool::INVALID_TASK_ID;
+
+ // Reads "user://vulkan/pipelines.cache" into pipelines_cache.
+ void _load_pipeline_cache();
+ // Schedules a cache save when needed; p_closing forces and waits for it.
+ void _update_pipeline_cache(bool p_closing = false);
+ // Task body: fetches the cache blob from the driver and writes it to disk.
+ void _save_pipeline_cache_threaded(size_t pso_blob_size);
+
struct ComputePipeline {
RID shader;
Vector<uint32_t> set_formats;