diff options
| author | 2021-06-16 21:14:57 -0300 | |
|---|---|---|
| committer | 2021-07-22 21:51:38 -0400 | |
| commit | ca67077ca87772b4b4ac61d08f5b2c60616348e0 (patch) | |
| tree | 2a861de6f5be92cbed1542f115a99e646a1793c9 /src/video_core/vulkan_common | |
| parent | glsl: Fix cbuf component indexing bug fallback (diff) | |
| download | yuzu-ca67077ca87772b4b4ac61d08f5b2c60616348e0.tar.gz yuzu-ca67077ca87772b4b4ac61d08f5b2c60616348e0.tar.xz yuzu-ca67077ca87772b4b4ac61d08f5b2c60616348e0.zip | |
vk_graphics_pipeline: Use VK_KHR_push_descriptor when available
~51% faster on Nvidia compared to previous method.
Diffstat (limited to 'src/video_core/vulkan_common')
| -rw-r--r-- | src/video_core/vulkan_common/vulkan_device.cpp | 11 | ||||
| -rw-r--r-- | src/video_core/vulkan_common/vulkan_device.h | 12 | ||||
| -rw-r--r-- | src/video_core/vulkan_common/vulkan_wrapper.cpp | 1 | ||||
| -rw-r--r-- | src/video_core/vulkan_common/vulkan_wrapper.h | 31 |
4 files changed, 43 insertions, 12 deletions
diff --git a/src/video_core/vulkan_common/vulkan_device.cpp b/src/video_core/vulkan_common/vulkan_device.cpp index 0d8c6cd08..9d918de8d 100644 --- a/src/video_core/vulkan_common/vulkan_device.cpp +++ b/src/video_core/vulkan_common/vulkan_device.cpp | |||
| @@ -767,6 +767,7 @@ std::vector<const char*> Device::LoadExtensions(bool requires_surface) { | |||
| 767 | test(khr_uniform_buffer_standard_layout, | 767 | test(khr_uniform_buffer_standard_layout, |
| 768 | VK_KHR_UNIFORM_BUFFER_STANDARD_LAYOUT_EXTENSION_NAME, true); | 768 | VK_KHR_UNIFORM_BUFFER_STANDARD_LAYOUT_EXTENSION_NAME, true); |
| 769 | test(khr_spirv_1_4, VK_KHR_SPIRV_1_4_EXTENSION_NAME, true); | 769 | test(khr_spirv_1_4, VK_KHR_SPIRV_1_4_EXTENSION_NAME, true); |
| 770 | test(khr_push_descriptor, VK_KHR_PUSH_DESCRIPTOR_EXTENSION_NAME, true); | ||
| 770 | test(has_khr_shader_float16_int8, VK_KHR_SHADER_FLOAT16_INT8_EXTENSION_NAME, false); | 771 | test(has_khr_shader_float16_int8, VK_KHR_SHADER_FLOAT16_INT8_EXTENSION_NAME, false); |
| 771 | test(ext_depth_range_unrestricted, VK_EXT_DEPTH_RANGE_UNRESTRICTED_EXTENSION_NAME, true); | 772 | test(ext_depth_range_unrestricted, VK_EXT_DEPTH_RANGE_UNRESTRICTED_EXTENSION_NAME, true); |
| 772 | test(ext_index_type_uint8, VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME, true); | 773 | test(ext_index_type_uint8, VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME, true); |
| @@ -932,6 +933,16 @@ std::vector<const char*> Device::LoadExtensions(bool requires_surface) { | |||
| 932 | khr_workgroup_memory_explicit_layout = true; | 933 | khr_workgroup_memory_explicit_layout = true; |
| 933 | } | 934 | } |
| 934 | } | 935 | } |
| 936 | if (khr_push_descriptor) { | ||
| 937 | VkPhysicalDevicePushDescriptorPropertiesKHR push_descriptor; | ||
| 938 | push_descriptor.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PUSH_DESCRIPTOR_PROPERTIES_KHR; | ||
| 939 | push_descriptor.pNext = nullptr; | ||
| 940 | |||
| 941 | physical_properties.pNext = &push_descriptor; | ||
| 942 | physical.GetProperties2KHR(physical_properties); | ||
| 943 | |||
| 944 | max_push_descriptors = push_descriptor.maxPushDescriptors; | ||
| 945 | } | ||
| 935 | return extensions; | 946 | return extensions; |
| 936 | } | 947 | } |
| 937 | 948 | ||
diff --git a/src/video_core/vulkan_common/vulkan_device.h b/src/video_core/vulkan_common/vulkan_device.h index 4fda472b0..49605752d 100644 --- a/src/video_core/vulkan_common/vulkan_device.h +++ b/src/video_core/vulkan_common/vulkan_device.h | |||
| @@ -154,6 +154,11 @@ public: | |||
| 154 | return guest_warp_stages & stage; | 154 | return guest_warp_stages & stage; |
| 155 | } | 155 | } |
| 156 | 156 | ||
| 157 | /// Returns the maximum number of push descriptors. | ||
| 158 | u32 MaxPushDescriptors() const { | ||
| 159 | return max_push_descriptors; | ||
| 160 | } | ||
| 161 | |||
| 157 | /// Returns true if formatless image load is supported. | 162 | /// Returns true if formatless image load is supported. |
| 158 | bool IsFormatlessImageLoadSupported() const { | 163 | bool IsFormatlessImageLoadSupported() const { |
| 159 | return is_formatless_image_load_supported; | 164 | return is_formatless_image_load_supported; |
| @@ -194,6 +199,11 @@ public: | |||
| 194 | return khr_spirv_1_4; | 199 | return khr_spirv_1_4; |
| 195 | } | 200 | } |
| 196 | 201 | ||
| 202 | /// Returns true if the device supports VK_KHR_push_descriptor. | ||
| 203 | bool IsKhrPushDescriptorSupported() const { | ||
| 204 | return khr_push_descriptor; | ||
| 205 | } | ||
| 206 | |||
| 197 | /// Returns true if the device supports VK_KHR_workgroup_memory_explicit_layout. | 207 | /// Returns true if the device supports VK_KHR_workgroup_memory_explicit_layout. |
| 198 | bool IsKhrWorkgroupMemoryExplicitLayoutSupported() const { | 208 | bool IsKhrWorkgroupMemoryExplicitLayoutSupported() const { |
| 199 | return khr_workgroup_memory_explicit_layout; | 209 | return khr_workgroup_memory_explicit_layout; |
| @@ -330,6 +340,7 @@ private: | |||
| 330 | VkDriverIdKHR driver_id{}; ///< Driver ID. | 340 | VkDriverIdKHR driver_id{}; ///< Driver ID. |
| 331 | VkShaderStageFlags guest_warp_stages{}; ///< Stages where the guest warp size can be forced. | 341 | VkShaderStageFlags guest_warp_stages{}; ///< Stages where the guest warp size can be forced. |
| 332 | u64 device_access_memory{}; ///< Total size of device local memory in bytes. | 342 | u64 device_access_memory{}; ///< Total size of device local memory in bytes. |
| 343 | u32 max_push_descriptors{}; ///< Maximum number of push descriptors | ||
| 333 | bool is_optimal_astc_supported{}; ///< Support for native ASTC. | 344 | bool is_optimal_astc_supported{}; ///< Support for native ASTC. |
| 334 | bool is_float16_supported{}; ///< Support for float16 arithmetics. | 345 | bool is_float16_supported{}; ///< Support for float16 arithmetics. |
| 335 | bool is_warp_potentially_bigger{}; ///< Host warp size can be bigger than guest. | 346 | bool is_warp_potentially_bigger{}; ///< Host warp size can be bigger than guest. |
| @@ -345,6 +356,7 @@ private: | |||
| 345 | bool khr_uniform_buffer_standard_layout{}; ///< Support for scalar uniform buffer layouts. | 356 | bool khr_uniform_buffer_standard_layout{}; ///< Support for scalar uniform buffer layouts. |
| 346 | bool khr_spirv_1_4{}; ///< Support for VK_KHR_spirv_1_4. | 357 | bool khr_spirv_1_4{}; ///< Support for VK_KHR_spirv_1_4. |
| 347 | bool khr_workgroup_memory_explicit_layout{}; ///< Support for explicit workgroup layouts. | 358 | bool khr_workgroup_memory_explicit_layout{}; ///< Support for explicit workgroup layouts. |
| 359 | bool khr_push_descriptor{}; ///< Support for VK_KHR_push_descriptor. | ||
| 348 | bool ext_index_type_uint8{}; ///< Support for VK_EXT_index_type_uint8. | 360 | bool ext_index_type_uint8{}; ///< Support for VK_EXT_index_type_uint8. |
| 349 | bool ext_sampler_filter_minmax{}; ///< Support for VK_EXT_sampler_filter_minmax. | 361 | bool ext_sampler_filter_minmax{}; ///< Support for VK_EXT_sampler_filter_minmax. |
| 350 | bool ext_depth_range_unrestricted{}; ///< Support for VK_EXT_depth_range_unrestricted. | 362 | bool ext_depth_range_unrestricted{}; ///< Support for VK_EXT_depth_range_unrestricted. |
diff --git a/src/video_core/vulkan_common/vulkan_wrapper.cpp b/src/video_core/vulkan_common/vulkan_wrapper.cpp index 7e13ae8af..d7e9fac22 100644 --- a/src/video_core/vulkan_common/vulkan_wrapper.cpp +++ b/src/video_core/vulkan_common/vulkan_wrapper.cpp | |||
| @@ -103,6 +103,7 @@ void Load(VkDevice device, DeviceDispatch& dld) noexcept { | |||
| 103 | X(vkCmdFillBuffer); | 103 | X(vkCmdFillBuffer); |
| 104 | X(vkCmdPipelineBarrier); | 104 | X(vkCmdPipelineBarrier); |
| 105 | X(vkCmdPushConstants); | 105 | X(vkCmdPushConstants); |
| 106 | X(vkCmdPushDescriptorSetWithTemplateKHR); | ||
| 106 | X(vkCmdSetBlendConstants); | 107 | X(vkCmdSetBlendConstants); |
| 107 | X(vkCmdSetDepthBias); | 108 | X(vkCmdSetDepthBias); |
| 108 | X(vkCmdSetDepthBounds); | 109 | X(vkCmdSetDepthBounds); |
diff --git a/src/video_core/vulkan_common/vulkan_wrapper.h b/src/video_core/vulkan_common/vulkan_wrapper.h index 6e5be1186..d43b606f1 100644 --- a/src/video_core/vulkan_common/vulkan_wrapper.h +++ b/src/video_core/vulkan_common/vulkan_wrapper.h | |||
| @@ -193,15 +193,16 @@ struct DeviceDispatch : InstanceDispatch { | |||
| 193 | PFN_vkBeginCommandBuffer vkBeginCommandBuffer{}; | 193 | PFN_vkBeginCommandBuffer vkBeginCommandBuffer{}; |
| 194 | PFN_vkBindBufferMemory vkBindBufferMemory{}; | 194 | PFN_vkBindBufferMemory vkBindBufferMemory{}; |
| 195 | PFN_vkBindImageMemory vkBindImageMemory{}; | 195 | PFN_vkBindImageMemory vkBindImageMemory{}; |
| 196 | PFN_vkCmdBeginDebugUtilsLabelEXT vkCmdBeginDebugUtilsLabelEXT{}; | ||
| 196 | PFN_vkCmdBeginQuery vkCmdBeginQuery{}; | 197 | PFN_vkCmdBeginQuery vkCmdBeginQuery{}; |
| 197 | PFN_vkCmdBeginRenderPass vkCmdBeginRenderPass{}; | 198 | PFN_vkCmdBeginRenderPass vkCmdBeginRenderPass{}; |
| 198 | PFN_vkCmdBeginTransformFeedbackEXT vkCmdBeginTransformFeedbackEXT{}; | 199 | PFN_vkCmdBeginTransformFeedbackEXT vkCmdBeginTransformFeedbackEXT{}; |
| 199 | PFN_vkCmdBeginDebugUtilsLabelEXT vkCmdBeginDebugUtilsLabelEXT{}; | ||
| 200 | PFN_vkCmdBindDescriptorSets vkCmdBindDescriptorSets{}; | 200 | PFN_vkCmdBindDescriptorSets vkCmdBindDescriptorSets{}; |
| 201 | PFN_vkCmdBindIndexBuffer vkCmdBindIndexBuffer{}; | 201 | PFN_vkCmdBindIndexBuffer vkCmdBindIndexBuffer{}; |
| 202 | PFN_vkCmdBindPipeline vkCmdBindPipeline{}; | 202 | PFN_vkCmdBindPipeline vkCmdBindPipeline{}; |
| 203 | PFN_vkCmdBindTransformFeedbackBuffersEXT vkCmdBindTransformFeedbackBuffersEXT{}; | 203 | PFN_vkCmdBindTransformFeedbackBuffersEXT vkCmdBindTransformFeedbackBuffersEXT{}; |
| 204 | PFN_vkCmdBindVertexBuffers vkCmdBindVertexBuffers{}; | 204 | PFN_vkCmdBindVertexBuffers vkCmdBindVertexBuffers{}; |
| 205 | PFN_vkCmdBindVertexBuffers2EXT vkCmdBindVertexBuffers2EXT{}; | ||
| 205 | PFN_vkCmdBlitImage vkCmdBlitImage{}; | 206 | PFN_vkCmdBlitImage vkCmdBlitImage{}; |
| 206 | PFN_vkCmdClearAttachments vkCmdClearAttachments{}; | 207 | PFN_vkCmdClearAttachments vkCmdClearAttachments{}; |
| 207 | PFN_vkCmdCopyBuffer vkCmdCopyBuffer{}; | 208 | PFN_vkCmdCopyBuffer vkCmdCopyBuffer{}; |
| @@ -211,35 +212,35 @@ struct DeviceDispatch : InstanceDispatch { | |||
| 211 | PFN_vkCmdDispatch vkCmdDispatch{}; | 212 | PFN_vkCmdDispatch vkCmdDispatch{}; |
| 212 | PFN_vkCmdDraw vkCmdDraw{}; | 213 | PFN_vkCmdDraw vkCmdDraw{}; |
| 213 | PFN_vkCmdDrawIndexed vkCmdDrawIndexed{}; | 214 | PFN_vkCmdDrawIndexed vkCmdDrawIndexed{}; |
| 215 | PFN_vkCmdEndDebugUtilsLabelEXT vkCmdEndDebugUtilsLabelEXT{}; | ||
| 214 | PFN_vkCmdEndQuery vkCmdEndQuery{}; | 216 | PFN_vkCmdEndQuery vkCmdEndQuery{}; |
| 215 | PFN_vkCmdEndRenderPass vkCmdEndRenderPass{}; | 217 | PFN_vkCmdEndRenderPass vkCmdEndRenderPass{}; |
| 216 | PFN_vkCmdEndTransformFeedbackEXT vkCmdEndTransformFeedbackEXT{}; | 218 | PFN_vkCmdEndTransformFeedbackEXT vkCmdEndTransformFeedbackEXT{}; |
| 217 | PFN_vkCmdEndDebugUtilsLabelEXT vkCmdEndDebugUtilsLabelEXT{}; | ||
| 218 | PFN_vkCmdFillBuffer vkCmdFillBuffer{}; | 219 | PFN_vkCmdFillBuffer vkCmdFillBuffer{}; |
| 219 | PFN_vkCmdPipelineBarrier vkCmdPipelineBarrier{}; | 220 | PFN_vkCmdPipelineBarrier vkCmdPipelineBarrier{}; |
| 220 | PFN_vkCmdPushConstants vkCmdPushConstants{}; | 221 | PFN_vkCmdPushConstants vkCmdPushConstants{}; |
| 222 | PFN_vkCmdPushDescriptorSetWithTemplateKHR vkCmdPushDescriptorSetWithTemplateKHR{}; | ||
| 223 | PFN_vkCmdResolveImage vkCmdResolveImage{}; | ||
| 221 | PFN_vkCmdSetBlendConstants vkCmdSetBlendConstants{}; | 224 | PFN_vkCmdSetBlendConstants vkCmdSetBlendConstants{}; |
| 225 | PFN_vkCmdSetCullModeEXT vkCmdSetCullModeEXT{}; | ||
| 222 | PFN_vkCmdSetDepthBias vkCmdSetDepthBias{}; | 226 | PFN_vkCmdSetDepthBias vkCmdSetDepthBias{}; |
| 223 | PFN_vkCmdSetDepthBounds vkCmdSetDepthBounds{}; | 227 | PFN_vkCmdSetDepthBounds vkCmdSetDepthBounds{}; |
| 224 | PFN_vkCmdSetEvent vkCmdSetEvent{}; | ||
| 225 | PFN_vkCmdSetScissor vkCmdSetScissor{}; | ||
| 226 | PFN_vkCmdSetStencilCompareMask vkCmdSetStencilCompareMask{}; | ||
| 227 | PFN_vkCmdSetStencilReference vkCmdSetStencilReference{}; | ||
| 228 | PFN_vkCmdSetStencilWriteMask vkCmdSetStencilWriteMask{}; | ||
| 229 | PFN_vkCmdSetViewport vkCmdSetViewport{}; | ||
| 230 | PFN_vkCmdWaitEvents vkCmdWaitEvents{}; | ||
| 231 | PFN_vkCmdBindVertexBuffers2EXT vkCmdBindVertexBuffers2EXT{}; | ||
| 232 | PFN_vkCmdSetCullModeEXT vkCmdSetCullModeEXT{}; | ||
| 233 | PFN_vkCmdSetDepthBoundsTestEnableEXT vkCmdSetDepthBoundsTestEnableEXT{}; | 228 | PFN_vkCmdSetDepthBoundsTestEnableEXT vkCmdSetDepthBoundsTestEnableEXT{}; |
| 234 | PFN_vkCmdSetDepthCompareOpEXT vkCmdSetDepthCompareOpEXT{}; | 229 | PFN_vkCmdSetDepthCompareOpEXT vkCmdSetDepthCompareOpEXT{}; |
| 235 | PFN_vkCmdSetDepthTestEnableEXT vkCmdSetDepthTestEnableEXT{}; | 230 | PFN_vkCmdSetDepthTestEnableEXT vkCmdSetDepthTestEnableEXT{}; |
| 236 | PFN_vkCmdSetDepthWriteEnableEXT vkCmdSetDepthWriteEnableEXT{}; | 231 | PFN_vkCmdSetDepthWriteEnableEXT vkCmdSetDepthWriteEnableEXT{}; |
| 232 | PFN_vkCmdSetEvent vkCmdSetEvent{}; | ||
| 237 | PFN_vkCmdSetFrontFaceEXT vkCmdSetFrontFaceEXT{}; | 233 | PFN_vkCmdSetFrontFaceEXT vkCmdSetFrontFaceEXT{}; |
| 238 | PFN_vkCmdSetPrimitiveTopologyEXT vkCmdSetPrimitiveTopologyEXT{}; | 234 | PFN_vkCmdSetPrimitiveTopologyEXT vkCmdSetPrimitiveTopologyEXT{}; |
| 235 | PFN_vkCmdSetScissor vkCmdSetScissor{}; | ||
| 236 | PFN_vkCmdSetStencilCompareMask vkCmdSetStencilCompareMask{}; | ||
| 239 | PFN_vkCmdSetStencilOpEXT vkCmdSetStencilOpEXT{}; | 237 | PFN_vkCmdSetStencilOpEXT vkCmdSetStencilOpEXT{}; |
| 238 | PFN_vkCmdSetStencilReference vkCmdSetStencilReference{}; | ||
| 240 | PFN_vkCmdSetStencilTestEnableEXT vkCmdSetStencilTestEnableEXT{}; | 239 | PFN_vkCmdSetStencilTestEnableEXT vkCmdSetStencilTestEnableEXT{}; |
| 240 | PFN_vkCmdSetStencilWriteMask vkCmdSetStencilWriteMask{}; | ||
| 241 | PFN_vkCmdSetVertexInputEXT vkCmdSetVertexInputEXT{}; | 241 | PFN_vkCmdSetVertexInputEXT vkCmdSetVertexInputEXT{}; |
| 242 | PFN_vkCmdResolveImage vkCmdResolveImage{}; | 242 | PFN_vkCmdSetViewport vkCmdSetViewport{}; |
| 243 | PFN_vkCmdWaitEvents vkCmdWaitEvents{}; | ||
| 243 | PFN_vkCreateBuffer vkCreateBuffer{}; | 244 | PFN_vkCreateBuffer vkCreateBuffer{}; |
| 244 | PFN_vkCreateBufferView vkCreateBufferView{}; | 245 | PFN_vkCreateBufferView vkCreateBufferView{}; |
| 245 | PFN_vkCreateCommandPool vkCreateCommandPool{}; | 246 | PFN_vkCreateCommandPool vkCreateCommandPool{}; |
| @@ -990,6 +991,12 @@ public: | |||
| 990 | dynamic_offsets.size(), dynamic_offsets.data()); | 991 | dynamic_offsets.size(), dynamic_offsets.data()); |
| 991 | } | 992 | } |
| 992 | 993 | ||
| 994 | void PushDescriptorSetWithTemplateKHR(VkDescriptorUpdateTemplateKHR update_template, | ||
| 995 | VkPipelineLayout layout, u32 set, | ||
| 996 | const void* data) const noexcept { | ||
| 997 | dld->vkCmdPushDescriptorSetWithTemplateKHR(handle, update_template, layout, set, data); | ||
| 998 | } | ||
| 999 | |||
| 993 | void BindPipeline(VkPipelineBindPoint bind_point, VkPipeline pipeline) const noexcept { | 1000 | void BindPipeline(VkPipelineBindPoint bind_point, VkPipeline pipeline) const noexcept { |
| 994 | dld->vkCmdBindPipeline(handle, bind_point, pipeline); | 1001 | dld->vkCmdBindPipeline(handle, bind_point, pipeline); |
| 995 | } | 1002 | } |