// Copyright 2018 yuzu Emulator Project // Licensed under GPLv2 or any later version // Refer to the license.txt file included. #include #include #include #include #include #include "common/assert.h" #include "video_core/renderer_vulkan/declarations.h" #include "video_core/renderer_vulkan/vk_device.h" namespace Vulkan { namespace { template void SetNext(void**& next, T& data) { *next = &data; next = &data.pNext; } template T GetFeatures(vk::PhysicalDevice physical, vk::DispatchLoaderDynamic dldi) { vk::PhysicalDeviceFeatures2 features; T extension_features; features.pNext = &extension_features; physical.getFeatures2(&features, dldi); return extension_features; } } // Anonymous namespace namespace Alternatives { constexpr std::array Depth24UnormS8Uint = {vk::Format::eD32SfloatS8Uint, vk::Format::eD16UnormS8Uint, vk::Format{}}; constexpr std::array Depth16UnormS8Uint = {vk::Format::eD24UnormS8Uint, vk::Format::eD32SfloatS8Uint, vk::Format{}}; constexpr std::array Astc = {vk::Format::eA8B8G8R8UnormPack32, vk::Format{}}; } // namespace Alternatives constexpr const vk::Format* GetFormatAlternatives(vk::Format format) { switch (format) { case vk::Format::eD24UnormS8Uint: return Alternatives::Depth24UnormS8Uint.data(); case vk::Format::eD16UnormS8Uint: return Alternatives::Depth16UnormS8Uint.data(); default: return nullptr; } } constexpr vk::FormatFeatureFlags GetFormatFeatures(vk::FormatProperties properties, FormatType format_type) { switch (format_type) { case FormatType::Linear: return properties.linearTilingFeatures; case FormatType::Optimal: return properties.optimalTilingFeatures; case FormatType::Buffer: return properties.bufferFeatures; default: return {}; } } VKDevice::VKDevice(const vk::DispatchLoaderDynamic& dldi, vk::PhysicalDevice physical, vk::SurfaceKHR surface) : physical{physical}, format_properties{GetFormatProperties(dldi, physical)} { SetupFamilies(dldi, surface); SetupProperties(dldi); SetupFeatures(dldi); } VKDevice::~VKDevice() = default; bool VKDevice::Create(const vk::DispatchLoaderDynamic& dldi, vk::Instance instance) { const auto queue_cis = GetDeviceQueueCreateInfos(); const std::vector extensions = LoadExtensions(dldi); vk::PhysicalDeviceFeatures2 features2; void** next = &features2.pNext; auto& features = features2.features; features.vertexPipelineStoresAndAtomics = true; features.independentBlend = true; features.depthClamp = true; features.samplerAnisotropy = true; features.largePoints = true; features.textureCompressionASTC_LDR = is_optimal_astc_supported; vk::PhysicalDeviceVertexAttributeDivisorFeaturesEXT vertex_divisor; vertex_divisor.vertexAttributeInstanceRateDivisor = true; vertex_divisor.vertexAttributeInstanceRateZeroDivisor = true; SetNext(next, vertex_divisor); vk::PhysicalDeviceFloat16Int8FeaturesKHR float16_int8; if (is_float16_supported) { float16_int8.shaderFloat16 = true; SetNext(next, float16_int8); } else { LOG_INFO(Render_Vulkan, "Device doesn't support float16 natively"); } vk::PhysicalDeviceUniformBufferStandardLayoutFeaturesKHR std430_layout; if (khr_uniform_buffer_standard_layout) { std430_layout.uniformBufferStandardLayout = true; SetNext(next, std430_layout); } else { LOG_INFO(Render_Vulkan, "Device doesn't support packed UBOs"); } vk::PhysicalDeviceIndexTypeUint8FeaturesEXT index_type_uint8; if (ext_index_type_uint8) { index_type_uint8.indexTypeUint8 = true; SetNext(next, index_type_uint8); } else { LOG_INFO(Render_Vulkan, "Device doesn't support uint8 indexes"); } vk::DeviceCreateInfo device_ci({}, static_cast(queue_cis.size()), queue_cis.data(), 0, nullptr, static_cast(extensions.size()), extensions.data(), nullptr); device_ci.pNext = &features2; vk::Device dummy_logical; if (physical.createDevice(&device_ci, nullptr, &dummy_logical, dldi) != vk::Result::eSuccess) { LOG_CRITICAL(Render_Vulkan, "Logical device failed to be created!"); return false; } dld.init(instance, dldi.vkGetInstanceProcAddr, dummy_logical, dldi.vkGetDeviceProcAddr); logical = UniqueDevice( dummy_logical, vk::ObjectDestroy(nullptr, dld)); if (khr_driver_properties) { vk::PhysicalDeviceDriverPropertiesKHR driver; vk::PhysicalDeviceProperties2 properties; properties.pNext = &driver; physical.getProperties2(&properties, dld); driver_id = driver.driverID; LOG_INFO(Render_Vulkan, "Driver: {} {}", driver.driverName, driver.driverInfo); } else { LOG_INFO(Render_Vulkan, "Driver: Unknown"); } graphics_queue = logical->getQueue(graphics_family, 0, dld); present_queue = logical->getQueue(present_family, 0, dld); return true; } vk::Format VKDevice::GetSupportedFormat(vk::Format wanted_format, vk::FormatFeatureFlags wanted_usage, FormatType format_type) const { if (IsFormatSupported(wanted_format, wanted_usage, format_type)) { return wanted_format; } // The wanted format is not supported by hardware, search for alternatives const vk::Format* alternatives = GetFormatAlternatives(wanted_format); if (alternatives == nullptr) { UNREACHABLE_MSG("Format={} with usage={} and type={} has no defined alternatives and host " "hardware does not support it", vk::to_string(wanted_format), vk::to_string(wanted_usage), static_cast(format_type)); return wanted_format; } std::size_t i = 0; for (vk::Format alternative = alternatives[0]; alternative != vk::Format{}; alternative = alternatives[++i]) { if (!IsFormatSupported(alternative, wanted_usage, format_type)) { continue; } LOG_WARNING(Render_Vulkan, "Emulating format={} with alternative format={} with usage={} and type={}", static_cast(wanted_format), static_cast(alternative), static_cast(wanted_usage), static_cast(format_type)); return alternative; } // No alternatives found, panic UNREACHABLE_MSG("Format={} with usage={} and type={} is not supported by the host hardware and " "doesn't support any of the alternatives", static_cast(wanted_format), static_cast(wanted_usage), static_cast(format_type)); return wanted_format; } bool VKDevice::IsOptimalAstcSupported(const vk::PhysicalDeviceFeatures& features, const vk::DispatchLoaderDynamic& dldi) const { if (!features.textureCompressionASTC_LDR) { return false; } const auto format_feature_usage{ vk::FormatFeatureFlagBits::eSampledImage | vk::FormatFeatureFlagBits::eBlitSrc | vk::FormatFeatureFlagBits::eBlitDst | vk::FormatFeatureFlagBits::eTransferSrc | vk::FormatFeatureFlagBits::eTransferDst}; constexpr std::array astc_formats = { vk::Format::eAstc4x4UnormBlock, vk::Format::eAstc4x4SrgbBlock, vk::Format::eAstc8x8SrgbBlock, vk::Format::eAstc8x6SrgbBlock, vk::Format::eAstc5x4SrgbBlock, vk::Format::eAstc5x5UnormBlock, vk::Format::eAstc5x5SrgbBlock, vk::Format::eAstc10x8UnormBlock, vk::Format::eAstc10x8SrgbBlock}; for (const auto format : astc_formats) { const auto format_properties{physical.getFormatProperties(format, dldi)}; if (!(format_properties.optimalTilingFeatures & format_feature_usage)) { return false; } } return true; } bool VKDevice::IsFormatSupported(vk::Format wanted_format, vk::FormatFeatureFlags wanted_usage, FormatType format_type) const { const auto it = format_properties.find(wanted_format); if (it == format_properties.end()) { UNIMPLEMENTED_MSG("Unimplemented format query={}", vk::to_string(wanted_format)); return true; } const auto supported_usage = GetFormatFeatures(it->second, format_type); return (supported_usage & wanted_usage) == wanted_usage; } bool VKDevice::IsSuitable(const vk::DispatchLoaderDynamic& dldi, vk::PhysicalDevice physical, vk::SurfaceKHR surface) { LOG_INFO(Render_Vulkan, "{}", physical.getProperties(dldi).deviceName); bool is_suitable = true; constexpr std::array required_extensions = {VK_KHR_SWAPCHAIN_EXTENSION_NAME, VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME}; std::bitset available_extensions{}; for (const auto& prop : physical.enumerateDeviceExtensionProperties(nullptr, dldi)) { for (std::size_t i = 0; i < required_extensions.size(); ++i) { if (available_extensions[i]) { continue; } available_extensions[i] = required_extensions[i] == std::string_view{prop.extensionName}; } } if (!available_extensions.all()) { for (std::size_t i = 0; i < required_extensions.size(); ++i) { if (available_extensions[i]) { continue; } LOG_INFO(Render_Vulkan, "Missing required extension: {}", required_extensions[i]); is_suitable = false; } } bool has_graphics{}, has_present{}; const auto queue_family_properties = physical.getQueueFamilyProperties(dldi); for (u32 i = 0; i < static_cast(queue_family_properties.size()); ++i) { const auto& family = queue_family_properties[i]; if (family.queueCount == 0) { continue; } has_graphics |= (family.queueFlags & vk::QueueFlagBits::eGraphics) != static_cast(0); has_present |= physical.getSurfaceSupportKHR(i, surface, dldi) != 0; } if (!has_graphics || !has_present) { LOG_INFO(Render_Vulkan, "Device lacks a graphics and present queue"); is_suitable = false; } // TODO(Rodrigo): Check if the device matches all requeriments. const auto properties{physical.getProperties(dldi)}; const auto& limits{properties.limits}; constexpr u32 required_ubo_size = 65536; if (limits.maxUniformBufferRange < required_ubo_size) { LOG_INFO(Render_Vulkan, "Device UBO size {} is too small, {} is required)", limits.maxUniformBufferRange, required_ubo_size); is_suitable = false; } const auto features{physical.getFeatures(dldi)}; const std::array feature_report = { std::make_pair(features.vertexPipelineStoresAndAtomics, "vertexPipelineStoresAndAtomics"), std::make_pair(features.independentBlend, "independentBlend"), std::make_pair(features.depthClamp, "depthClamp"), std::make_pair(features.samplerAnisotropy, "samplerAnisotropy"), std::make_pair(features.largePoints, "largePoints"), }; for (const auto& [supported, name] : feature_report) { if (supported) { continue; } LOG_INFO(Render_Vulkan, "Missing required feature: {}", name); is_suitable = false; } return is_suitable; } std::vector VKDevice::LoadExtensions(const vk::DispatchLoaderDynamic& dldi) { std::vector extensions; extensions.reserve(7); extensions.push_back(VK_KHR_SWAPCHAIN_EXTENSION_NAME); extensions.push_back(VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME); const auto Test = [&](const vk::ExtensionProperties& extension, std::optional> status, const char* name, bool push) { if (extension.extensionName != std::string_view(name)) { return; } if (push) { extensions.push_back(name); } if (status) { status->get() = true; } }; bool khr_shader_float16_int8{}; for (const auto& extension : physical.enumerateDeviceExtensionProperties(nullptr, dldi)) { Test(extension, khr_uniform_buffer_standard_layout, VK_KHR_UNIFORM_BUFFER_STANDARD_LAYOUT_EXTENSION_NAME, true); Test(extension, ext_index_type_uint8, VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME, true); Test(extension, khr_driver_properties, VK_KHR_DRIVER_PROPERTIES_EXTENSION_NAME, true); Test(extension, khr_shader_float16_int8, VK_KHR_SHADER_FLOAT16_INT8_EXTENSION_NAME, false); } if (khr_shader_float16_int8) { is_float16_supported = GetFeatures(physical, dldi).shaderFloat16; extensions.push_back(VK_KHR_SHADER_FLOAT16_INT8_EXTENSION_NAME); } return extensions; } void VKDevice::SetupFamilies(const vk::DispatchLoaderDynamic& dldi, vk::SurfaceKHR surface) { std::optional graphics_family_, present_family_; const auto queue_family_properties = physical.getQueueFamilyProperties(dldi); for (u32 i = 0; i < static_cast(queue_family_properties.size()); ++i) { if (graphics_family_ && present_family_) break; const auto& queue_family = queue_family_properties[i]; if (queue_family.queueCount == 0) continue; if (queue_family.queueFlags & vk::QueueFlagBits::eGraphics) graphics_family_ = i; if (physical.getSurfaceSupportKHR(i, surface, dldi)) present_family_ = i; } ASSERT(graphics_family_ && present_family_); graphics_family = *graphics_family_; present_family = *present_family_; } void VKDevice::SetupProperties(const vk::DispatchLoaderDynamic& dldi) { const auto props = physical.getProperties(dldi); device_type = props.deviceType; uniform_buffer_alignment = static_cast(props.limits.minUniformBufferOffsetAlignment); storage_buffer_alignment = static_cast(props.limits.minStorageBufferOffsetAlignment); max_storage_buffer_range = static_cast(props.limits.maxStorageBufferRange); } void VKDevice::SetupFeatures(const vk::DispatchLoaderDynamic& dldi) { const auto supported_features{physical.getFeatures(dldi)}; is_optimal_astc_supported = IsOptimalAstcSupported(supported_features, dldi); } std::vector VKDevice::GetDeviceQueueCreateInfos() const { static const float QUEUE_PRIORITY = 1.0f; std::set unique_queue_families = {graphics_family, present_family}; std::vector queue_cis; for (u32 queue_family : unique_queue_families) queue_cis.push_back({{}, queue_family, 1, &QUEUE_PRIORITY}); return queue_cis; } std::unordered_map VKDevice::GetFormatProperties( const vk::DispatchLoaderDynamic& dldi, vk::PhysicalDevice physical) { constexpr std::array formats{vk::Format::eA8B8G8R8UnormPack32, vk::Format::eA8B8G8R8SnormPack32, vk::Format::eA8B8G8R8SrgbPack32, vk::Format::eB5G6R5UnormPack16, vk::Format::eA2B10G10R10UnormPack32, vk::Format::eR32G32B32A32Sfloat, vk::Format::eR16G16B16A16Uint, vk::Format::eR16G16Unorm, vk::Format::eR16G16Snorm, vk::Format::eR16G16Sfloat, vk::Format::eR16Unorm, vk::Format::eR8G8B8A8Srgb, vk::Format::eR8G8Unorm, vk::Format::eR8G8Snorm, vk::Format::eR8Unorm, vk::Format::eB10G11R11UfloatPack32, vk::Format::eR32Sfloat, vk::Format::eR16Sfloat, vk::Format::eR16G16B16A16Sfloat, vk::Format::eB8G8R8A8Unorm, vk::Format::eD32Sfloat, vk::Format::eD16Unorm, vk::Format::eD16UnormS8Uint, vk::Format::eD24UnormS8Uint, vk::Format::eD32SfloatS8Uint, vk::Format::eBc1RgbaUnormBlock, vk::Format::eBc2UnormBlock, vk::Format::eBc3UnormBlock, vk::Format::eBc4UnormBlock, vk::Format::eBc5UnormBlock, vk::Format::eBc5SnormBlock, vk::Format::eBc7UnormBlock, vk::Format::eBc1RgbaSrgbBlock, vk::Format::eBc3SrgbBlock, vk::Format::eBc7SrgbBlock, vk::Format::eAstc4x4UnormBlock, vk::Format::eAstc4x4SrgbBlock, vk::Format::eAstc8x8SrgbBlock, vk::Format::eAstc8x6SrgbBlock, vk::Format::eAstc5x4SrgbBlock, vk::Format::eAstc5x5UnormBlock, vk::Format::eAstc5x5SrgbBlock, vk::Format::eAstc10x8UnormBlock, vk::Format::eAstc10x8SrgbBlock}; std::unordered_map format_properties; for (const auto format : formats) { format_properties.emplace(format, physical.getFormatProperties(format, dldi)); } return format_properties; } } // namespace Vulkan