[VK] Hybrid memory allocation with robust alignment (#325)
Combines robust OOM handling with progressive size reduction and spec-compliant alignment. This hybrid approach maximizes allocation success rates through multiple recovery tries.

Reviewed-on: #325
Reviewed-by: CamilleLaVey <camillelavey99@gmail.com>
Credits to Wildcard
Co-authored-by: wildcard <wildcard@eden-emu.dev>
Co-committed-by: wildcard <wildcard@eden-emu.dev>
parent 44d658bbc5
commit 380cfcaeed
1 changed file with 119 additions and 20 deletions
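The "multiple recovery tries" in the message reduce to one core idea: halve the requested chunk until the driver accepts it or a floor is reached. A minimal standalone sketch of that strategy follows; the AllocWithFallback name and the try_alloc callback are hypothetical stand-ins for this patch's MemoryAllocator::TryAllocMemory, not part of the diff itself.

    #include <algorithm>
    #include <cstdint>
    #include <functional>

    // Halve the chunk until an allocation succeeds or the floor is hit.
    // try_alloc is a hypothetical stand-in for MemoryAllocator::TryAllocMemory.
    bool AllocWithFallback(std::uint64_t chunk_size, std::uint64_t minimum_size,
                           const std::function<bool(std::uint64_t)>& try_alloc) {
        if (try_alloc(chunk_size)) {
            return true; // try 1: original chunk size
        }
        while (chunk_size > minimum_size) {
            chunk_size = std::max(chunk_size >> 1, minimum_size); // halve, clamp to floor
            if (try_alloc(chunk_size)) {
                return true; // try 3: reduced chunk size
            }
        }
        return false; // the caller then drops DEVICE_LOCAL and finally throws
    }

    int main() {
        const std::uint64_t budget = 96ull << 20; // pretend the driver has 96 MiB left
        return AllocWithFallback(256ull << 20, 4ull << 20,
                                 [&](std::uint64_t size) { return size <= budget; })
                   ? 0
                   : 1;
    }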
@@ -143,6 +143,10 @@ public:
         return (flags & property_flags) == flags && (type_mask & shifted_memory_type) != 0;
     }
 
+    [[nodiscard]] bool IsEmpty() const noexcept {
+        return commits.empty();
+    }
+
 private:
     [[nodiscard]] static constexpr u32 ShiftType(u32 type) {
         return 1U << type;
@@ -290,36 +294,117 @@ MemoryCommit MemoryAllocator::Commit(const VkMemoryRequirements& requirements, M
     if (std::optional<MemoryCommit> commit = TryCommit(requirements, flags)) {
         return std::move(*commit);
     }
-    // Commit has failed, allocate more memory.
-    const u64 chunk_size = AllocationChunkSize(requirements.size);
-    if (!TryAllocMemory(flags, type_mask, chunk_size)) {
-        // TODO(Rodrigo): Handle out of memory situations in some way like flushing to guest memory.
-        throw vk::Exception(VK_ERROR_OUT_OF_DEVICE_MEMORY);
-    }
-    // Commit again, this time it won't fail since there's a fresh allocation above.
-    // If it does, there's a bug.
-    return TryCommit(requirements, flags).value();
+
+    // Commit has failed, try progressive fallback strategy
+    u64 chunk_size = AllocationChunkSize(requirements.size);
+    const u64 minimum_size = std::max<u64>(requirements.size, 4ULL << 20); // 4MB minimum
+
+    // try 1: Try allocating with original chunk size
+    if (TryAllocMemory(flags, type_mask, chunk_size)) {
+        return TryCommit(requirements, flags).value();
+    }
+
+    // try 2: Clean up empty allocations and try again
+    bool cleaned_up = false;
+    for (auto it = allocations.begin(); it != allocations.end();) {
+        if ((*it)->IsEmpty()) {
+            it = allocations.erase(it);
+            cleaned_up = true;
+        } else {
+            ++it;
+        }
+    }
+
+    if (cleaned_up && TryAllocMemory(flags, type_mask, chunk_size)) {
+        LOG_INFO(Render_Vulkan, "Memory allocation succeeded after cleanup");
+        return TryCommit(requirements, flags).value();
+    }
+
+    // try 3: Progressive size reduction with cleanup between attempts
+    while (chunk_size > minimum_size) {
+        chunk_size >>= 1; // Halve the chunk size
+        chunk_size = std::max(chunk_size, minimum_size);
+
+        if (TryAllocMemory(flags, type_mask, chunk_size)) {
+            LOG_WARNING(Render_Vulkan, "Memory allocation succeeded with reduced chunk size: {} MB",
+                        chunk_size >> 20);
+            return TryCommit(requirements, flags).value();
+        }
+
+        // Clean up again between size reduction attempts
+        for (auto it = allocations.begin(); it != allocations.end();) {
+            if ((*it)->IsEmpty()) {
+                it = allocations.erase(it);
+            } else {
+                ++it;
+            }
+        }
+    }
+
+    // try 4: Try minimum size allocation
+    if (chunk_size <= minimum_size && TryAllocMemory(flags, type_mask, minimum_size)) {
+        LOG_WARNING(Render_Vulkan, "Memory allocation succeeded with minimum size: {} MB",
+                    minimum_size >> 20);
+        return TryCommit(requirements, flags).value();
+    }
+
+    // try 5: Fallback to non-device-local memory if original was device-local
+    if (flags & VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) {
+        const VkMemoryPropertyFlags fallback_flags = flags & ~VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT;
+
+        // Try with original chunk size first
+        u64 fallback_chunk_size = AllocationChunkSize(requirements.size);
+        if (TryAllocMemory(fallback_flags, type_mask, fallback_chunk_size)) {
+            if (auto commit = TryCommit(requirements, fallback_flags)) {
+                LOG_WARNING(Render_Vulkan, "Falling back to non-device-local memory due to OOM");
+                return std::move(*commit);
+            }
+        }
+
+        // Progressive size reduction for non-device-local memory
+        while (fallback_chunk_size > minimum_size) {
+            fallback_chunk_size >>= 1;
+            fallback_chunk_size = std::max(fallback_chunk_size, minimum_size);
+
+            if (TryAllocMemory(fallback_flags, type_mask, fallback_chunk_size)) {
+                if (auto commit = TryCommit(requirements, fallback_flags)) {
+                    LOG_WARNING(Render_Vulkan,
+                                "Falling back to non-device-local memory with reduced size: {} MB",
+                                fallback_chunk_size >> 20);
+                    return std::move(*commit);
+                }
+            }
+        }
+    }
+
+    LOG_CRITICAL(Render_Vulkan, "Vulkan memory allocation failed - exhausted all strategies");
+    throw vk::Exception(VK_ERROR_OUT_OF_DEVICE_MEMORY);
 }
 
 bool MemoryAllocator::TryAllocMemory(VkMemoryPropertyFlags flags, u32 type_mask, u64 size) {
-    const u32 type = FindType(flags, type_mask).value();
+    const auto type_opt = FindType(flags, type_mask);
+    if (!type_opt) {
+        return false;
+    }
+
+    // Adreno requires 4KB alignment (subject to review)
+    const u64 aligned_size = (device.GetDriverID() == VK_DRIVER_ID_QUALCOMM_PROPRIETARY) ?
+                                 Common::AlignUp(size, 4096) :
+                                 size;
+
     vk::DeviceMemory memory = device.GetLogical().TryAllocateMemory({
         .sType = VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_INFO,
         .pNext = nullptr,
-        .allocationSize = size,
-        .memoryTypeIndex = type,
+        .allocationSize = aligned_size,
+        .memoryTypeIndex = *type_opt,
     });
     if (!memory) {
-        if ((flags & VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) != 0) {
-            // Try to allocate non device local memory
-            return TryAllocMemory(flags & ~VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT, type_mask, size);
-        } else {
-            // RIP
-            return false;
-        }
+        return false;
     }
+
     allocations.push_back(
-        std::make_unique<MemoryAllocation>(this, std::move(memory), flags, size, type));
+        std::make_unique<MemoryAllocation>(this, std::move(memory), flags, aligned_size, *type_opt));
     return true;
 }
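Two details of the hunk above may help reviewers. First, the empty-allocation sweeps use the manual iterator erase loop; since the codebase is already on C++20 (std::bit_ceil appears in the next hunk), std::erase_if could express the same sweep in one line. Second, the Adreno path rounds the allocation size up to 4 KiB via Common::AlignUp. A self-contained sketch of both, where Allocation and AlignUpPow2 are hypothetical stand-ins for the real MemoryAllocation and Common::AlignUp:

    #include <cstdint>
    #include <memory>
    #include <vector>

    struct Allocation { // hypothetical stand-in for MemoryAllocation
        bool IsEmpty() const { return commit_count == 0; }
        int commit_count = 0;
    };

    // Minimal power-of-two align-up, equivalent in spirit to Common::AlignUp.
    constexpr std::uint64_t AlignUpPow2(std::uint64_t value, std::uint64_t align) {
        return (value + align - 1) & ~(align - 1); // align must be a power of two
    }

    int main() {
        std::vector<std::unique_ptr<Allocation>> allocs;
        allocs.push_back(std::make_unique<Allocation>());

        // C++20 equivalent of the manual iterator erase loop in the hunk above:
        std::erase_if(allocs, [](const auto& a) { return a->IsEmpty(); });

        static_assert(AlignUpPow2(4097, 4096) == 8192); // 4 KiB rounding, as on Adreno
        return allocs.empty() ? 0 : 1;
    }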
@@ -331,11 +416,25 @@ void MemoryAllocator::ReleaseMemory(MemoryAllocation* alloc) {
 
 std::optional<MemoryCommit> MemoryAllocator::TryCommit(const VkMemoryRequirements& requirements,
                                                        VkMemoryPropertyFlags flags) {
+    // Conservative, spec-compliant alignment for suballocation
+    VkDeviceSize eff_align = requirements.alignment;
+    const auto& limits = device.GetPhysical().GetProperties().limits;
+    if ((flags & VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT) &&
+        !(flags & VK_MEMORY_PROPERTY_HOST_COHERENT_BIT)) {
+        // Non-coherent memory must be invalidated on atom boundary
+        if (limits.nonCoherentAtomSize > eff_align) eff_align = limits.nonCoherentAtomSize;
+    }
+    // Separate buffers to avoid stalls on tilers
+    if (buffer_image_granularity > eff_align) {
+        eff_align = buffer_image_granularity;
+    }
+    eff_align = std::bit_ceil(eff_align);
+
     for (auto& allocation : allocations) {
         if (!allocation->IsCompatible(flags, requirements.memoryTypeBits)) {
             continue;
         }
-        if (auto commit = allocation->Commit(requirements.size, requirements.alignment)) {
+        if (auto commit = allocation->Commit(requirements.size, eff_align)) {
             return commit;
         }
     }
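The effective alignment computed in this hunk is just the maximum of the resource's own alignment, nonCoherentAtomSize (only for host-visible, non-coherent memory), and bufferImageGranularity, rounded up to a power of two. A worked sketch with illustrative limit values (not taken from any particular GPU):

    #include <algorithm>
    #include <bit>
    #include <cstdint>

    int main() {
        // Illustrative values; the real ones come from VkPhysicalDeviceLimits
        // and from the allocator's buffer_image_granularity member.
        std::uint64_t eff_align = 16;                // requirements.alignment
        const std::uint64_t non_coherent_atom = 128; // limits.nonCoherentAtomSize
        const std::uint64_t granularity = 1024;      // bufferImageGranularity

        eff_align = std::max(eff_align, non_coherent_atom); // host-visible, non-coherent case
        eff_align = std::max(eff_align, granularity);       // keep buffers and images apart
        eff_align = std::bit_ceil(eff_align);               // round up to a power of two

        return eff_align == 1024 ? 0 : 1; // suballocation offsets round up to 1 KiB
    }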