forked from eden-emu/eden
		
	Reaper: Tune it up to be an smart GC.
This commit is contained in:
		
							parent
							
								
									a11bc4a382
								
							
						
					
					
						commit
						d8ad6aa187
					
				
					 5 changed files with 130 additions and 13 deletions
				
			
		|  | @ -65,6 +65,9 @@ class BufferCache { | ||||||
| 
 | 
 | ||||||
|     static constexpr BufferId NULL_BUFFER_ID{0}; |     static constexpr BufferId NULL_BUFFER_ID{0}; | ||||||
| 
 | 
 | ||||||
|  |     static constexpr u64 expected_memory = 512ULL * 1024ULL * 1024ULL; | ||||||
|  |     static constexpr u64 critical_memory = 1024ULL * 1024ULL * 1024ULL; | ||||||
|  | 
 | ||||||
|     using Maxwell = Tegra::Engines::Maxwell3D::Regs; |     using Maxwell = Tegra::Engines::Maxwell3D::Regs; | ||||||
| 
 | 
 | ||||||
|     using Runtime = typename P::Runtime; |     using Runtime = typename P::Runtime; | ||||||
|  | @ -327,6 +330,7 @@ private: | ||||||
| 
 | 
 | ||||||
|     typename SlotVector<Buffer>::Iterator deletion_iterator; |     typename SlotVector<Buffer>::Iterator deletion_iterator; | ||||||
|     u64 frame_tick = 0; |     u64 frame_tick = 0; | ||||||
|  |     u64 total_used_memory = 0; | ||||||
| 
 | 
 | ||||||
|     std::array<BufferId, ((1ULL << 39) >> PAGE_BITS)> page_table; |     std::array<BufferId, ((1ULL << 39) >> PAGE_BITS)> page_table; | ||||||
| }; | }; | ||||||
|  | @ -346,6 +350,10 @@ BufferCache<P>::BufferCache(VideoCore::RasterizerInterface& rasterizer_, | ||||||
| 
 | 
 | ||||||
| template <class P> | template <class P> | ||||||
| void BufferCache<P>::TickFrame() { | void BufferCache<P>::TickFrame() { | ||||||
|  |     SCOPE_EXIT({ | ||||||
|  |       ++frame_tick; | ||||||
|  |       delayed_destruction_ring.Tick(); | ||||||
|  |     }); | ||||||
|     // Calculate hits and shots and move hit bits to the right
 |     // Calculate hits and shots and move hit bits to the right
 | ||||||
|     const u32 hits = std::reduce(uniform_cache_hits.begin(), uniform_cache_hits.end()); |     const u32 hits = std::reduce(uniform_cache_hits.begin(), uniform_cache_hits.end()); | ||||||
|     const u32 shots = std::reduce(uniform_cache_shots.begin(), uniform_cache_shots.end()); |     const u32 shots = std::reduce(uniform_cache_shots.begin(), uniform_cache_shots.end()); | ||||||
|  | @ -359,8 +367,13 @@ void BufferCache<P>::TickFrame() { | ||||||
|     const bool skip_preferred = hits * 256 < shots * 251; |     const bool skip_preferred = hits * 256 < shots * 251; | ||||||
|     uniform_buffer_skip_cache_size = skip_preferred ? DEFAULT_SKIP_CACHE_SIZE : 0; |     uniform_buffer_skip_cache_size = skip_preferred ? DEFAULT_SKIP_CACHE_SIZE : 0; | ||||||
| 
 | 
 | ||||||
|     static constexpr u64 ticks_to_destroy = 120; |     const bool activate_gc = total_used_memory >= expected_memory; | ||||||
|     int num_iterations = 32; |     if (!activate_gc) { | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     const bool agressive_gc = total_used_memory >= critical_memory; | ||||||
|  |     const u64 ticks_to_destroy = agressive_gc ? 60 : 120; | ||||||
|  |     int num_iterations = agressive_gc ? 64 : 32; | ||||||
|     for (; num_iterations > 0; --num_iterations) { |     for (; num_iterations > 0; --num_iterations) { | ||||||
|         if (deletion_iterator == slot_buffers.end()) { |         if (deletion_iterator == slot_buffers.end()) { | ||||||
|             deletion_iterator = slot_buffers.begin(); |             deletion_iterator = slot_buffers.begin(); | ||||||
|  | @ -375,8 +388,6 @@ void BufferCache<P>::TickFrame() { | ||||||
|             DeleteBuffer(buffer_id); |             DeleteBuffer(buffer_id); | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|     delayed_destruction_ring.Tick(); |  | ||||||
|     ++frame_tick; |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| template <class P> | template <class P> | ||||||
|  | @ -1115,8 +1126,14 @@ template <class P> | ||||||
| template <bool insert> | template <bool insert> | ||||||
| void BufferCache<P>::ChangeRegister(BufferId buffer_id) { | void BufferCache<P>::ChangeRegister(BufferId buffer_id) { | ||||||
|     const Buffer& buffer = slot_buffers[buffer_id]; |     const Buffer& buffer = slot_buffers[buffer_id]; | ||||||
|  |     const auto size = buffer.SizeBytes(); | ||||||
|  |     if (insert) { | ||||||
|  |         total_used_memory += Common::AlignUp(size, 1024); | ||||||
|  |     } else { | ||||||
|  |         total_used_memory -= Common::AlignUp(size, 1024); | ||||||
|  |     } | ||||||
|     const VAddr cpu_addr_begin = buffer.CpuAddr(); |     const VAddr cpu_addr_begin = buffer.CpuAddr(); | ||||||
|     const VAddr cpu_addr_end = cpu_addr_begin + buffer.SizeBytes(); |     const VAddr cpu_addr_end = cpu_addr_begin + size; | ||||||
|     const u64 page_begin = cpu_addr_begin / PAGE_SIZE; |     const u64 page_begin = cpu_addr_begin / PAGE_SIZE; | ||||||
|     const u64 page_end = Common::DivCeil(cpu_addr_end, PAGE_SIZE); |     const u64 page_end = Common::DivCeil(cpu_addr_end, PAGE_SIZE); | ||||||
|     for (u64 page = page_begin; page != page_end; ++page) { |     for (u64 page = page_begin; page != page_end; ++page) { | ||||||
|  |  | ||||||
|  | @ -130,6 +130,26 @@ bool ImageBase::IsSafeDownload() const noexcept { | ||||||
|     return true; |     return true; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void ImageBase::CheckBadOverlapState() { | ||||||
|  |     if (False(flags & ImageFlagBits::BadOverlap)) { | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     if (!overlapping_images.empty()) { | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     flags &= ~ImageFlagBits::BadOverlap; | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | void ImageBase::CheckAliasState() { | ||||||
|  |     if (False(flags & ImageFlagBits::Alias)) { | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     if (!aliased_images.empty()) { | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     flags &= ~ImageFlagBits::Alias; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void AddImageAlias(ImageBase& lhs, ImageBase& rhs, ImageId lhs_id, ImageId rhs_id) { | void AddImageAlias(ImageBase& lhs, ImageBase& rhs, ImageId lhs_id, ImageId rhs_id) { | ||||||
|     static constexpr auto OPTIONS = RelaxedOptions::Size | RelaxedOptions::Format; |     static constexpr auto OPTIONS = RelaxedOptions::Size | RelaxedOptions::Format; | ||||||
|     ASSERT(lhs.info.type == rhs.info.type); |     ASSERT(lhs.info.type == rhs.info.type); | ||||||
|  |  | ||||||
|  | @ -25,6 +25,12 @@ enum class ImageFlagBits : u32 { | ||||||
|     Strong = 1 << 5,      ///< Exists in the image table, the dimensions are can be trusted
 |     Strong = 1 << 5,      ///< Exists in the image table, the dimensions are can be trusted
 | ||||||
|     Registered = 1 << 6,  ///< True when the image is registered
 |     Registered = 1 << 6,  ///< True when the image is registered
 | ||||||
|     Picked = 1 << 7,      ///< Temporary flag to mark the image as picked
 |     Picked = 1 << 7,      ///< Temporary flag to mark the image as picked
 | ||||||
|  | 
 | ||||||
|  |     // Garbage Collection Flags
 | ||||||
|  |     BadOverlap = 1 << 8,     ///< This image overlaps other but doesn't fit, has higher
 | ||||||
|  |                              ///< garbage collection priority
 | ||||||
|  |     Alias = 1 << 9,          ///< This image has aliases and has priority on garbage
 | ||||||
|  |                              ///< collection
 | ||||||
| }; | }; | ||||||
| DECLARE_ENUM_FLAG_OPERATORS(ImageFlagBits) | DECLARE_ENUM_FLAG_OPERATORS(ImageFlagBits) | ||||||
| 
 | 
 | ||||||
|  | @ -51,6 +57,9 @@ struct ImageBase { | ||||||
|         return cpu_addr < overlap_end && overlap_cpu_addr < cpu_addr_end; |         return cpu_addr < overlap_end && overlap_cpu_addr < cpu_addr_end; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     void CheckBadOverlapState(); | ||||||
|  |     void CheckAliasState(); | ||||||
|  | 
 | ||||||
|     ImageInfo info; |     ImageInfo info; | ||||||
| 
 | 
 | ||||||
|     u32 guest_size_bytes = 0; |     u32 guest_size_bytes = 0; | ||||||
|  | @ -74,6 +83,7 @@ struct ImageBase { | ||||||
|     std::vector<SubresourceBase> slice_subresources; |     std::vector<SubresourceBase> slice_subresources; | ||||||
| 
 | 
 | ||||||
|     std::vector<AliasedImage> aliased_images; |     std::vector<AliasedImage> aliased_images; | ||||||
|  |     std::vector<ImageId> overlapping_images; | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| struct ImageAllocBase { | struct ImageAllocBase { | ||||||
|  |  | ||||||
|  | @ -75,6 +75,9 @@ class TextureCache { | ||||||
|     /// Sampler ID for bugged sampler ids
 |     /// Sampler ID for bugged sampler ids
 | ||||||
|     static constexpr SamplerId NULL_SAMPLER_ID{0}; |     static constexpr SamplerId NULL_SAMPLER_ID{0}; | ||||||
| 
 | 
 | ||||||
|  |     static constexpr u64 expected_memory = 1024ULL * 1024ULL * 1024ULL; | ||||||
|  |     static constexpr u64 critical_memory = 2 * 1024ULL * 1024ULL * 1024ULL; | ||||||
|  | 
 | ||||||
|     using Runtime = typename P::Runtime; |     using Runtime = typename P::Runtime; | ||||||
|     using Image = typename P::Image; |     using Image = typename P::Image; | ||||||
|     using ImageAlloc = typename P::ImageAlloc; |     using ImageAlloc = typename P::ImageAlloc; | ||||||
|  | @ -333,6 +336,7 @@ private: | ||||||
|     std::unordered_map<u64, std::vector<ImageId>, IdentityHash<u64>> page_table; |     std::unordered_map<u64, std::vector<ImageId>, IdentityHash<u64>> page_table; | ||||||
| 
 | 
 | ||||||
|     bool has_deleted_images = false; |     bool has_deleted_images = false; | ||||||
|  |     u64 total_used_memory = 0; | ||||||
| 
 | 
 | ||||||
|     SlotVector<Image> slot_images; |     SlotVector<Image> slot_images; | ||||||
|     SlotVector<ImageView> slot_image_views; |     SlotVector<ImageView> slot_image_views; | ||||||
|  | @ -380,8 +384,10 @@ TextureCache<P>::TextureCache(Runtime& runtime_, VideoCore::RasterizerInterface& | ||||||
| 
 | 
 | ||||||
| template <class P> | template <class P> | ||||||
| void TextureCache<P>::TickFrame() { | void TextureCache<P>::TickFrame() { | ||||||
|     static constexpr u64 ticks_to_destroy = 120; |     const bool high_priority_mode = total_used_memory >= expected_memory; | ||||||
|     int num_iterations = 32; |     const bool aggressive_mode = total_used_memory >= critical_memory; | ||||||
|  |     const u64 ticks_to_destroy = high_priority_mode ? 60 : 100; | ||||||
|  |     int num_iterations = aggressive_mode ? 256 : (high_priority_mode ? 128 : 64); | ||||||
|     for (; num_iterations > 0; --num_iterations) { |     for (; num_iterations > 0; --num_iterations) { | ||||||
|         if (deletion_iterator == slot_images.end()) { |         if (deletion_iterator == slot_images.end()) { | ||||||
|             deletion_iterator = slot_images.begin(); |             deletion_iterator = slot_images.begin(); | ||||||
|  | @ -390,11 +396,42 @@ void TextureCache<P>::TickFrame() { | ||||||
|             } |             } | ||||||
|         } |         } | ||||||
|         const auto [image_id, image] = *deletion_iterator; |         const auto [image_id, image] = *deletion_iterator; | ||||||
|         if (image->frame_tick + ticks_to_destroy < frame_tick) { |         const bool is_alias = True(image->flags & ImageFlagBits::Alias); | ||||||
|             if (image->IsSafeDownload() && |         if (is_alias && image->aliased_images.size() <= 1) { | ||||||
|                 std::ranges::none_of(image->aliased_images, [&](const AliasedImage& alias) { |             ++deletion_iterator; | ||||||
|                     return slot_images[alias.id].modification_tick > image->modification_tick; |             continue; | ||||||
|                 })) { |         } | ||||||
|  |         const bool is_bad_overlap = True(image->flags & ImageFlagBits::BadOverlap); | ||||||
|  |         const bool must_download = image->IsSafeDownload(); | ||||||
|  |         const u64 ticks_needed = is_bad_overlap ? ticks_to_destroy >> 4 : ticks_to_destroy; | ||||||
|  |         const bool should_care = | ||||||
|  |             aggressive_mode || is_bad_overlap || is_alias || (high_priority_mode && !must_download); | ||||||
|  |         if (should_care && image->frame_tick + ticks_needed < frame_tick) { | ||||||
|  |             if (is_bad_overlap) { | ||||||
|  |                 const bool overlap_check = | ||||||
|  |                     std::ranges::all_of(image->overlapping_images, [&](const ImageId& overlap_id) { | ||||||
|  |                         auto& overlap = slot_images[overlap_id]; | ||||||
|  |                         return (overlap.frame_tick >= image->frame_tick) && | ||||||
|  |                                (overlap.modification_tick > image->modification_tick); | ||||||
|  |                     }); | ||||||
|  |                 if (!overlap_check) { | ||||||
|  |                     ++deletion_iterator; | ||||||
|  |                     continue; | ||||||
|  |                 } | ||||||
|  |             } | ||||||
|  |             if (!is_bad_overlap && must_download) { | ||||||
|  |                 if (is_alias) { | ||||||
|  |                     const bool alias_check = | ||||||
|  |                         std::ranges::all_of(image->aliased_images, [&](const AliasedImage& alias) { | ||||||
|  |                             auto& alias_image = slot_images[alias.id]; | ||||||
|  |                             return (alias_image.frame_tick >= image->frame_tick) && | ||||||
|  |                                    (alias_image.modification_tick > image->modification_tick); | ||||||
|  |                         }); | ||||||
|  |                     if (!alias_check) { | ||||||
|  |                         ++deletion_iterator; | ||||||
|  |                         continue; | ||||||
|  |                     } | ||||||
|  |                 } | ||||||
|                 auto map = runtime.DownloadStagingBuffer(image->unswizzled_size_bytes); |                 auto map = runtime.DownloadStagingBuffer(image->unswizzled_size_bytes); | ||||||
|                 const auto copies = FullDownloadCopies(image->info); |                 const auto copies = FullDownloadCopies(image->info); | ||||||
|                 image->DownloadMemory(map, copies); |                 image->DownloadMemory(map, copies); | ||||||
|  | @ -406,10 +443,12 @@ void TextureCache<P>::TickFrame() { | ||||||
|             } |             } | ||||||
|             UnregisterImage(image_id); |             UnregisterImage(image_id); | ||||||
|             DeleteImage(image_id); |             DeleteImage(image_id); | ||||||
|  |             if (is_bad_overlap) { | ||||||
|  |                 num_iterations++; | ||||||
|  |             } | ||||||
|         } |         } | ||||||
|         ++deletion_iterator; |         ++deletion_iterator; | ||||||
|     } |     } | ||||||
|     // Tick sentenced resources in this order to ensure they are destroyed in the right order
 |  | ||||||
|     sentenced_images.Tick(); |     sentenced_images.Tick(); | ||||||
|     sentenced_framebuffers.Tick(); |     sentenced_framebuffers.Tick(); | ||||||
|     sentenced_image_view.Tick(); |     sentenced_image_view.Tick(); | ||||||
|  | @ -989,6 +1028,7 @@ ImageId TextureCache<P>::JoinImages(const ImageInfo& info, GPUVAddr gpu_addr, VA | ||||||
|     std::vector<ImageId> overlap_ids; |     std::vector<ImageId> overlap_ids; | ||||||
|     std::vector<ImageId> left_aliased_ids; |     std::vector<ImageId> left_aliased_ids; | ||||||
|     std::vector<ImageId> right_aliased_ids; |     std::vector<ImageId> right_aliased_ids; | ||||||
|  |     std::vector<ImageId> bad_overlap_ids; | ||||||
|     ForEachImageInRegion(cpu_addr, size_bytes, [&](ImageId overlap_id, ImageBase& overlap) { |     ForEachImageInRegion(cpu_addr, size_bytes, [&](ImageId overlap_id, ImageBase& overlap) { | ||||||
|         if (info.type != overlap.info.type) { |         if (info.type != overlap.info.type) { | ||||||
|             return; |             return; | ||||||
|  | @ -1014,9 +1054,14 @@ ImageId TextureCache<P>::JoinImages(const ImageInfo& info, GPUVAddr gpu_addr, VA | ||||||
|         const ImageBase new_image_base(new_info, gpu_addr, cpu_addr); |         const ImageBase new_image_base(new_info, gpu_addr, cpu_addr); | ||||||
|         if (IsSubresource(new_info, overlap, gpu_addr, options, broken_views, native_bgr)) { |         if (IsSubresource(new_info, overlap, gpu_addr, options, broken_views, native_bgr)) { | ||||||
|             left_aliased_ids.push_back(overlap_id); |             left_aliased_ids.push_back(overlap_id); | ||||||
|  |             overlap.flags |= ImageFlagBits::Alias; | ||||||
|         } else if (IsSubresource(overlap.info, new_image_base, overlap.gpu_addr, options, |         } else if (IsSubresource(overlap.info, new_image_base, overlap.gpu_addr, options, | ||||||
|                                  broken_views, native_bgr)) { |                                  broken_views, native_bgr)) { | ||||||
|             right_aliased_ids.push_back(overlap_id); |             right_aliased_ids.push_back(overlap_id); | ||||||
|  |             overlap.flags |= ImageFlagBits::Alias; | ||||||
|  |         } else { | ||||||
|  |             bad_overlap_ids.push_back(overlap_id); | ||||||
|  |             overlap.flags |= ImageFlagBits::BadOverlap; | ||||||
|         } |         } | ||||||
|     }); |     }); | ||||||
|     const ImageId new_image_id = slot_images.insert(runtime, new_info, gpu_addr, cpu_addr); |     const ImageId new_image_id = slot_images.insert(runtime, new_info, gpu_addr, cpu_addr); | ||||||
|  | @ -1044,10 +1089,18 @@ ImageId TextureCache<P>::JoinImages(const ImageInfo& info, GPUVAddr gpu_addr, VA | ||||||
|     for (const ImageId aliased_id : right_aliased_ids) { |     for (const ImageId aliased_id : right_aliased_ids) { | ||||||
|         ImageBase& aliased = slot_images[aliased_id]; |         ImageBase& aliased = slot_images[aliased_id]; | ||||||
|         AddImageAlias(new_image_base, aliased, new_image_id, aliased_id); |         AddImageAlias(new_image_base, aliased, new_image_id, aliased_id); | ||||||
|  |         new_image.flags |= ImageFlagBits::Alias; | ||||||
|     } |     } | ||||||
|     for (const ImageId aliased_id : left_aliased_ids) { |     for (const ImageId aliased_id : left_aliased_ids) { | ||||||
|         ImageBase& aliased = slot_images[aliased_id]; |         ImageBase& aliased = slot_images[aliased_id]; | ||||||
|         AddImageAlias(aliased, new_image_base, aliased_id, new_image_id); |         AddImageAlias(aliased, new_image_base, aliased_id, new_image_id); | ||||||
|  |         new_image.flags |= ImageFlagBits::Alias; | ||||||
|  |     } | ||||||
|  |     for (const ImageId aliased_id : bad_overlap_ids) { | ||||||
|  |         ImageBase& aliased = slot_images[aliased_id]; | ||||||
|  |         aliased.overlapping_images.push_back(new_image_id); | ||||||
|  |         new_image.overlapping_images.push_back(aliased_id); | ||||||
|  |         new_image.flags |= ImageFlagBits::BadOverlap; | ||||||
|     } |     } | ||||||
|     RegisterImage(new_image_id); |     RegisterImage(new_image_id); | ||||||
|     return new_image_id; |     return new_image_id; | ||||||
|  | @ -1217,6 +1270,8 @@ void TextureCache<P>::RegisterImage(ImageId image_id) { | ||||||
|     image.flags |= ImageFlagBits::Registered; |     image.flags |= ImageFlagBits::Registered; | ||||||
|     ForEachPage(image.cpu_addr, image.guest_size_bytes, |     ForEachPage(image.cpu_addr, image.guest_size_bytes, | ||||||
|                 [this, image_id](u64 page) { page_table[page].push_back(image_id); }); |                 [this, image_id](u64 page) { page_table[page].push_back(image_id); }); | ||||||
|  |     total_used_memory += | ||||||
|  |         Common::AlignUp(std::max(image.guest_size_bytes, image.unswizzled_size_bytes), 1024); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| template <class P> | template <class P> | ||||||
|  | @ -1225,6 +1280,9 @@ void TextureCache<P>::UnregisterImage(ImageId image_id) { | ||||||
|     ASSERT_MSG(True(image.flags & ImageFlagBits::Registered), |     ASSERT_MSG(True(image.flags & ImageFlagBits::Registered), | ||||||
|                "Trying to unregister an already registered image"); |                "Trying to unregister an already registered image"); | ||||||
|     image.flags &= ~ImageFlagBits::Registered; |     image.flags &= ~ImageFlagBits::Registered; | ||||||
|  |     image.flags &= ~ImageFlagBits::BadOverlap; | ||||||
|  |     total_used_memory -= | ||||||
|  |         Common::AlignUp(std::max(image.guest_size_bytes, image.unswizzled_size_bytes), 1024); | ||||||
|     ForEachPage(image.cpu_addr, image.guest_size_bytes, [this, image_id](u64 page) { |     ForEachPage(image.cpu_addr, image.guest_size_bytes, [this, image_id](u64 page) { | ||||||
|         const auto page_it = page_table.find(page); |         const auto page_it = page_table.find(page); | ||||||
|         if (page_it == page_table.end()) { |         if (page_it == page_table.end()) { | ||||||
|  | @ -1298,9 +1356,19 @@ void TextureCache<P>::DeleteImage(ImageId image_id) { | ||||||
|             std::erase_if(other_image.aliased_images, [image_id](const AliasedImage& other_alias) { |             std::erase_if(other_image.aliased_images, [image_id](const AliasedImage& other_alias) { | ||||||
|                 return other_alias.id == image_id; |                 return other_alias.id == image_id; | ||||||
|             }); |             }); | ||||||
|  |         other_image.CheckAliasState(); | ||||||
|         ASSERT_MSG(num_removed_aliases == 1, "Invalid number of removed aliases: {}", |         ASSERT_MSG(num_removed_aliases == 1, "Invalid number of removed aliases: {}", | ||||||
|                    num_removed_aliases); |                    num_removed_aliases); | ||||||
|     } |     } | ||||||
|  |     for (const ImageId overlap_id : image.overlapping_images) { | ||||||
|  |         ImageBase& other_image = slot_images[overlap_id]; | ||||||
|  |         [[maybe_unused]] const size_t num_removed_overlaps = std::erase_if( | ||||||
|  |             other_image.overlapping_images, | ||||||
|  |             [image_id](const ImageId other_overlap_id) { return other_overlap_id == image_id; }); | ||||||
|  |         other_image.CheckBadOverlapState(); | ||||||
|  |         ASSERT_MSG(num_removed_overlaps == 1, "Invalid number of removed overlapps: {}", | ||||||
|  |                    num_removed_overlaps); | ||||||
|  |     } | ||||||
|     for (const ImageViewId image_view_id : image_view_ids) { |     for (const ImageViewId image_view_id : image_view_ids) { | ||||||
|         sentenced_image_view.Push(std::move(slot_image_views[image_view_id])); |         sentenced_image_view.Push(std::move(slot_image_views[image_view_id])); | ||||||
|         slot_image_views.erase(image_view_id); |         slot_image_views.erase(image_view_id); | ||||||
|  |  | ||||||
|  | @ -581,6 +581,8 @@ void SwizzleBlockLinearImage(Tegra::MemoryManager& gpu_memory, GPUVAddr gpu_addr | ||||||
| 
 | 
 | ||||||
|     for (s32 layer = 0; layer < info.resources.layers; ++layer) { |     for (s32 layer = 0; layer < info.resources.layers; ++layer) { | ||||||
|         const std::span<const u8> src = input.subspan(host_offset); |         const std::span<const u8> src = input.subspan(host_offset); | ||||||
|  |         gpu_memory.ReadBlockUnsafe(gpu_addr + guest_offset, dst.data(), dst.size_bytes()); | ||||||
|  | 
 | ||||||
|         SwizzleTexture(dst, src, bytes_per_block, num_tiles.width, num_tiles.height, |         SwizzleTexture(dst, src, bytes_per_block, num_tiles.width, num_tiles.height, | ||||||
|                        num_tiles.depth, block.height, block.depth); |                        num_tiles.depth, block.height, block.depth); | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 Fernando Sahmkow
						Fernando Sahmkow