| 
									
										
										
										
											2022-04-23 04:59:50 -04:00
										 |  |  | // SPDX-FileCopyrightText: Copyright 2018 yuzu Emulator Project
 | 
					
						
							|  |  |  | // SPDX-License-Identifier: GPL-2.0-or-later
 | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-09-08 21:43:02 -04:00
										 |  |  | #include <algorithm>
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-04-23 10:57:12 -05:00
										 |  |  | #include "common/alignment.h"
 | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | #include "common/assert.h"
 | 
					
						
							| 
									
										
										
										
											2021-01-22 18:31:08 -03:00
										 |  |  | #include "common/logging/log.h"
 | 
					
						
							| 
									
										
										
										
											2019-07-08 22:19:27 -07:00
										 |  |  | #include "core/core.h"
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | #include "core/device_memory.h"
 | 
					
						
							| 
									
										
										
										
											2021-02-12 17:58:31 -08:00
										 |  |  | #include "core/hle/kernel/k_page_table.h"
 | 
					
						
							| 
									
										
										
										
											2021-04-23 22:04:28 -07:00
										 |  |  | #include "core/hle/kernel/k_process.h"
 | 
					
						
							| 
									
										
										
										
											2019-02-24 00:15:35 -05:00
										 |  |  | #include "core/memory.h"
 | 
					
						
							| 
									
										
										
										
											2018-02-11 23:44:12 -05:00
										 |  |  | #include "video_core/memory_manager.h"
 | 
					
						
							| 
									
										
										
										
											2020-02-15 17:47:15 -05:00
										 |  |  | #include "video_core/rasterizer_interface.h"
 | 
					
						
							| 
									
										
										
										
											2020-10-26 23:07:36 -04:00
										 |  |  | #include "video_core/renderer_base.h"
 | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-11 23:44:12 -05:00
										 |  |  | namespace Tegra { | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-12-17 16:45:06 +01:00
										 |  |  | std::atomic<size_t> MemoryManager::unique_identifier_generator{}; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | MemoryManager::MemoryManager(Core::System& system_, u64 address_space_bits_, u64 big_page_bits_, | 
					
						
							|  |  |  |                              u64 page_bits_) | 
					
						
							|  |  |  |     : system{system_}, memory{system.Memory()}, device_memory{system.DeviceMemory()}, | 
					
						
							|  |  |  |       address_space_bits{address_space_bits_}, page_bits{page_bits_}, big_page_bits{big_page_bits_}, | 
					
						
							|  |  |  |       entries{}, big_entries{}, page_table{address_space_bits, address_space_bits + page_bits - 38, | 
					
						
							|  |  |  |                                            page_bits != big_page_bits ? page_bits : 0}, | 
					
						
							| 
									
										
										
										
											2021-12-17 16:45:06 +01:00
										 |  |  |       unique_identifier{unique_identifier_generator.fetch_add(1, std::memory_order_acq_rel)} { | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     address_space_size = 1ULL << address_space_bits; | 
					
						
							|  |  |  |     page_size = 1ULL << page_bits; | 
					
						
							|  |  |  |     page_mask = page_size - 1ULL; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     big_page_size = 1ULL << big_page_bits; | 
					
						
							|  |  |  |     big_page_mask = big_page_size - 1ULL; | 
					
						
							|  |  |  |     const u64 page_table_bits = address_space_bits - page_bits; | 
					
						
							|  |  |  |     const u64 big_page_table_bits = address_space_bits - big_page_bits; | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     const u64 page_table_size = 1ULL << page_table_bits; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     const u64 big_page_table_size = 1ULL << big_page_table_bits; | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     page_table_mask = page_table_size - 1; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     big_page_table_mask = big_page_table_size - 1; | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     big_entries.resize(big_page_table_size / 32, 0); | 
					
						
							|  |  |  |     big_page_table_cpu.resize(big_page_table_size); | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     big_page_continous.resize(big_page_table_size / continous_bits, 0); | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     entries.resize(page_table_size / 32, 0); | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2018-11-23 12:58:55 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-05-09 19:04:41 -04:00
										 |  |  | MemoryManager::~MemoryManager() = default; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | template <bool is_big_page> | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | MemoryManager::EntryType MemoryManager::GetEntry(size_t position) const { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     if constexpr (is_big_page) { | 
					
						
							|  |  |  |         position = position >> big_page_bits; | 
					
						
							|  |  |  |         const u64 entry_mask = big_entries[position / 32]; | 
					
						
							|  |  |  |         const size_t sub_index = position % 32; | 
					
						
							|  |  |  |         return static_cast<EntryType>((entry_mask >> (2 * sub_index)) & 0x03ULL); | 
					
						
							|  |  |  |     } else { | 
					
						
							|  |  |  |         position = position >> page_bits; | 
					
						
							|  |  |  |         const u64 entry_mask = entries[position / 32]; | 
					
						
							|  |  |  |         const size_t sub_index = position % 32; | 
					
						
							|  |  |  |         return static_cast<EntryType>((entry_mask >> (2 * sub_index)) & 0x03ULL); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2020-06-11 00:58:57 -03:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | template <bool is_big_page> | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | void MemoryManager::SetEntry(size_t position, MemoryManager::EntryType entry) { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     if constexpr (is_big_page) { | 
					
						
							|  |  |  |         position = position >> big_page_bits; | 
					
						
							|  |  |  |         const u64 entry_mask = big_entries[position / 32]; | 
					
						
							|  |  |  |         const size_t sub_index = position % 32; | 
					
						
							|  |  |  |         big_entries[position / 32] = | 
					
						
							|  |  |  |             (~(3ULL << sub_index * 2) & entry_mask) | (static_cast<u64>(entry) << sub_index * 2); | 
					
						
							|  |  |  |     } else { | 
					
						
							|  |  |  |         position = position >> page_bits; | 
					
						
							|  |  |  |         const u64 entry_mask = entries[position / 32]; | 
					
						
							|  |  |  |         const size_t sub_index = position % 32; | 
					
						
							|  |  |  |         entries[position / 32] = | 
					
						
							|  |  |  |             (~(3ULL << sub_index * 2) & entry_mask) | (static_cast<u64>(entry) << sub_index * 2); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  | inline bool MemoryManager::IsBigPageContinous(size_t big_page_index) const { | 
					
						
							|  |  |  |     const u64 entry_mask = big_page_continous[big_page_index / continous_bits]; | 
					
						
							|  |  |  |     const size_t sub_index = big_page_index % continous_bits; | 
					
						
							|  |  |  |     return ((entry_mask >> sub_index) & 0x1ULL) != 0; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | inline void MemoryManager::SetBigPageContinous(size_t big_page_index, bool value) { | 
					
						
							|  |  |  |     const u64 continous_mask = big_page_continous[big_page_index / continous_bits]; | 
					
						
							|  |  |  |     const size_t sub_index = big_page_index % continous_bits; | 
					
						
							|  |  |  |     big_page_continous[big_page_index / continous_bits] = | 
					
						
							|  |  |  |         (~(1ULL << sub_index) & continous_mask) | (value ? 1ULL << sub_index : 0); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | template <MemoryManager::EntryType entry_type> | 
					
						
							|  |  |  | GPUVAddr MemoryManager::PageTableOp(GPUVAddr gpu_addr, [[maybe_unused]] VAddr cpu_addr, | 
					
						
							|  |  |  |                                     size_t size) { | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |     u64 remaining_size{size}; | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     if constexpr (entry_type == EntryType::Mapped) { | 
					
						
							|  |  |  |         page_table.ReserveRange(gpu_addr, size); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |     for (u64 offset{}; offset < size; offset += page_size) { | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |         const GPUVAddr current_gpu_addr = gpu_addr + offset; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         [[maybe_unused]] const auto current_entry_type = GetEntry<false>(current_gpu_addr); | 
					
						
							|  |  |  |         SetEntry<false>(current_gpu_addr, entry_type); | 
					
						
							| 
									
										
										
										
											2022-01-01 22:03:37 +01:00
										 |  |  |         if (current_entry_type != entry_type) { | 
					
						
							|  |  |  |             rasterizer->ModifyGPUMemory(unique_identifier, gpu_addr, page_size); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |         if constexpr (entry_type == EntryType::Mapped) { | 
					
						
							|  |  |  |             const VAddr current_cpu_addr = cpu_addr + offset; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |             const auto index = PageEntryIndex<false>(current_gpu_addr); | 
					
						
							|  |  |  |             const u32 sub_value = static_cast<u32>(current_cpu_addr >> cpu_page_bits); | 
					
						
							|  |  |  |             page_table[index] = sub_value; | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |         } | 
					
						
							|  |  |  |         remaining_size -= page_size; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |     return gpu_addr; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | template <MemoryManager::EntryType entry_type> | 
					
						
							|  |  |  | GPUVAddr MemoryManager::BigPageTableOp(GPUVAddr gpu_addr, [[maybe_unused]] VAddr cpu_addr, | 
					
						
							|  |  |  |                                        size_t size) { | 
					
						
							|  |  |  |     u64 remaining_size{size}; | 
					
						
							|  |  |  |     for (u64 offset{}; offset < size; offset += big_page_size) { | 
					
						
							|  |  |  |         const GPUVAddr current_gpu_addr = gpu_addr + offset; | 
					
						
							|  |  |  |         [[maybe_unused]] const auto current_entry_type = GetEntry<true>(current_gpu_addr); | 
					
						
							|  |  |  |         SetEntry<true>(current_gpu_addr, entry_type); | 
					
						
							|  |  |  |         if (current_entry_type != entry_type) { | 
					
						
							|  |  |  |             rasterizer->ModifyGPUMemory(unique_identifier, gpu_addr, big_page_size); | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         if constexpr (entry_type == EntryType::Mapped) { | 
					
						
							|  |  |  |             const VAddr current_cpu_addr = cpu_addr + offset; | 
					
						
							|  |  |  |             const auto index = PageEntryIndex<true>(current_gpu_addr); | 
					
						
							|  |  |  |             const u32 sub_value = static_cast<u32>(current_cpu_addr >> cpu_page_bits); | 
					
						
							|  |  |  |             big_page_table_cpu[index] = sub_value; | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             const bool is_continous = ([&] { | 
					
						
							|  |  |  |                 uintptr_t base_ptr{ | 
					
						
							| 
									
										
										
										
											2022-02-19 14:18:02 +01:00
										 |  |  |                     reinterpret_cast<uintptr_t>(memory.GetPointerSilent(current_cpu_addr))}; | 
					
						
							|  |  |  |                 if (base_ptr == 0) { | 
					
						
							|  |  |  |                     return false; | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |                 for (VAddr start_cpu = current_cpu_addr + page_size; | 
					
						
							|  |  |  |                      start_cpu < current_cpu_addr + big_page_size; start_cpu += page_size) { | 
					
						
							|  |  |  |                     base_ptr += page_size; | 
					
						
							| 
									
										
										
										
											2022-02-19 14:18:02 +01:00
										 |  |  |                     auto next_ptr = reinterpret_cast<uintptr_t>(memory.GetPointerSilent(start_cpu)); | 
					
						
							|  |  |  |                     if (next_ptr == 0 || base_ptr != next_ptr) { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |                         return false; | 
					
						
							|  |  |  |                     } | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |                 return true; | 
					
						
							|  |  |  |             })(); | 
					
						
							|  |  |  |             SetBigPageContinous(index, is_continous); | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         } | 
					
						
							|  |  |  |         remaining_size -= big_page_size; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     return gpu_addr; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  | void MemoryManager::BindRasterizer(VideoCore::RasterizerInterface* rasterizer_) { | 
					
						
							|  |  |  |     rasterizer = rasterizer_; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | GPUVAddr MemoryManager::Map(GPUVAddr gpu_addr, VAddr cpu_addr, std::size_t size, | 
					
						
							|  |  |  |                             bool is_big_pages) { | 
					
						
							|  |  |  |     if (is_big_pages) [[likely]] { | 
					
						
							|  |  |  |         return BigPageTableOp<EntryType::Mapped>(gpu_addr, cpu_addr, size); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     return PageTableOp<EntryType::Mapped>(gpu_addr, cpu_addr, size); | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | } | 
					
						
							| 
									
										
										
										
											2019-03-20 22:58:49 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | GPUVAddr MemoryManager::MapSparse(GPUVAddr gpu_addr, std::size_t size, bool is_big_pages) { | 
					
						
							|  |  |  |     if (is_big_pages) [[likely]] { | 
					
						
							|  |  |  |         return BigPageTableOp<EntryType::Reserved>(gpu_addr, 0, size); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2021-11-14 20:55:52 +01:00
										 |  |  |     return PageTableOp<EntryType::Reserved>(gpu_addr, 0, size); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | void MemoryManager::Unmap(GPUVAddr gpu_addr, std::size_t size) { | 
					
						
							| 
									
										
										
										
											2021-01-22 18:31:08 -03:00
										 |  |  |     if (size == 0) { | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |     const auto submapped_ranges = GetSubmappedRange(gpu_addr, size); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-12-31 02:07:59 -05:00
										 |  |  |     for (const auto& [map_addr, map_size] : submapped_ranges) { | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         // Flush and invalidate through the GPU interface, to be asynchronous if possible.
 | 
					
						
							| 
									
										
										
										
											2021-12-31 02:07:59 -05:00
										 |  |  |         const std::optional<VAddr> cpu_addr = GpuToCpuAddress(map_addr); | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         ASSERT(cpu_addr); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-12-31 02:07:59 -05:00
										 |  |  |         rasterizer->UnmapMemory(*cpu_addr, map_size); | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     BigPageTableOp<EntryType::Free>(gpu_addr, 0, size); | 
					
						
							| 
									
										
										
										
											2021-11-11 21:24:40 +01:00
										 |  |  |     PageTableOp<EntryType::Free>(gpu_addr, 0, size); | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | } | 
					
						
							| 
									
										
										
										
											2018-07-24 11:19:51 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | std::optional<VAddr> MemoryManager::GpuToCpuAddress(GPUVAddr gpu_addr) const { | 
					
						
							| 
									
										
										
										
											2022-04-13 16:20:34 +02:00
										 |  |  |     if (!IsWithinGPUAddressRange(gpu_addr)) [[unlikely]] { | 
					
						
							| 
									
										
										
										
											2022-04-02 22:38:58 +02:00
										 |  |  |         return std::nullopt; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     if (GetEntry<true>(gpu_addr) != EntryType::Mapped) [[unlikely]] { | 
					
						
							|  |  |  |         if (GetEntry<false>(gpu_addr) != EntryType::Mapped) { | 
					
						
							| 
									
										
										
										
											2020-09-22 17:31:53 -04:00
										 |  |  |             return std::nullopt; | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2018-10-31 22:20:37 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         const VAddr cpu_addr_base = static_cast<VAddr>(page_table[PageEntryIndex<false>(gpu_addr)]) | 
					
						
							|  |  |  |                                     << cpu_page_bits; | 
					
						
							|  |  |  |         return cpu_addr_base + (gpu_addr & page_mask); | 
					
						
							| 
									
										
										
										
											2019-03-09 14:06:51 -05:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     const VAddr cpu_addr_base = | 
					
						
							|  |  |  |         static_cast<VAddr>(big_page_table_cpu[PageEntryIndex<true>(gpu_addr)]) << cpu_page_bits; | 
					
						
							|  |  |  |     return cpu_addr_base + (gpu_addr & big_page_mask); | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  | std::optional<VAddr> MemoryManager::GpuToCpuAddress(GPUVAddr addr, std::size_t size) const { | 
					
						
							|  |  |  |     size_t page_index{addr >> page_bits}; | 
					
						
							|  |  |  |     const size_t page_last{(addr + size + page_size - 1) >> page_bits}; | 
					
						
							|  |  |  |     while (page_index < page_last) { | 
					
						
							|  |  |  |         const auto page_addr{GpuToCpuAddress(page_index << page_bits)}; | 
					
						
							| 
									
										
										
										
											2022-01-01 22:03:37 +01:00
										 |  |  |         if (page_addr) { | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |             return page_addr; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         ++page_index; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     return std::nullopt; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | template <typename T> | 
					
						
							|  |  |  | T MemoryManager::Read(GPUVAddr addr) const { | 
					
						
							|  |  |  |     if (auto page_pointer{GetPointer(addr)}; page_pointer) { | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |         // NOTE: Avoid adding any extra logic to this fast-path block
 | 
					
						
							|  |  |  |         T value; | 
					
						
							| 
									
										
										
										
											2020-04-08 12:08:06 -04:00
										 |  |  |         std::memcpy(&value, page_pointer, sizeof(T)); | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |         return value; | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-06-07 17:02:29 -04:00
										 |  |  |     ASSERT(false); | 
					
						
							| 
									
										
										
										
											2020-04-08 22:51:31 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |     return {}; | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | template <typename T> | 
					
						
							| 
									
										
										
										
											2019-03-09 14:06:51 -05:00
										 |  |  | void MemoryManager::Write(GPUVAddr addr, T data) { | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |     if (auto page_pointer{GetPointer(addr)}; page_pointer) { | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |         // NOTE: Avoid adding any extra logic to this fast-path block
 | 
					
						
							| 
									
										
										
										
											2020-04-08 12:08:06 -04:00
										 |  |  |         std::memcpy(page_pointer, &data, sizeof(T)); | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2018-05-20 14:21:06 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-06-07 17:02:29 -04:00
										 |  |  |     ASSERT(false); | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | } | 
					
						
							| 
									
										
										
										
											2018-07-24 11:19:51 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-04-05 20:30:46 -04:00
										 |  |  | template u8 MemoryManager::Read<u8>(GPUVAddr addr) const; | 
					
						
							|  |  |  | template u16 MemoryManager::Read<u16>(GPUVAddr addr) const; | 
					
						
							|  |  |  | template u32 MemoryManager::Read<u32>(GPUVAddr addr) const; | 
					
						
							|  |  |  | template u64 MemoryManager::Read<u64>(GPUVAddr addr) const; | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | template void MemoryManager::Write<u8>(GPUVAddr addr, u8 data); | 
					
						
							|  |  |  | template void MemoryManager::Write<u16>(GPUVAddr addr, u16 data); | 
					
						
							|  |  |  | template void MemoryManager::Write<u32>(GPUVAddr addr, u32 data); | 
					
						
							|  |  |  | template void MemoryManager::Write<u64>(GPUVAddr addr, u64 data); | 
					
						
							| 
									
										
										
										
											2018-10-31 22:20:37 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | u8* MemoryManager::GetPointer(GPUVAddr gpu_addr) { | 
					
						
							|  |  |  |     const auto address{GpuToCpuAddress(gpu_addr)}; | 
					
						
							|  |  |  |     if (!address) { | 
					
						
							|  |  |  |         return {}; | 
					
						
							| 
									
										
										
										
											2019-04-05 20:25:25 -04:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     return memory.GetPointer(*address); | 
					
						
							| 
									
										
										
										
											2019-04-05 20:25:25 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | const u8* MemoryManager::GetPointer(GPUVAddr gpu_addr) const { | 
					
						
							|  |  |  |     const auto address{GpuToCpuAddress(gpu_addr)}; | 
					
						
							|  |  |  |     if (!address) { | 
					
						
							|  |  |  |         return {}; | 
					
						
							| 
									
										
										
										
											2018-05-20 14:21:06 -05:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     return memory.GetPointer(*address); | 
					
						
							| 
									
										
										
										
											2019-04-16 15:45:24 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  | #ifdef _MSC_VER // no need for gcc / clang but msvc's compiler is more conservative with inlining.
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | #pragma inline_recursion(on)
 | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | template <bool is_big_pages, typename FuncMapped, typename FuncReserved, typename FuncUnmapped> | 
					
						
							|  |  |  | inline void MemoryManager::MemoryOperation(GPUVAddr gpu_src_addr, std::size_t size, | 
					
						
							|  |  |  |                                            FuncMapped&& func_mapped, FuncReserved&& func_reserved, | 
					
						
							|  |  |  |                                            FuncUnmapped&& func_unmapped) const { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     static constexpr bool BOOL_BREAK_MAPPED = std::is_same_v<FuncMapped, bool>; | 
					
						
							|  |  |  |     static constexpr bool BOOL_BREAK_RESERVED = std::is_same_v<FuncReserved, bool>; | 
					
						
							|  |  |  |     static constexpr bool BOOL_BREAK_UNMAPPED = std::is_same_v<FuncUnmapped, bool>; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     u64 used_page_size; | 
					
						
							|  |  |  |     u64 used_page_mask; | 
					
						
							|  |  |  |     u64 used_page_bits; | 
					
						
							|  |  |  |     if constexpr (is_big_pages) { | 
					
						
							|  |  |  |         used_page_size = big_page_size; | 
					
						
							|  |  |  |         used_page_mask = big_page_mask; | 
					
						
							|  |  |  |         used_page_bits = big_page_bits; | 
					
						
							|  |  |  |     } else { | 
					
						
							|  |  |  |         used_page_size = page_size; | 
					
						
							|  |  |  |         used_page_mask = page_mask; | 
					
						
							|  |  |  |         used_page_bits = page_bits; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  |     std::size_t remaining_size{size}; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     std::size_t page_index{gpu_src_addr >> used_page_bits}; | 
					
						
							|  |  |  |     std::size_t page_offset{gpu_src_addr & used_page_mask}; | 
					
						
							|  |  |  |     GPUVAddr current_address = gpu_src_addr; | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  |     while (remaining_size > 0) { | 
					
						
							|  |  |  |         const std::size_t copy_amount{ | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |             std::min(static_cast<std::size_t>(used_page_size) - page_offset, remaining_size)}; | 
					
						
							|  |  |  |         auto entry = GetEntry<is_big_pages>(current_address); | 
					
						
							|  |  |  |         if (entry == EntryType::Mapped) [[likely]] { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             if constexpr (BOOL_BREAK_MAPPED) { | 
					
						
							|  |  |  |                 if (func_mapped(page_index, page_offset, copy_amount)) { | 
					
						
							|  |  |  |                     return; | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } else { | 
					
						
							|  |  |  |                 func_mapped(page_index, page_offset, copy_amount); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         } else if (entry == EntryType::Reserved) { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             if constexpr (BOOL_BREAK_RESERVED) { | 
					
						
							|  |  |  |                 if (func_reserved(page_index, page_offset, copy_amount)) { | 
					
						
							|  |  |  |                     return; | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } else { | 
					
						
							|  |  |  |                 func_reserved(page_index, page_offset, copy_amount); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         } else [[unlikely]] { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             if constexpr (BOOL_BREAK_UNMAPPED) { | 
					
						
							|  |  |  |                 if (func_unmapped(page_index, page_offset, copy_amount)) { | 
					
						
							|  |  |  |                     return; | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } else { | 
					
						
							|  |  |  |                 func_unmapped(page_index, page_offset, copy_amount); | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  |         page_index++; | 
					
						
							|  |  |  |         page_offset = 0; | 
					
						
							|  |  |  |         remaining_size -= copy_amount; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         current_address += copy_amount; | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | } | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | template <bool is_safe> | 
					
						
							|  |  |  | void MemoryManager::ReadBlockImpl(GPUVAddr gpu_src_addr, void* dest_buffer, | 
					
						
							|  |  |  |                                   std::size_t size) const { | 
					
						
							|  |  |  |     auto set_to_zero = [&]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                            [[maybe_unused]] std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         std::memset(dest_buffer, 0, copy_amount); | 
					
						
							|  |  |  |         dest_buffer = static_cast<u8*>(dest_buffer) + copy_amount; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_normal = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if constexpr (is_safe) { | 
					
						
							|  |  |  |             rasterizer->FlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |         u8* physical = memory.GetPointer(cpu_addr_base); | 
					
						
							|  |  |  |         std::memcpy(dest_buffer, physical, copy_amount); | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         dest_buffer = static_cast<u8*>(dest_buffer) + copy_amount; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_big = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if constexpr (is_safe) { | 
					
						
							|  |  |  |             rasterizer->FlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-19 14:18:02 +01:00
										 |  |  |         if (!IsBigPageContinous(page_index)) [[unlikely]] { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             memory.ReadBlockUnsafe(cpu_addr_base, dest_buffer, copy_amount); | 
					
						
							|  |  |  |         } else { | 
					
						
							|  |  |  |             u8* physical = memory.GetPointer(cpu_addr_base); | 
					
						
							|  |  |  |             std::memcpy(dest_buffer, physical, copy_amount); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         dest_buffer = static_cast<u8*>(dest_buffer) + copy_amount; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto read_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                 std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, mapped_normal, set_to_zero, set_to_zero); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_src_addr, size, mapped_big, set_to_zero, read_short_pages); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-12-30 23:36:00 -05:00
										 |  |  | void MemoryManager::ReadBlock(GPUVAddr gpu_src_addr, void* dest_buffer, std::size_t size) const { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     ReadBlockImpl<true>(gpu_src_addr, dest_buffer, size); | 
					
						
							| 
									
										
										
										
											2021-12-30 23:36:00 -05:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-06-19 22:02:56 -04:00
										 |  |  | void MemoryManager::ReadBlockUnsafe(GPUVAddr gpu_src_addr, void* dest_buffer, | 
					
						
							| 
									
										
										
										
											2019-04-16 10:11:35 -04:00
										 |  |  |                                     const std::size_t size) const { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     ReadBlockImpl<false>(gpu_src_addr, dest_buffer, size); | 
					
						
							| 
									
										
										
										
											2019-04-15 23:01:35 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  | template <bool is_safe> | 
					
						
							|  |  |  | void MemoryManager::WriteBlockImpl(GPUVAddr gpu_dest_addr, const void* src_buffer, | 
					
						
							|  |  |  |                                    std::size_t size) { | 
					
						
							|  |  |  |     auto just_advance = [&]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                             [[maybe_unused]] std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         src_buffer = static_cast<const u8*>(src_buffer) + copy_amount; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_normal = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if constexpr (is_safe) { | 
					
						
							|  |  |  |             rasterizer->InvalidateRegion(cpu_addr_base, copy_amount); | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |         u8* physical = memory.GetPointer(cpu_addr_base); | 
					
						
							|  |  |  |         std::memcpy(physical, src_buffer, copy_amount); | 
					
						
							| 
									
										
										
										
											2019-03-28 21:58:28 -04:00
										 |  |  |         src_buffer = static_cast<const u8*>(src_buffer) + copy_amount; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_big = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if constexpr (is_safe) { | 
					
						
							|  |  |  |             rasterizer->InvalidateRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-19 14:18:02 +01:00
										 |  |  |         if (!IsBigPageContinous(page_index)) [[unlikely]] { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |             memory.WriteBlockUnsafe(cpu_addr_base, src_buffer, copy_amount); | 
					
						
							|  |  |  |         } else { | 
					
						
							|  |  |  |             u8* physical = memory.GetPointer(cpu_addr_base); | 
					
						
							|  |  |  |             std::memcpy(physical, src_buffer, copy_amount); | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         src_buffer = static_cast<const u8*>(src_buffer) + copy_amount; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto write_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, mapped_normal, just_advance, just_advance); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_dest_addr, size, mapped_big, just_advance, write_short_pages); | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-12-30 23:36:00 -05:00
										 |  |  | void MemoryManager::WriteBlock(GPUVAddr gpu_dest_addr, const void* src_buffer, std::size_t size) { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     WriteBlockImpl<true>(gpu_dest_addr, src_buffer, size); | 
					
						
							| 
									
										
										
										
											2021-12-30 23:36:00 -05:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-06-19 22:02:56 -04:00
										 |  |  | void MemoryManager::WriteBlockUnsafe(GPUVAddr gpu_dest_addr, const void* src_buffer, | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  |                                      std::size_t size) { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     WriteBlockImpl<false>(gpu_dest_addr, src_buffer, size); | 
					
						
							| 
									
										
										
										
											2019-04-15 23:01:35 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-21 19:08:15 -03:00
										 |  |  | void MemoryManager::FlushRegion(GPUVAddr gpu_addr, size_t size) const { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     auto do_nothing = [&]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t copy_amount) {}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto mapped_normal = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         rasterizer->FlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_big = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         rasterizer->FlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto flush_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, mapped_normal, do_nothing, do_nothing); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, mapped_big, do_nothing, flush_short_pages); | 
					
						
							| 
									
										
										
										
											2021-01-21 19:08:15 -03:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-08-14 02:36:36 -07:00
										 |  |  | bool MemoryManager::IsMemoryDirty(GPUVAddr gpu_addr, size_t size) const { | 
					
						
							|  |  |  |     bool result = false; | 
					
						
							|  |  |  |     auto do_nothing = [&]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t copy_amount) { return false; }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto mapped_normal = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         result |= rasterizer->MustFlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |         return result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_big = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         result |= rasterizer->MustFlushRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |         return result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto check_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, mapped_normal, do_nothing, do_nothing); | 
					
						
							|  |  |  |         return result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, mapped_big, do_nothing, check_short_pages); | 
					
						
							|  |  |  |     return result; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | size_t MemoryManager::MaxContinousRange(GPUVAddr gpu_addr, size_t size) const { | 
					
						
							|  |  |  |     std::optional<VAddr> old_page_addr{}; | 
					
						
							|  |  |  |     size_t range_so_far = 0; | 
					
						
							|  |  |  |     bool result{false}; | 
					
						
							|  |  |  |     auto fail = [&]([[maybe_unused]] std::size_t page_index, [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                     std::size_t copy_amount) { | 
					
						
							|  |  |  |         result = true; | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto short_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr && *old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |             result = true; | 
					
						
							|  |  |  |             return true; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         range_so_far += copy_amount; | 
					
						
							|  |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto big_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr && *old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |             return true; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         range_so_far += copy_amount; | 
					
						
							|  |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto check_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, short_check, fail, fail); | 
					
						
							|  |  |  |         return result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, big_check, fail, check_short_pages); | 
					
						
							|  |  |  |     return range_so_far; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void MemoryManager::InvalidateRegion(GPUVAddr gpu_addr, size_t size) const { | 
					
						
							|  |  |  |     auto do_nothing = [&]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                           [[maybe_unused]] std::size_t copy_amount) {}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     auto mapped_normal = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         rasterizer->InvalidateRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto mapped_big = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         rasterizer->InvalidateRegion(cpu_addr_base, copy_amount); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto invalidate_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                       std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, mapped_normal, do_nothing, do_nothing); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, mapped_big, do_nothing, invalidate_short_pages); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-26 00:16:21 -04:00
										 |  |  | void MemoryManager::CopyBlock(GPUVAddr gpu_dest_addr, GPUVAddr gpu_src_addr, std::size_t size) { | 
					
						
							| 
									
										
										
										
											2020-04-08 12:08:06 -04:00
										 |  |  |     std::vector<u8> tmp_buffer(size); | 
					
						
							| 
									
										
										
										
											2020-06-19 22:02:56 -04:00
										 |  |  |     ReadBlock(gpu_src_addr, tmp_buffer.data(), size); | 
					
						
							| 
									
										
										
										
											2021-01-21 19:08:43 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  |     // The output block must be flushed in case it has data modified from the GPU.
 | 
					
						
							|  |  |  |     // Fixes NPC geometry in Zombie Panic in Wonderland DX
 | 
					
						
							|  |  |  |     FlushRegion(gpu_dest_addr, size); | 
					
						
							| 
									
										
										
										
											2020-06-19 22:02:56 -04:00
										 |  |  |     WriteBlock(gpu_dest_addr, tmp_buffer.data(), size); | 
					
						
							| 
									
										
										
										
											2018-10-12 21:52:16 -04:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-24 00:37:54 -04:00
										 |  |  | bool MemoryManager::IsGranularRange(GPUVAddr gpu_addr, std::size_t size) const { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     if (GetEntry<true>(gpu_addr) == EntryType::Mapped) [[likely]] { | 
					
						
							|  |  |  |         size_t page_index = gpu_addr >> big_page_bits; | 
					
						
							|  |  |  |         if (IsBigPageContinous(page_index)) [[likely]] { | 
					
						
							|  |  |  |             const std::size_t page{(page_index & big_page_mask) + size}; | 
					
						
							|  |  |  |             return page <= big_page_size; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         const std::size_t page{(gpu_addr & Core::Memory::YUZU_PAGEMASK) + size}; | 
					
						
							|  |  |  |         return page <= Core::Memory::YUZU_PAGESIZE; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     if (GetEntry<false>(gpu_addr) != EntryType::Mapped) { | 
					
						
							| 
									
										
										
										
											2020-08-24 00:37:54 -04:00
										 |  |  |         return false; | 
					
						
							| 
									
										
										
										
											2019-03-03 23:54:16 -05:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     const std::size_t page{(gpu_addr & Core::Memory::YUZU_PAGEMASK) + size}; | 
					
						
							| 
									
										
										
										
											2022-08-18 16:28:55 -07:00
										 |  |  |     return page <= Core::Memory::YUZU_PAGESIZE; | 
					
						
							| 
									
										
										
										
											2018-02-07 21:54:35 -05:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  | bool MemoryManager::IsContinousRange(GPUVAddr gpu_addr, std::size_t size) const { | 
					
						
							|  |  |  |     std::optional<VAddr> old_page_addr{}; | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     bool result{true}; | 
					
						
							|  |  |  |     auto fail = [&]([[maybe_unused]] std::size_t page_index, [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                     std::size_t copy_amount) { | 
					
						
							|  |  |  |         result = false; | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto short_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr && *old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |             result = false; | 
					
						
							|  |  |  |             return true; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto big_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr && *old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |             result = false; | 
					
						
							|  |  |  |             return true; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         return false; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto check_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, short_check, fail, fail); | 
					
						
							|  |  |  |         return !result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, big_check, fail, check_short_pages); | 
					
						
							|  |  |  |     return result; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool MemoryManager::IsFullyMappedRange(GPUVAddr gpu_addr, std::size_t size) const { | 
					
						
							| 
									
										
										
										
											2022-02-06 18:51:07 +01:00
										 |  |  |     bool result{true}; | 
					
						
							|  |  |  |     auto fail = [&]([[maybe_unused]] std::size_t page_index, [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                     [[maybe_unused]] std::size_t copy_amount) { | 
					
						
							|  |  |  |         result = false; | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto pass = [&]([[maybe_unused]] std::size_t page_index, [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                     [[maybe_unused]] std::size_t copy_amount) { return false; }; | 
					
						
							|  |  |  |     auto check_short_pages = [&](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, pass, pass, fail); | 
					
						
							|  |  |  |         return !result; | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, pass, fail, check_short_pages); | 
					
						
							|  |  |  |     return result; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | std::vector<std::pair<GPUVAddr, std::size_t>> MemoryManager::GetSubmappedRange( | 
					
						
							|  |  |  |     GPUVAddr gpu_addr, std::size_t size) const { | 
					
						
							|  |  |  |     std::vector<std::pair<GPUVAddr, std::size_t>> result{}; | 
					
						
							|  |  |  |     std::optional<std::pair<GPUVAddr, std::size_t>> last_segment{}; | 
					
						
							|  |  |  |     std::optional<VAddr> old_page_addr{}; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     const auto split = [&last_segment, &result]([[maybe_unused]] std::size_t page_index, | 
					
						
							|  |  |  |                                                 [[maybe_unused]] std::size_t offset, | 
					
						
							|  |  |  |                                                 [[maybe_unused]] std::size_t copy_amount) { | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         if (last_segment) { | 
					
						
							|  |  |  |             result.push_back(*last_segment); | 
					
						
							|  |  |  |             last_segment = std::nullopt; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     }; | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     const auto extend_size_big = [this, &split, &old_page_addr, | 
					
						
							|  |  |  |                                   &last_segment](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                                  std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(big_page_table_cpu[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr) { | 
					
						
							|  |  |  |             if (*old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |                 split(0, 0, 0); | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |             } | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |         } | 
					
						
							|  |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         if (!last_segment) { | 
					
						
							|  |  |  |             const GPUVAddr new_base_addr = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |             last_segment = {new_base_addr, copy_amount}; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         } else { | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |             last_segment->second += copy_amount; | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-05 18:15:26 +01:00
										 |  |  |     }; | 
					
						
							|  |  |  |     const auto extend_size_short = [this, &split, &old_page_addr, | 
					
						
							|  |  |  |                                     &last_segment](std::size_t page_index, std::size_t offset, | 
					
						
							|  |  |  |                                                    std::size_t copy_amount) { | 
					
						
							|  |  |  |         const VAddr cpu_addr_base = | 
					
						
							|  |  |  |             (static_cast<VAddr>(page_table[page_index]) << cpu_page_bits) + offset; | 
					
						
							|  |  |  |         if (old_page_addr) { | 
					
						
							|  |  |  |             if (*old_page_addr != cpu_addr_base) { | 
					
						
							|  |  |  |                 split(0, 0, 0); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         old_page_addr = {cpu_addr_base + copy_amount}; | 
					
						
							|  |  |  |         if (!last_segment) { | 
					
						
							|  |  |  |             const GPUVAddr new_base_addr = (page_index << page_bits) + offset; | 
					
						
							|  |  |  |             last_segment = {new_base_addr, copy_amount}; | 
					
						
							|  |  |  |         } else { | 
					
						
							|  |  |  |             last_segment->second += copy_amount; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     auto do_short_pages = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) { | 
					
						
							|  |  |  |         GPUVAddr base = (page_index << big_page_bits) + offset; | 
					
						
							|  |  |  |         MemoryOperation<false>(base, copy_amount, extend_size_short, split, split); | 
					
						
							|  |  |  |     }; | 
					
						
							|  |  |  |     MemoryOperation<true>(gpu_addr, size, extend_size_big, split, do_short_pages); | 
					
						
							|  |  |  |     split(0, 0, 0); | 
					
						
							| 
									
										
										
										
											2021-06-13 03:34:06 +02:00
										 |  |  |     return result; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-11 23:44:12 -05:00
										 |  |  | } // namespace Tegra
 |