forked from eden-emu/eden
		
	Merge pull request #2055 from bunnei/gpu-thread
Asynchronous GPU command processing
This commit is contained in:
		
						commit
						757fd21d98
					
				
					 26 changed files with 529 additions and 52 deletions
				
			
		|  | @ -36,7 +36,8 @@ | |||
| #include "frontend/applets/software_keyboard.h" | ||||
| #include "frontend/applets/web_browser.h" | ||||
| #include "video_core/debug_utils/debug_utils.h" | ||||
| #include "video_core/gpu.h" | ||||
| #include "video_core/gpu_asynch.h" | ||||
| #include "video_core/gpu_synch.h" | ||||
| #include "video_core/renderer_base.h" | ||||
| #include "video_core/video_core.h" | ||||
| 
 | ||||
|  | @ -129,10 +130,16 @@ struct System::Impl { | |||
|             return ResultStatus::ErrorVideoCore; | ||||
|         } | ||||
| 
 | ||||
|         gpu_core = std::make_unique<Tegra::GPU>(system, renderer->Rasterizer()); | ||||
|         is_powered_on = true; | ||||
| 
 | ||||
|         if (Settings::values.use_asynchronous_gpu_emulation) { | ||||
|             gpu_core = std::make_unique<VideoCommon::GPUAsynch>(system, *renderer); | ||||
|         } else { | ||||
|             gpu_core = std::make_unique<VideoCommon::GPUSynch>(system, *renderer); | ||||
|         } | ||||
| 
 | ||||
|         cpu_core_manager.Initialize(system); | ||||
|         is_powered_on = true; | ||||
| 
 | ||||
|         LOG_DEBUG(Core, "Initialized OK"); | ||||
| 
 | ||||
|         // Reset counters and set time origin to current frame
 | ||||
|  |  | |||
|  | @ -36,7 +36,7 @@ void nvdisp_disp0::flip(u32 buffer_handle, u32 offset, u32 format, u32 width, u3 | |||
| 
 | ||||
|     auto& instance = Core::System::GetInstance(); | ||||
|     instance.GetPerfStats().EndGameFrame(); | ||||
|     instance.Renderer().SwapBuffers(framebuffer); | ||||
|     instance.GPU().SwapBuffers(framebuffer); | ||||
| } | ||||
| 
 | ||||
| } // namespace Service::Nvidia::Devices
 | ||||
|  |  | |||
|  | @ -178,7 +178,7 @@ u32 nvhost_as_gpu::UnmapBuffer(const std::vector<u8>& input, std::vector<u8>& ou | |||
|     auto& gpu = system_instance.GPU(); | ||||
|     auto cpu_addr = gpu.MemoryManager().GpuToCpuAddress(params.offset); | ||||
|     ASSERT(cpu_addr); | ||||
|     system_instance.Renderer().Rasterizer().FlushAndInvalidateRegion(*cpu_addr, itr->second.size); | ||||
|     gpu.FlushAndInvalidateRegion(*cpu_addr, itr->second.size); | ||||
| 
 | ||||
|     params.offset = gpu.MemoryManager().UnmapBuffer(params.offset, itr->second.size); | ||||
| 
 | ||||
|  |  | |||
|  | @ -136,16 +136,6 @@ u32 nvhost_gpu::AllocateObjectContext(const std::vector<u8>& input, std::vector< | |||
|     return 0; | ||||
| } | ||||
| 
 | ||||
| static void PushGPUEntries(Tegra::CommandList&& entries) { | ||||
|     if (entries.empty()) { | ||||
|         return; | ||||
|     } | ||||
| 
 | ||||
|     auto& dma_pusher{Core::System::GetInstance().GPU().DmaPusher()}; | ||||
|     dma_pusher.Push(std::move(entries)); | ||||
|     dma_pusher.DispatchCalls(); | ||||
| } | ||||
| 
 | ||||
| u32 nvhost_gpu::SubmitGPFIFO(const std::vector<u8>& input, std::vector<u8>& output) { | ||||
|     if (input.size() < sizeof(IoctlSubmitGpfifo)) { | ||||
|         UNIMPLEMENTED(); | ||||
|  | @ -163,7 +153,7 @@ u32 nvhost_gpu::SubmitGPFIFO(const std::vector<u8>& input, std::vector<u8>& outp | |||
|     std::memcpy(entries.data(), &input[sizeof(IoctlSubmitGpfifo)], | ||||
|                 params.num_entries * sizeof(Tegra::CommandListHeader)); | ||||
| 
 | ||||
|     PushGPUEntries(std::move(entries)); | ||||
|     Core::System::GetInstance().GPU().PushGPUEntries(std::move(entries)); | ||||
| 
 | ||||
|     params.fence_out.id = 0; | ||||
|     params.fence_out.value = 0; | ||||
|  | @ -184,7 +174,7 @@ u32 nvhost_gpu::KickoffPB(const std::vector<u8>& input, std::vector<u8>& output) | |||
|     Memory::ReadBlock(params.address, entries.data(), | ||||
|                       params.num_entries * sizeof(Tegra::CommandListHeader)); | ||||
| 
 | ||||
|     PushGPUEntries(std::move(entries)); | ||||
|     Core::System::GetInstance().GPU().PushGPUEntries(std::move(entries)); | ||||
| 
 | ||||
|     params.fence_out.id = 0; | ||||
|     params.fence_out.value = 0; | ||||
|  |  | |||
|  | @ -186,7 +186,7 @@ void NVFlinger::Compose() { | |||
| 
 | ||||
|             // There was no queued buffer to draw, render previous frame
 | ||||
|             system_instance.GetPerfStats().EndGameFrame(); | ||||
|             system_instance.Renderer().SwapBuffers({}); | ||||
|             system_instance.GPU().SwapBuffers({}); | ||||
|             continue; | ||||
|         } | ||||
| 
 | ||||
|  |  | |||
|  | @ -356,16 +356,16 @@ void RasterizerFlushVirtualRegion(VAddr start, u64 size, FlushMode mode) { | |||
|         const VAddr overlap_end = std::min(end, region_end); | ||||
|         const VAddr overlap_size = overlap_end - overlap_start; | ||||
| 
 | ||||
|         auto& rasterizer = system_instance.Renderer().Rasterizer(); | ||||
|         auto& gpu = system_instance.GPU(); | ||||
|         switch (mode) { | ||||
|         case FlushMode::Flush: | ||||
|             rasterizer.FlushRegion(overlap_start, overlap_size); | ||||
|             gpu.FlushRegion(overlap_start, overlap_size); | ||||
|             break; | ||||
|         case FlushMode::Invalidate: | ||||
|             rasterizer.InvalidateRegion(overlap_start, overlap_size); | ||||
|             gpu.InvalidateRegion(overlap_start, overlap_size); | ||||
|             break; | ||||
|         case FlushMode::FlushAndInvalidate: | ||||
|             rasterizer.FlushAndInvalidateRegion(overlap_start, overlap_size); | ||||
|             gpu.FlushAndInvalidateRegion(overlap_start, overlap_size); | ||||
|             break; | ||||
|         } | ||||
|     }; | ||||
|  |  | |||
|  | @ -393,6 +393,7 @@ struct Values { | |||
|     u16 frame_limit; | ||||
|     bool use_disk_shader_cache; | ||||
|     bool use_accurate_gpu_emulation; | ||||
|     bool use_asynchronous_gpu_emulation; | ||||
| 
 | ||||
|     float bg_red; | ||||
|     float bg_green; | ||||
|  |  | |||
|  | @ -162,6 +162,8 @@ TelemetrySession::TelemetrySession() { | |||
|              Settings::values.use_disk_shader_cache); | ||||
|     AddField(Telemetry::FieldType::UserConfig, "Renderer_UseAccurateGpuEmulation", | ||||
|              Settings::values.use_accurate_gpu_emulation); | ||||
|     AddField(Telemetry::FieldType::UserConfig, "Renderer_UseAsynchronousGpuEmulation", | ||||
|              Settings::values.use_asynchronous_gpu_emulation); | ||||
|     AddField(Telemetry::FieldType::UserConfig, "System_UseDockedMode", | ||||
|              Settings::values.use_docked_mode); | ||||
| } | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 bunnei
						bunnei