forked from eden-emu/eden
		
	Merge pull request #3742 from FernandoS27/command-list
Optimize GPU Command Lists and Introduce Fast GPU Time Option
This commit is contained in:
		
						commit
						d952b2e1da
					
				
					 20 changed files with 214 additions and 14 deletions
				
			
		|  | @ -446,6 +446,7 @@ struct Values { | ||||||
|     bool use_asynchronous_gpu_emulation; |     bool use_asynchronous_gpu_emulation; | ||||||
|     bool use_vsync; |     bool use_vsync; | ||||||
|     bool force_30fps_mode; |     bool force_30fps_mode; | ||||||
|  |     bool use_fast_gpu_time; | ||||||
| 
 | 
 | ||||||
|     float bg_red; |     float bg_red; | ||||||
|     float bg_green; |     float bg_green; | ||||||
|  |  | ||||||
|  | @ -71,16 +71,22 @@ bool DmaPusher::Step() { | ||||||
|     gpu.MemoryManager().ReadBlockUnsafe(dma_get, command_headers.data(), |     gpu.MemoryManager().ReadBlockUnsafe(dma_get, command_headers.data(), | ||||||
|                                         command_list_header.size * sizeof(u32)); |                                         command_list_header.size * sizeof(u32)); | ||||||
| 
 | 
 | ||||||
|     for (const CommandHeader& command_header : command_headers) { |     for (std::size_t index = 0; index < command_headers.size();) { | ||||||
|  |         const CommandHeader& command_header = command_headers[index]; | ||||||
| 
 | 
 | ||||||
|         // now, see if we're in the middle of a command
 |         if (dma_state.method_count) { | ||||||
|         if (dma_state.length_pending) { |  | ||||||
|             // Second word of long non-inc methods command - method count
 |  | ||||||
|             dma_state.length_pending = 0; |  | ||||||
|             dma_state.method_count = command_header.method_count_; |  | ||||||
|         } else if (dma_state.method_count) { |  | ||||||
|             // Data word of methods command
 |             // Data word of methods command
 | ||||||
|             CallMethod(command_header.argument); |             if (dma_state.non_incrementing) { | ||||||
|  |                 const u32 max_write = static_cast<u32>( | ||||||
|  |                     std::min<std::size_t>(index + dma_state.method_count, command_headers.size()) - | ||||||
|  |                     index); | ||||||
|  |                 CallMultiMethod(&command_header.argument, max_write); | ||||||
|  |                 dma_state.method_count -= max_write; | ||||||
|  |                 index += max_write; | ||||||
|  |                 continue; | ||||||
|  |             } else { | ||||||
|  |                 CallMethod(command_header.argument); | ||||||
|  |             } | ||||||
| 
 | 
 | ||||||
|             if (!dma_state.non_incrementing) { |             if (!dma_state.non_incrementing) { | ||||||
|                 dma_state.method++; |                 dma_state.method++; | ||||||
|  | @ -120,6 +126,7 @@ bool DmaPusher::Step() { | ||||||
|                 break; |                 break; | ||||||
|             } |             } | ||||||
|         } |         } | ||||||
|  |         index++; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     if (!non_main) { |     if (!non_main) { | ||||||
|  | @ -140,4 +147,9 @@ void DmaPusher::CallMethod(u32 argument) const { | ||||||
|     gpu.CallMethod({dma_state.method, argument, dma_state.subchannel, dma_state.method_count}); |     gpu.CallMethod({dma_state.method, argument, dma_state.subchannel, dma_state.method_count}); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void DmaPusher::CallMultiMethod(const u32* base_start, u32 num_methods) const { | ||||||
|  |     gpu.CallMultiMethod(dma_state.method, dma_state.subchannel, base_start, num_methods, | ||||||
|  |                         dma_state.method_count); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| } // namespace Tegra
 | } // namespace Tegra
 | ||||||
|  |  | ||||||
|  | @ -75,6 +75,7 @@ private: | ||||||
|     void SetState(const CommandHeader& command_header); |     void SetState(const CommandHeader& command_header); | ||||||
| 
 | 
 | ||||||
|     void CallMethod(u32 argument) const; |     void CallMethod(u32 argument) const; | ||||||
|  |     void CallMultiMethod(const u32* base_start, u32 num_methods) const; | ||||||
| 
 | 
 | ||||||
|     std::vector<CommandHeader> command_headers; ///< Buffer for list of commands fetched at once
 |     std::vector<CommandHeader> command_headers; ///< Buffer for list of commands fetched at once
 | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -28,6 +28,12 @@ void Fermi2D::CallMethod(const GPU::MethodCall& method_call) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void Fermi2D::CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending) { | ||||||
|  |     for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |         CallMethod({method, base_start[i], 0, methods_pending - static_cast<u32>(i)}); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| static std::pair<u32, u32> DelimitLine(u32 src_1, u32 src_2, u32 dst_1, u32 dst_2, u32 src_line) { | static std::pair<u32, u32> DelimitLine(u32 src_1, u32 src_2, u32 dst_1, u32 dst_2, u32 src_line) { | ||||||
|     const u32 line_a = src_2 - src_1; |     const u32 line_a = src_2 - src_1; | ||||||
|     const u32 line_b = dst_2 - dst_1; |     const u32 line_b = dst_2 - dst_1; | ||||||
|  |  | ||||||
|  | @ -39,6 +39,9 @@ public: | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Write multiple values to the register identified by method.
 | ||||||
|  |     void CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending); | ||||||
|  | 
 | ||||||
|     enum class Origin : u32 { |     enum class Origin : u32 { | ||||||
|         Center = 0, |         Center = 0, | ||||||
|         Corner = 1, |         Corner = 1, | ||||||
|  |  | ||||||
|  | @ -51,6 +51,13 @@ void KeplerCompute::CallMethod(const GPU::MethodCall& method_call) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void KeplerCompute::CallMultiMethod(u32 method, const u32* base_start, u32 amount, | ||||||
|  |                                     u32 methods_pending) { | ||||||
|  |     for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |         CallMethod({method, base_start[i], 0, methods_pending - static_cast<u32>(i)}); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| Texture::FullTextureInfo KeplerCompute::GetTexture(std::size_t offset) const { | Texture::FullTextureInfo KeplerCompute::GetTexture(std::size_t offset) const { | ||||||
|     const std::bitset<8> cbuf_mask = launch_description.const_buffer_enable_mask.Value(); |     const std::bitset<8> cbuf_mask = launch_description.const_buffer_enable_mask.Value(); | ||||||
|     ASSERT(cbuf_mask[regs.tex_cb_index]); |     ASSERT(cbuf_mask[regs.tex_cb_index]); | ||||||
|  |  | ||||||
|  | @ -202,6 +202,9 @@ public: | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Write multiple values to the register identified by method.
 | ||||||
|  |     void CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending); | ||||||
|  | 
 | ||||||
|     Texture::FullTextureInfo GetTexture(std::size_t offset) const; |     Texture::FullTextureInfo GetTexture(std::size_t offset) const; | ||||||
| 
 | 
 | ||||||
|     /// Given a texture handle, returns the TSC and TIC entries.
 |     /// Given a texture handle, returns the TSC and TIC entries.
 | ||||||
|  |  | ||||||
|  | @ -41,4 +41,11 @@ void KeplerMemory::CallMethod(const GPU::MethodCall& method_call) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void KeplerMemory::CallMultiMethod(u32 method, const u32* base_start, u32 amount, | ||||||
|  |                                    u32 methods_pending) { | ||||||
|  |     for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |         CallMethod({method, base_start[i], 0, methods_pending - static_cast<u32>(i)}); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| } // namespace Tegra::Engines
 | } // namespace Tegra::Engines
 | ||||||
|  |  | ||||||
|  | @ -40,6 +40,9 @@ public: | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Write multiple values to the register identified by method.
 | ||||||
|  |     void CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending); | ||||||
|  | 
 | ||||||
|     struct Regs { |     struct Regs { | ||||||
|         static constexpr size_t NUM_REGS = 0x7F; |         static constexpr size_t NUM_REGS = 0x7F; | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -280,6 +280,58 @@ void Maxwell3D::CallMethod(const GPU::MethodCall& method_call) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void Maxwell3D::CallMultiMethod(u32 method, const u32* base_start, u32 amount, | ||||||
|  |                                 u32 methods_pending) { | ||||||
|  |     // Methods after 0xE00 are special, they're actually triggers for some microcode that was
 | ||||||
|  |     // uploaded to the GPU during initialization.
 | ||||||
|  |     if (method >= MacroRegistersStart) { | ||||||
|  |         // We're trying to execute a macro
 | ||||||
|  |         if (executing_macro == 0) { | ||||||
|  |             // A macro call must begin by writing the macro method's register, not its argument.
 | ||||||
|  |             ASSERT_MSG((method % 2) == 0, | ||||||
|  |                        "Can't start macro execution by writing to the ARGS register"); | ||||||
|  |             executing_macro = method; | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |             macro_params.push_back(base_start[i]); | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         // Call the macro when there are no more parameters in the command buffer
 | ||||||
|  |         if (amount == methods_pending) { | ||||||
|  |             CallMacroMethod(executing_macro, macro_params.size(), macro_params.data()); | ||||||
|  |             macro_params.clear(); | ||||||
|  |         } | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  |     switch (method) { | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[0]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[1]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[2]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[3]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[4]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[5]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[6]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[7]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[8]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[9]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[10]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[11]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[12]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[13]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[14]): | ||||||
|  |     case MAXWELL3D_REG_INDEX(const_buffer.cb_data[15]): { | ||||||
|  |         ProcessCBMultiData(method, base_start, amount); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     default: { | ||||||
|  |         for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |             CallMethod({method, base_start[i], 0, methods_pending - static_cast<u32>(i)}); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void Maxwell3D::StepInstance(const MMEDrawMode expected_mode, const u32 count) { | void Maxwell3D::StepInstance(const MMEDrawMode expected_mode, const u32 count) { | ||||||
|     if (mme_draw.current_mode == MMEDrawMode::Undefined) { |     if (mme_draw.current_mode == MMEDrawMode::Undefined) { | ||||||
|         if (mme_draw.gl_begin_consume) { |         if (mme_draw.gl_begin_consume) { | ||||||
|  | @ -570,6 +622,28 @@ void Maxwell3D::StartCBData(u32 method) { | ||||||
|     ProcessCBData(regs.const_buffer.cb_data[cb_data_state.id]); |     ProcessCBData(regs.const_buffer.cb_data[cb_data_state.id]); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void Maxwell3D::ProcessCBMultiData(u32 method, const u32* start_base, u32 amount) { | ||||||
|  |     if (cb_data_state.current != method) { | ||||||
|  |         if (cb_data_state.current != null_cb_data) { | ||||||
|  |             FinishCBData(); | ||||||
|  |         } | ||||||
|  |         constexpr u32 first_cb_data = MAXWELL3D_REG_INDEX(const_buffer.cb_data[0]); | ||||||
|  |         cb_data_state.start_pos = regs.const_buffer.cb_pos; | ||||||
|  |         cb_data_state.id = method - first_cb_data; | ||||||
|  |         cb_data_state.current = method; | ||||||
|  |         cb_data_state.counter = 0; | ||||||
|  |     } | ||||||
|  |     const std::size_t id = cb_data_state.id; | ||||||
|  |     const std::size_t size = amount; | ||||||
|  |     std::size_t i = 0; | ||||||
|  |     for (; i < size; i++) { | ||||||
|  |         cb_data_state.buffer[id][cb_data_state.counter] = start_base[i]; | ||||||
|  |         cb_data_state.counter++; | ||||||
|  |     } | ||||||
|  |     // Increment the current buffer position.
 | ||||||
|  |     regs.const_buffer.cb_pos = regs.const_buffer.cb_pos + 4 * amount; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void Maxwell3D::FinishCBData() { | void Maxwell3D::FinishCBData() { | ||||||
|     // Write the input value to the current const buffer at the current position.
 |     // Write the input value to the current const buffer at the current position.
 | ||||||
|     const GPUVAddr buffer_address = regs.const_buffer.BufferAddress(); |     const GPUVAddr buffer_address = regs.const_buffer.BufferAddress(); | ||||||
|  |  | ||||||
|  | @ -1359,6 +1359,9 @@ public: | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Write multiple values to the register identified by method.
 | ||||||
|  |     void CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending); | ||||||
|  | 
 | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethodFromMME(const GPU::MethodCall& method_call); |     void CallMethodFromMME(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  | @ -1512,6 +1515,7 @@ private: | ||||||
|     /// Handles a write to the CB_DATA[i] register.
 |     /// Handles a write to the CB_DATA[i] register.
 | ||||||
|     void StartCBData(u32 method); |     void StartCBData(u32 method); | ||||||
|     void ProcessCBData(u32 value); |     void ProcessCBData(u32 value); | ||||||
|  |     void ProcessCBMultiData(u32 method, const u32* start_base, u32 amount); | ||||||
|     void FinishCBData(); |     void FinishCBData(); | ||||||
| 
 | 
 | ||||||
|     /// Handles a write to the CB_BIND register.
 |     /// Handles a write to the CB_BIND register.
 | ||||||
|  |  | ||||||
|  | @ -36,6 +36,13 @@ void MaxwellDMA::CallMethod(const GPU::MethodCall& method_call) { | ||||||
| #undef MAXWELLDMA_REG_INDEX | #undef MAXWELLDMA_REG_INDEX | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void MaxwellDMA::CallMultiMethod(u32 method, const u32* base_start, u32 amount, | ||||||
|  |                                  u32 methods_pending) { | ||||||
|  |     for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |         CallMethod({method, base_start[i], 0, methods_pending - static_cast<u32>(i)}); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void MaxwellDMA::HandleCopy() { | void MaxwellDMA::HandleCopy() { | ||||||
|     LOG_TRACE(HW_GPU, "Requested a DMA copy"); |     LOG_TRACE(HW_GPU, "Requested a DMA copy"); | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -35,6 +35,9 @@ public: | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Write multiple values to the register identified by method.
 | ||||||
|  |     void CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending); | ||||||
|  | 
 | ||||||
|     struct Regs { |     struct Regs { | ||||||
|         static constexpr std::size_t NUM_REGS = 0x1D6; |         static constexpr std::size_t NUM_REGS = 0x1D6; | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -9,6 +9,7 @@ | ||||||
| #include "core/core_timing_util.h" | #include "core/core_timing_util.h" | ||||||
| #include "core/frontend/emu_window.h" | #include "core/frontend/emu_window.h" | ||||||
| #include "core/memory.h" | #include "core/memory.h" | ||||||
|  | #include "core/settings.h" | ||||||
| #include "video_core/engines/fermi_2d.h" | #include "video_core/engines/fermi_2d.h" | ||||||
| #include "video_core/engines/kepler_compute.h" | #include "video_core/engines/kepler_compute.h" | ||||||
| #include "video_core/engines/kepler_memory.h" | #include "video_core/engines/kepler_memory.h" | ||||||
|  | @ -154,7 +155,10 @@ u64 GPU::GetTicks() const { | ||||||
|     constexpr u64 gpu_ticks_den = 625; |     constexpr u64 gpu_ticks_den = 625; | ||||||
| 
 | 
 | ||||||
|     const u64 cpu_ticks = system.CoreTiming().GetTicks(); |     const u64 cpu_ticks = system.CoreTiming().GetTicks(); | ||||||
|     const u64 nanoseconds = Core::Timing::CyclesToNs(cpu_ticks).count(); |     u64 nanoseconds = Core::Timing::CyclesToNs(cpu_ticks).count(); | ||||||
|  |     if (Settings::values.use_fast_gpu_time) { | ||||||
|  |         nanoseconds /= 256; | ||||||
|  |     } | ||||||
|     const u64 nanoseconds_num = nanoseconds / gpu_ticks_den; |     const u64 nanoseconds_num = nanoseconds / gpu_ticks_den; | ||||||
|     const u64 nanoseconds_rem = nanoseconds % gpu_ticks_den; |     const u64 nanoseconds_rem = nanoseconds % gpu_ticks_den; | ||||||
|     return nanoseconds_num * gpu_ticks_num + (nanoseconds_rem * gpu_ticks_num) / gpu_ticks_den; |     return nanoseconds_num * gpu_ticks_num + (nanoseconds_rem * gpu_ticks_num) / gpu_ticks_den; | ||||||
|  | @ -209,16 +213,32 @@ void GPU::CallMethod(const MethodCall& method_call) { | ||||||
| 
 | 
 | ||||||
|     ASSERT(method_call.subchannel < bound_engines.size()); |     ASSERT(method_call.subchannel < bound_engines.size()); | ||||||
| 
 | 
 | ||||||
|     if (ExecuteMethodOnEngine(method_call)) { |     if (ExecuteMethodOnEngine(method_call.method)) { | ||||||
|         CallEngineMethod(method_call); |         CallEngineMethod(method_call); | ||||||
|     } else { |     } else { | ||||||
|         CallPullerMethod(method_call); |         CallPullerMethod(method_call); | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| bool GPU::ExecuteMethodOnEngine(const MethodCall& method_call) { | void GPU::CallMultiMethod(u32 method, u32 subchannel, const u32* base_start, u32 amount, | ||||||
|     const auto method = static_cast<BufferMethods>(method_call.method); |                           u32 methods_pending) { | ||||||
|     return method >= BufferMethods::NonPullerMethods; |     LOG_TRACE(HW_GPU, "Processing method {:08X} on subchannel {}", method, subchannel); | ||||||
|  | 
 | ||||||
|  |     ASSERT(subchannel < bound_engines.size()); | ||||||
|  | 
 | ||||||
|  |     if (ExecuteMethodOnEngine(method)) { | ||||||
|  |         CallEngineMultiMethod(method, subchannel, base_start, amount, methods_pending); | ||||||
|  |     } else { | ||||||
|  |         for (std::size_t i = 0; i < amount; i++) { | ||||||
|  |             CallPullerMethod( | ||||||
|  |                 {method, base_start[i], subchannel, methods_pending - static_cast<u32>(i)}); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | bool GPU::ExecuteMethodOnEngine(u32 method) { | ||||||
|  |     const auto buffer_method = static_cast<BufferMethods>(method); | ||||||
|  |     return buffer_method >= BufferMethods::NonPullerMethods; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void GPU::CallPullerMethod(const MethodCall& method_call) { | void GPU::CallPullerMethod(const MethodCall& method_call) { | ||||||
|  | @ -298,6 +318,31 @@ void GPU::CallEngineMethod(const MethodCall& method_call) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void GPU::CallEngineMultiMethod(u32 method, u32 subchannel, const u32* base_start, u32 amount, | ||||||
|  |                                 u32 methods_pending) { | ||||||
|  |     const EngineID engine = bound_engines[subchannel]; | ||||||
|  | 
 | ||||||
|  |     switch (engine) { | ||||||
|  |     case EngineID::FERMI_TWOD_A: | ||||||
|  |         fermi_2d->CallMultiMethod(method, base_start, amount, methods_pending); | ||||||
|  |         break; | ||||||
|  |     case EngineID::MAXWELL_B: | ||||||
|  |         maxwell_3d->CallMultiMethod(method, base_start, amount, methods_pending); | ||||||
|  |         break; | ||||||
|  |     case EngineID::KEPLER_COMPUTE_B: | ||||||
|  |         kepler_compute->CallMultiMethod(method, base_start, amount, methods_pending); | ||||||
|  |         break; | ||||||
|  |     case EngineID::MAXWELL_DMA_COPY_A: | ||||||
|  |         maxwell_dma->CallMultiMethod(method, base_start, amount, methods_pending); | ||||||
|  |         break; | ||||||
|  |     case EngineID::KEPLER_INLINE_TO_MEMORY_B: | ||||||
|  |         kepler_memory->CallMultiMethod(method, base_start, amount, methods_pending); | ||||||
|  |         break; | ||||||
|  |     default: | ||||||
|  |         UNIMPLEMENTED_MSG("Unimplemented engine"); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void GPU::ProcessBindMethod(const MethodCall& method_call) { | void GPU::ProcessBindMethod(const MethodCall& method_call) { | ||||||
|     // Bind the current subchannel to the desired engine id.
 |     // Bind the current subchannel to the desired engine id.
 | ||||||
|     LOG_DEBUG(HW_GPU, "Binding subchannel {} to engine {}", method_call.subchannel, |     LOG_DEBUG(HW_GPU, "Binding subchannel {} to engine {}", method_call.subchannel, | ||||||
|  |  | ||||||
|  | @ -155,6 +155,10 @@ public: | ||||||
|     /// Calls a GPU method.
 |     /// Calls a GPU method.
 | ||||||
|     void CallMethod(const MethodCall& method_call); |     void CallMethod(const MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Calls a GPU multivalue method.
 | ||||||
|  |     void CallMultiMethod(u32 method, u32 subchannel, const u32* base_start, u32 amount, | ||||||
|  |                          u32 methods_pending); | ||||||
|  | 
 | ||||||
|     /// Flush all current written commands into the host GPU for execution.
 |     /// Flush all current written commands into the host GPU for execution.
 | ||||||
|     void FlushCommands(); |     void FlushCommands(); | ||||||
|     /// Synchronizes CPU writes with Host GPU memory.
 |     /// Synchronizes CPU writes with Host GPU memory.
 | ||||||
|  | @ -309,8 +313,12 @@ private: | ||||||
|     /// Calls a GPU engine method.
 |     /// Calls a GPU engine method.
 | ||||||
|     void CallEngineMethod(const MethodCall& method_call); |     void CallEngineMethod(const MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
|  |     /// Calls a GPU engine multivalue method.
 | ||||||
|  |     void CallEngineMultiMethod(u32 method, u32 subchannel, const u32* base_start, u32 amount, | ||||||
|  |                                u32 methods_pending); | ||||||
|  | 
 | ||||||
|     /// Determines where the method should be executed.
 |     /// Determines where the method should be executed.
 | ||||||
|     bool ExecuteMethodOnEngine(const MethodCall& method_call); |     bool ExecuteMethodOnEngine(u32 method); | ||||||
| 
 | 
 | ||||||
| protected: | protected: | ||||||
|     std::unique_ptr<Tegra::DmaPusher> dma_pusher; |     std::unique_ptr<Tegra::DmaPusher> dma_pusher; | ||||||
|  |  | ||||||
|  | @ -643,6 +643,8 @@ void Config::ReadRendererValues() { | ||||||
|     Settings::values.use_asynchronous_gpu_emulation = |     Settings::values.use_asynchronous_gpu_emulation = | ||||||
|         ReadSetting(QStringLiteral("use_asynchronous_gpu_emulation"), false).toBool(); |         ReadSetting(QStringLiteral("use_asynchronous_gpu_emulation"), false).toBool(); | ||||||
|     Settings::values.use_vsync = ReadSetting(QStringLiteral("use_vsync"), true).toBool(); |     Settings::values.use_vsync = ReadSetting(QStringLiteral("use_vsync"), true).toBool(); | ||||||
|  |     Settings::values.use_fast_gpu_time = | ||||||
|  |         ReadSetting(QStringLiteral("use_fast_gpu_time"), true).toBool(); | ||||||
|     Settings::values.force_30fps_mode = |     Settings::values.force_30fps_mode = | ||||||
|         ReadSetting(QStringLiteral("force_30fps_mode"), false).toBool(); |         ReadSetting(QStringLiteral("force_30fps_mode"), false).toBool(); | ||||||
| 
 | 
 | ||||||
|  | @ -1084,6 +1086,7 @@ void Config::SaveRendererValues() { | ||||||
|     WriteSetting(QStringLiteral("use_asynchronous_gpu_emulation"), |     WriteSetting(QStringLiteral("use_asynchronous_gpu_emulation"), | ||||||
|                  Settings::values.use_asynchronous_gpu_emulation, false); |                  Settings::values.use_asynchronous_gpu_emulation, false); | ||||||
|     WriteSetting(QStringLiteral("use_vsync"), Settings::values.use_vsync, true); |     WriteSetting(QStringLiteral("use_vsync"), Settings::values.use_vsync, true); | ||||||
|  |     WriteSetting(QStringLiteral("use_fast_gpu_time"), Settings::values.use_fast_gpu_time, true); | ||||||
|     WriteSetting(QStringLiteral("force_30fps_mode"), Settings::values.force_30fps_mode, false); |     WriteSetting(QStringLiteral("force_30fps_mode"), Settings::values.force_30fps_mode, false); | ||||||
| 
 | 
 | ||||||
|     // Cast to double because Qt's written float values are not human-readable
 |     // Cast to double because Qt's written float values are not human-readable
 | ||||||
|  |  | ||||||
|  | @ -22,6 +22,7 @@ void ConfigureGraphicsAdvanced::SetConfiguration() { | ||||||
|     ui->gpu_accuracy->setCurrentIndex(static_cast<int>(Settings::values.gpu_accuracy)); |     ui->gpu_accuracy->setCurrentIndex(static_cast<int>(Settings::values.gpu_accuracy)); | ||||||
|     ui->use_vsync->setEnabled(runtime_lock); |     ui->use_vsync->setEnabled(runtime_lock); | ||||||
|     ui->use_vsync->setChecked(Settings::values.use_vsync); |     ui->use_vsync->setChecked(Settings::values.use_vsync); | ||||||
|  |     ui->use_fast_gpu_time->setChecked(Settings::values.use_fast_gpu_time); | ||||||
|     ui->force_30fps_mode->setEnabled(runtime_lock); |     ui->force_30fps_mode->setEnabled(runtime_lock); | ||||||
|     ui->force_30fps_mode->setChecked(Settings::values.force_30fps_mode); |     ui->force_30fps_mode->setChecked(Settings::values.force_30fps_mode); | ||||||
|     ui->anisotropic_filtering_combobox->setEnabled(runtime_lock); |     ui->anisotropic_filtering_combobox->setEnabled(runtime_lock); | ||||||
|  | @ -32,6 +33,7 @@ void ConfigureGraphicsAdvanced::ApplyConfiguration() { | ||||||
|     auto gpu_accuracy = static_cast<Settings::GPUAccuracy>(ui->gpu_accuracy->currentIndex()); |     auto gpu_accuracy = static_cast<Settings::GPUAccuracy>(ui->gpu_accuracy->currentIndex()); | ||||||
|     Settings::values.gpu_accuracy = gpu_accuracy; |     Settings::values.gpu_accuracy = gpu_accuracy; | ||||||
|     Settings::values.use_vsync = ui->use_vsync->isChecked(); |     Settings::values.use_vsync = ui->use_vsync->isChecked(); | ||||||
|  |     Settings::values.use_fast_gpu_time = ui->use_fast_gpu_time->isChecked(); | ||||||
|     Settings::values.force_30fps_mode = ui->force_30fps_mode->isChecked(); |     Settings::values.force_30fps_mode = ui->force_30fps_mode->isChecked(); | ||||||
|     Settings::values.max_anisotropy = ui->anisotropic_filtering_combobox->currentIndex(); |     Settings::values.max_anisotropy = ui->anisotropic_filtering_combobox->currentIndex(); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -69,6 +69,13 @@ | ||||||
|           </property> |           </property> | ||||||
|          </widget> |          </widget> | ||||||
|         </item> |         </item> | ||||||
|  |         <item> | ||||||
|  |          <widget class="QCheckBox" name="use_fast_gpu_time"> | ||||||
|  |           <property name="text"> | ||||||
|  |            <string>Use Fast GPU Time</string> | ||||||
|  |           </property> | ||||||
|  |          </widget> | ||||||
|  |         </item> | ||||||
|         <item> |         <item> | ||||||
|          <layout class="QHBoxLayout" name="horizontalLayout_1"> |          <layout class="QHBoxLayout" name="horizontalLayout_1"> | ||||||
|           <item> |           <item> | ||||||
|  |  | ||||||
|  | @ -394,6 +394,8 @@ void Config::ReadValues() { | ||||||
|         sdl2_config->GetBoolean("Renderer", "use_asynchronous_gpu_emulation", false); |         sdl2_config->GetBoolean("Renderer", "use_asynchronous_gpu_emulation", false); | ||||||
|     Settings::values.use_vsync = |     Settings::values.use_vsync = | ||||||
|         static_cast<u16>(sdl2_config->GetInteger("Renderer", "use_vsync", 1)); |         static_cast<u16>(sdl2_config->GetInteger("Renderer", "use_vsync", 1)); | ||||||
|  |     Settings::values.use_fast_gpu_time = | ||||||
|  |         sdl2_config->GetBoolean("Renderer", "use_fast_gpu_time", true); | ||||||
| 
 | 
 | ||||||
|     Settings::values.bg_red = static_cast<float>(sdl2_config->GetReal("Renderer", "bg_red", 0.0)); |     Settings::values.bg_red = static_cast<float>(sdl2_config->GetReal("Renderer", "bg_red", 0.0)); | ||||||
|     Settings::values.bg_green = |     Settings::values.bg_green = | ||||||
|  |  | ||||||
|  | @ -130,6 +130,8 @@ void Config::ReadValues() { | ||||||
|     Settings::values.gpu_accuracy = static_cast<Settings::GPUAccuracy>(gpu_accuracy_level); |     Settings::values.gpu_accuracy = static_cast<Settings::GPUAccuracy>(gpu_accuracy_level); | ||||||
|     Settings::values.use_asynchronous_gpu_emulation = |     Settings::values.use_asynchronous_gpu_emulation = | ||||||
|         sdl2_config->GetBoolean("Renderer", "use_asynchronous_gpu_emulation", false); |         sdl2_config->GetBoolean("Renderer", "use_asynchronous_gpu_emulation", false); | ||||||
|  |     Settings::values.use_fast_gpu_time = | ||||||
|  |         sdl2_config->GetBoolean("Renderer", "use_fast_gpu_time", true); | ||||||
| 
 | 
 | ||||||
|     Settings::values.bg_red = static_cast<float>(sdl2_config->GetReal("Renderer", "bg_red", 0.0)); |     Settings::values.bg_red = static_cast<float>(sdl2_config->GetReal("Renderer", "bg_red", 0.0)); | ||||||
|     Settings::values.bg_green = |     Settings::values.bg_green = | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 bunnei
						bunnei