forked from eden-emu/eden
		
	maxwell_3d: Use std::bitset to manage dirty flags
This commit is contained in:
		
							parent
							
								
									d07526cd2b
								
							
						
					
					
						commit
						20d8c304f2
					
				
					 4 changed files with 51 additions and 52 deletions
				
			
		|  | @ -107,21 +107,23 @@ void Maxwell3D::CallMacroMethod(u32 method, std::vector<u32> parameters) { | |||
| void Maxwell3D::CallMethod(const GPU::MethodCall& method_call) { | ||||
|     auto debug_context = system.GetGPUDebugContext(); | ||||
| 
 | ||||
|     const u32 method = method_call.method; | ||||
| 
 | ||||
|     // It is an error to write to a register other than the current macro's ARG register before it
 | ||||
|     // has finished execution.
 | ||||
|     if (executing_macro != 0) { | ||||
|         ASSERT(method_call.method == executing_macro + 1); | ||||
|         ASSERT(method == executing_macro + 1); | ||||
|     } | ||||
| 
 | ||||
|     // Methods after 0xE00 are special, they're actually triggers for some microcode that was
 | ||||
|     // uploaded to the GPU during initialization.
 | ||||
|     if (method_call.method >= MacroRegistersStart) { | ||||
|     if (method >= MacroRegistersStart) { | ||||
|         // We're trying to execute a macro
 | ||||
|         if (executing_macro == 0) { | ||||
|             // A macro call must begin by writing the macro method's register, not its argument.
 | ||||
|             ASSERT_MSG((method_call.method % 2) == 0, | ||||
|             ASSERT_MSG((method % 2) == 0, | ||||
|                        "Can't start macro execution by writing to the ARGS register"); | ||||
|             executing_macro = method_call.method; | ||||
|             executing_macro = method; | ||||
|         } | ||||
| 
 | ||||
|         macro_params.push_back(method_call.argument); | ||||
|  | @ -133,66 +135,62 @@ void Maxwell3D::CallMethod(const GPU::MethodCall& method_call) { | |||
|         return; | ||||
|     } | ||||
| 
 | ||||
|     ASSERT_MSG(method_call.method < Regs::NUM_REGS, | ||||
|     ASSERT_MSG(method < Regs::NUM_REGS, | ||||
|                "Invalid Maxwell3D register, increase the size of the Regs structure"); | ||||
| 
 | ||||
|     if (debug_context) { | ||||
|         debug_context->OnEvent(Tegra::DebugContext::Event::MaxwellCommandLoaded, nullptr); | ||||
|     } | ||||
| 
 | ||||
|     if (regs.reg_array[method_call.method] != method_call.argument) { | ||||
|         regs.reg_array[method_call.method] = method_call.argument; | ||||
|     if (regs.reg_array[method] != method_call.argument) { | ||||
|         regs.reg_array[method] = method_call.argument; | ||||
|         // Color buffers
 | ||||
|         constexpr u32 first_rt_reg = MAXWELL3D_REG_INDEX(rt); | ||||
|         constexpr u32 registers_per_rt = sizeof(regs.rt[0]) / sizeof(u32); | ||||
|         if (method_call.method >= first_rt_reg && | ||||
|             method_call.method < first_rt_reg + registers_per_rt * Regs::NumRenderTargets) { | ||||
|             const std::size_t rt_index = (method_call.method - first_rt_reg) / registers_per_rt; | ||||
|             dirty_flags.color_buffer |= 1u << static_cast<u32>(rt_index); | ||||
|         if (method >= first_rt_reg && | ||||
|             method < first_rt_reg + registers_per_rt * Regs::NumRenderTargets) { | ||||
|             const std::size_t rt_index = (method - first_rt_reg) / registers_per_rt; | ||||
|             dirty_flags.color_buffer.set(rt_index); | ||||
|         } | ||||
| 
 | ||||
|         // Zeta buffer
 | ||||
|         constexpr u32 registers_in_zeta = sizeof(regs.zeta) / sizeof(u32); | ||||
|         if (method_call.method == MAXWELL3D_REG_INDEX(zeta_enable) || | ||||
|             method_call.method == MAXWELL3D_REG_INDEX(zeta_width) || | ||||
|             method_call.method == MAXWELL3D_REG_INDEX(zeta_height) || | ||||
|             (method_call.method >= MAXWELL3D_REG_INDEX(zeta) && | ||||
|              method_call.method < MAXWELL3D_REG_INDEX(zeta) + registers_in_zeta)) { | ||||
|         if (method == MAXWELL3D_REG_INDEX(zeta_enable) || | ||||
|             method == MAXWELL3D_REG_INDEX(zeta_width) || | ||||
|             method == MAXWELL3D_REG_INDEX(zeta_height) || | ||||
|             (method >= MAXWELL3D_REG_INDEX(zeta) && | ||||
|              method < MAXWELL3D_REG_INDEX(zeta) + registers_in_zeta)) { | ||||
|             dirty_flags.zeta_buffer = true; | ||||
|         } | ||||
| 
 | ||||
|         // Shader
 | ||||
|         constexpr u32 shader_registers_count = | ||||
|             sizeof(regs.shader_config[0]) * Regs::MaxShaderProgram / sizeof(u32); | ||||
|         if (method_call.method >= MAXWELL3D_REG_INDEX(shader_config[0]) && | ||||
|             method_call.method < MAXWELL3D_REG_INDEX(shader_config[0]) + shader_registers_count) { | ||||
|         if (method >= MAXWELL3D_REG_INDEX(shader_config[0]) && | ||||
|             method < MAXWELL3D_REG_INDEX(shader_config[0]) + shader_registers_count) { | ||||
|             dirty_flags.shaders = true; | ||||
|         } | ||||
| 
 | ||||
|         // Vertex format
 | ||||
|         if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_attrib_format) && | ||||
|             method_call.method < | ||||
|                 MAXWELL3D_REG_INDEX(vertex_attrib_format) + regs.vertex_attrib_format.size()) { | ||||
|         if (method >= MAXWELL3D_REG_INDEX(vertex_attrib_format) && | ||||
|             method < MAXWELL3D_REG_INDEX(vertex_attrib_format) + regs.vertex_attrib_format.size()) { | ||||
|             dirty_flags.vertex_attrib_format = true; | ||||
|         } | ||||
| 
 | ||||
|         // Vertex buffer
 | ||||
|         if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_array) && | ||||
|             method_call.method < MAXWELL3D_REG_INDEX(vertex_array) + 4 * 32) { | ||||
|             dirty_flags.vertex_array |= | ||||
|                 1u << ((method_call.method - MAXWELL3D_REG_INDEX(vertex_array)) >> 2); | ||||
|         } else if (method_call.method >= MAXWELL3D_REG_INDEX(vertex_array_limit) && | ||||
|                    method_call.method < MAXWELL3D_REG_INDEX(vertex_array_limit) + 2 * 32) { | ||||
|             dirty_flags.vertex_array |= | ||||
|                 1u << ((method_call.method - MAXWELL3D_REG_INDEX(vertex_array_limit)) >> 1); | ||||
|         } else if (method_call.method >= MAXWELL3D_REG_INDEX(instanced_arrays) && | ||||
|                    method_call.method < MAXWELL3D_REG_INDEX(instanced_arrays) + 32) { | ||||
|             dirty_flags.vertex_array |= | ||||
|                 1u << (method_call.method - MAXWELL3D_REG_INDEX(instanced_arrays)); | ||||
|         if (method >= MAXWELL3D_REG_INDEX(vertex_array) && | ||||
|             method < MAXWELL3D_REG_INDEX(vertex_array) + 4 * 32) { | ||||
|             dirty_flags.vertex_array.set((method - MAXWELL3D_REG_INDEX(vertex_array)) >> 2); | ||||
|         } else if (method >= MAXWELL3D_REG_INDEX(vertex_array_limit) && | ||||
|                    method < MAXWELL3D_REG_INDEX(vertex_array_limit) + 2 * 32) { | ||||
|             dirty_flags.vertex_array.set((method - MAXWELL3D_REG_INDEX(vertex_array_limit)) >> 1); | ||||
|         } else if (method >= MAXWELL3D_REG_INDEX(instanced_arrays) && | ||||
|                    method < MAXWELL3D_REG_INDEX(instanced_arrays) + 32) { | ||||
|             dirty_flags.vertex_array.set(method - MAXWELL3D_REG_INDEX(instanced_arrays)); | ||||
|         } | ||||
|     } | ||||
| 
 | ||||
|     switch (method_call.method) { | ||||
|     switch (method) { | ||||
|     case MAXWELL3D_REG_INDEX(macros.data): { | ||||
|         ProcessMacroUpload(method_call.argument); | ||||
|         break; | ||||
|  |  | |||
|  | @ -5,8 +5,10 @@ | |||
| #pragma once | ||||
| 
 | ||||
| #include <array> | ||||
| #include <bitset> | ||||
| #include <unordered_map> | ||||
| #include <vector> | ||||
| 
 | ||||
| #include "common/assert.h" | ||||
| #include "common/bit_field.h" | ||||
| #include "common/common_funcs.h" | ||||
|  | @ -1094,19 +1096,18 @@ public: | |||
|     MemoryManager& memory_manager; | ||||
| 
 | ||||
|     struct DirtyFlags { | ||||
|         u8 color_buffer = 0xFF; | ||||
|         bool zeta_buffer = true; | ||||
| 
 | ||||
|         bool shaders = true; | ||||
|         std::bitset<8> color_buffer{0xFF}; | ||||
|         std::bitset<32> vertex_array{0xFFFFFFFF}; | ||||
| 
 | ||||
|         bool vertex_attrib_format = true; | ||||
|         u32 vertex_array = 0xFFFFFFFF; | ||||
|         bool zeta_buffer = true; | ||||
|         bool shaders = true; | ||||
| 
 | ||||
|         void OnMemoryWrite() { | ||||
|             color_buffer = 0xFF; | ||||
|             zeta_buffer = true; | ||||
|             shaders = true; | ||||
|             vertex_array = 0xFFFFFFFF; | ||||
|             color_buffer.set(); | ||||
|             vertex_array.set(); | ||||
|         } | ||||
|     }; | ||||
| 
 | ||||
|  |  | |||
|  | @ -200,7 +200,7 @@ GLuint RasterizerOpenGL::SetupVertexFormat() { | |||
|     } | ||||
| 
 | ||||
|     // Rebinding the VAO invalidates the vertex buffer bindings.
 | ||||
|     gpu.dirty_flags.vertex_array = 0xFFFFFFFF; | ||||
|     gpu.dirty_flags.vertex_array.set(); | ||||
| 
 | ||||
|     state.draw.vertex_array = vao_entry.handle; | ||||
|     return vao_entry.handle; | ||||
|  | @ -210,14 +210,14 @@ void RasterizerOpenGL::SetupVertexBuffer(GLuint vao) { | |||
|     auto& gpu = Core::System::GetInstance().GPU().Maxwell3D(); | ||||
|     const auto& regs = gpu.regs; | ||||
| 
 | ||||
|     if (!gpu.dirty_flags.vertex_array) | ||||
|     if (gpu.dirty_flags.vertex_array.none()) | ||||
|         return; | ||||
| 
 | ||||
|     MICROPROFILE_SCOPE(OpenGL_VB); | ||||
| 
 | ||||
|     // Upload all guest vertex arrays sequentially to our buffer
 | ||||
|     for (u32 index = 0; index < Maxwell::NumVertexArrays; ++index) { | ||||
|         if (~gpu.dirty_flags.vertex_array & (1u << index)) | ||||
|         if (!gpu.dirty_flags.vertex_array[index]) | ||||
|             continue; | ||||
| 
 | ||||
|         const auto& vertex_array = regs.vertex_array[index]; | ||||
|  | @ -244,7 +244,7 @@ void RasterizerOpenGL::SetupVertexBuffer(GLuint vao) { | |||
|         } | ||||
|     } | ||||
| 
 | ||||
|     gpu.dirty_flags.vertex_array = 0; | ||||
|     gpu.dirty_flags.vertex_array.reset(); | ||||
| } | ||||
| 
 | ||||
| DrawParameters RasterizerOpenGL::SetupDraw() { | ||||
|  | @ -488,13 +488,13 @@ std::pair<bool, bool> RasterizerOpenGL::ConfigureFramebuffers( | |||
|     OpenGLState& current_state, bool using_color_fb, bool using_depth_fb, bool preserve_contents, | ||||
|     std::optional<std::size_t> single_color_target) { | ||||
|     MICROPROFILE_SCOPE(OpenGL_Framebuffer); | ||||
|     const auto& gpu = Core::System::GetInstance().GPU().Maxwell3D(); | ||||
|     auto& gpu = Core::System::GetInstance().GPU().Maxwell3D(); | ||||
|     const auto& regs = gpu.regs; | ||||
| 
 | ||||
|     const FramebufferConfigState fb_config_state{using_color_fb, using_depth_fb, preserve_contents, | ||||
|                                                  single_color_target}; | ||||
|     if (fb_config_state == current_framebuffer_config_state && gpu.dirty_flags.color_buffer == 0 && | ||||
|         !gpu.dirty_flags.zeta_buffer) { | ||||
|     if (fb_config_state == current_framebuffer_config_state && | ||||
|         gpu.dirty_flags.color_buffer.none() && !gpu.dirty_flags.zeta_buffer) { | ||||
|         // Only skip if the previous ConfigureFramebuffers call was from the same kind (multiple or
 | ||||
|         // single color targets). This is done because the guest registers may not change but the
 | ||||
|         // host framebuffer may contain different attachments
 | ||||
|  | @ -721,10 +721,10 @@ void RasterizerOpenGL::DrawArrays() { | |||
|     // Add space for at least 18 constant buffers
 | ||||
|     buffer_size += Maxwell::MaxConstBuffers * (MaxConstbufferSize + uniform_buffer_alignment); | ||||
| 
 | ||||
|     bool invalidate = buffer_cache.Map(buffer_size); | ||||
|     const bool invalidate = buffer_cache.Map(buffer_size); | ||||
|     if (invalidate) { | ||||
|         // As all cached buffers are invalidated, we need to recheck their state.
 | ||||
|         gpu.dirty_flags.vertex_array = 0xFFFFFFFF; | ||||
|         gpu.dirty_flags.vertex_array.set(); | ||||
|     } | ||||
| 
 | ||||
|     const GLuint vao = SetupVertexFormat(); | ||||
|  |  | |||
|  | @ -962,10 +962,10 @@ Surface RasterizerCacheOpenGL::GetColorBufferSurface(std::size_t index, bool pre | |||
|     auto& gpu{Core::System::GetInstance().GPU().Maxwell3D()}; | ||||
|     const auto& regs{gpu.regs}; | ||||
| 
 | ||||
|     if ((gpu.dirty_flags.color_buffer & (1u << static_cast<u32>(index))) == 0) { | ||||
|     if (!gpu.dirty_flags.color_buffer[index]) { | ||||
|         return last_color_buffers[index]; | ||||
|     } | ||||
|     gpu.dirty_flags.color_buffer &= ~(1u << static_cast<u32>(index)); | ||||
|     gpu.dirty_flags.color_buffer.reset(index); | ||||
| 
 | ||||
|     ASSERT(index < Tegra::Engines::Maxwell3D::Regs::NumRenderTargets); | ||||
| 
 | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 ReinUsesLisp
						ReinUsesLisp