forked from eden-emu/eden
		
	pica/command_processor: build geometry pipeline and run geometry shader
The geometry pipeline manages data transfer between the VS, the GS and the primitive assembler. It has four known modes: - no GS mode: sends VS output directly to the primitive assembler (what citra currently does) - GS mode 0: sends VS output to GS input registers, and sends GS output to the primitive assembler - GS mode 1: sends VS output to GS uniform registers, and sends GS output to the primitive assembler. It also takes an index from the index buffer at the beginning of each primitive to determine the primitive size. - GS mode 2: similar to mode 1, but doesn't take the index and uses a fixed primitive size. hwtest shows that immediate mode also supports GS (at least for mode 0), so the geometry pipeline is refactored into its own class to support both drawing modes. In immediate mode, some games don't set the pipeline registers to valid values until the first attribute input, so a geometry pipeline reset flag is set when the `pipeline.vs_default_attributes_setup.index` register is written, and the actual pipeline reconfiguration is performed on the first attribute input. In the normal drawing mode with an index buffer, the vertex cache is slightly modified to support the geometry pipeline. Instead of OutputVertex, it now holds AttributeBuffer, which is the input to the geometry pipeline. The AttributeBuffer->OutputVertex conversion is done inside the pipeline vertex handler. The actual hardware vertex cache is believed to be implemented in a similar way (because this is the only way that makes sense). Both the geometry pipeline and the GS unit rely on state being preserved across draw calls, so they are put into the global state. In the future, the other three vertex shader units should also be placed in the global state, and a scheduler should be implemented on top of the four units. Note that the current gs_unit already allows running VS on it in the future.
This commit is contained in:
		
							parent
							
								
									8285ca4ad8
								
							
						
					
					
						commit
						0f35755572
					
				
					 6 changed files with 383 additions and 28 deletions
				
			
		|  | @ -161,6 +161,7 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
| 
 | ||||
|     case PICA_REG_INDEX(pipeline.vs_default_attributes_setup.index): | ||||
|         g_state.immediate.current_attribute = 0; | ||||
|         g_state.immediate.reset_geometry_pipeline = true; | ||||
|         default_attr_counter = 0; | ||||
|         break; | ||||
| 
 | ||||
|  | @ -234,16 +235,14 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
|                     shader_engine->Run(g_state.vs, shader_unit); | ||||
|                     shader_unit.WriteOutput(regs.vs, output); | ||||
| 
 | ||||
|                     // Send to renderer
 | ||||
|                     using Pica::Shader::OutputVertex; | ||||
|                     auto AddTriangle = [](const OutputVertex& v0, const OutputVertex& v1, | ||||
|                                           const OutputVertex& v2) { | ||||
|                         VideoCore::g_renderer->Rasterizer()->AddTriangle(v0, v1, v2); | ||||
|                     }; | ||||
| 
 | ||||
|                     g_state.primitive_assembler.SubmitVertex( | ||||
|                         Shader::OutputVertex::FromAttributeBuffer(regs.rasterizer, output), | ||||
|                         AddTriangle); | ||||
|                     // Send to geometry pipeline
 | ||||
|                     if (g_state.immediate.reset_geometry_pipeline) { | ||||
|                         g_state.geometry_pipeline.Reconfigure(); | ||||
|                         g_state.immediate.reset_geometry_pipeline = false; | ||||
|                     } | ||||
|                     ASSERT(!g_state.geometry_pipeline.NeedIndexInput()); | ||||
|                     g_state.geometry_pipeline.Setup(shader_engine); | ||||
|                     g_state.geometry_pipeline.SubmitVertex(output); | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|  | @ -321,8 +320,8 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
|         // The size has been tuned for optimal balance between hit-rate and the cost of lookup
 | ||||
|         const size_t VERTEX_CACHE_SIZE = 32; | ||||
|         std::array<u16, VERTEX_CACHE_SIZE> vertex_cache_ids; | ||||
|         std::array<Shader::OutputVertex, VERTEX_CACHE_SIZE> vertex_cache; | ||||
|         Shader::OutputVertex output_vertex; | ||||
|         std::array<Shader::AttributeBuffer, VERTEX_CACHE_SIZE> vertex_cache; | ||||
|         Shader::AttributeBuffer vs_output; | ||||
| 
 | ||||
|         unsigned int vertex_cache_pos = 0; | ||||
|         vertex_cache_ids.fill(-1); | ||||
|  | @ -332,6 +331,11 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
| 
 | ||||
|         shader_engine->SetupBatch(g_state.vs, regs.vs.main_offset); | ||||
| 
 | ||||
|         g_state.geometry_pipeline.Reconfigure(); | ||||
|         g_state.geometry_pipeline.Setup(shader_engine); | ||||
|         if (g_state.geometry_pipeline.NeedIndexInput()) | ||||
|             ASSERT(is_indexed); | ||||
| 
 | ||||
|         for (unsigned int index = 0; index < regs.pipeline.num_vertices; ++index) { | ||||
|             // Indexed rendering doesn't use the start offset
 | ||||
|             unsigned int vertex = | ||||
|  | @ -345,6 +349,11 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
|             bool vertex_cache_hit = false; | ||||
| 
 | ||||
|             if (is_indexed) { | ||||
|                 if (g_state.geometry_pipeline.NeedIndexInput()) { | ||||
|                     g_state.geometry_pipeline.SubmitIndex(vertex); | ||||
|                     continue; | ||||
|                 } | ||||
| 
 | ||||
|                 if (g_debug_context && Pica::g_debug_context->recorder) { | ||||
|                     int size = index_u16 ? 2 : 1; | ||||
|                     memory_accesses.AddAccess(base_address + index_info.offset + size * index, | ||||
|  | @ -353,7 +362,7 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
| 
 | ||||
|                 for (unsigned int i = 0; i < VERTEX_CACHE_SIZE; ++i) { | ||||
|                     if (vertex == vertex_cache_ids[i]) { | ||||
|                         output_vertex = vertex_cache[i]; | ||||
|                         vs_output = vertex_cache[i]; | ||||
|                         vertex_cache_hit = true; | ||||
|                         break; | ||||
|                     } | ||||
|  | @ -362,7 +371,7 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
| 
 | ||||
|             if (!vertex_cache_hit) { | ||||
|                 // Initialize data for the current vertex
 | ||||
|                 Shader::AttributeBuffer input, output{}; | ||||
|                 Shader::AttributeBuffer input; | ||||
|                 loader.LoadVertex(base_address, index, vertex, input, memory_accesses); | ||||
| 
 | ||||
|                 // Send to vertex shader
 | ||||
|  | @ -371,26 +380,17 @@ static void WritePicaReg(u32 id, u32 value, u32 mask) { | |||
|                                              (void*)&input); | ||||
|                 shader_unit.LoadInput(regs.vs, input); | ||||
|                 shader_engine->Run(g_state.vs, shader_unit); | ||||
|                 shader_unit.WriteOutput(regs.vs, output); | ||||
| 
 | ||||
|                 // Retrieve vertex from register data
 | ||||
|                 output_vertex = Shader::OutputVertex::FromAttributeBuffer(regs.rasterizer, output); | ||||
|                 shader_unit.WriteOutput(regs.vs, vs_output); | ||||
| 
 | ||||
|                 if (is_indexed) { | ||||
|                     vertex_cache[vertex_cache_pos] = output_vertex; | ||||
|                     vertex_cache[vertex_cache_pos] = vs_output; | ||||
|                     vertex_cache_ids[vertex_cache_pos] = vertex; | ||||
|                     vertex_cache_pos = (vertex_cache_pos + 1) % VERTEX_CACHE_SIZE; | ||||
|                 } | ||||
|             } | ||||
| 
 | ||||
|             // Send to renderer
 | ||||
|             using Pica::Shader::OutputVertex; | ||||
|             auto AddTriangle = [](const OutputVertex& v0, const OutputVertex& v1, | ||||
|                                   const OutputVertex& v2) { | ||||
|                 VideoCore::g_renderer->Rasterizer()->AddTriangle(v0, v1, v2); | ||||
|             }; | ||||
| 
 | ||||
|             primitive_assembler.SubmitVertex(output_vertex, AddTriangle); | ||||
|             // Send to geometry pipeline
 | ||||
|             g_state.geometry_pipeline.SubmitVertex(vs_output); | ||||
|         } | ||||
| 
 | ||||
|         for (auto& range : memory_accesses.ranges) { | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 wwylele
						wwylele