forked from eden-emu/eden
		
	shader_decode: Implement TEXS.F16
This commit is contained in:
		
							parent
							
								
									c68c13e1aa
								
							
						
					
					
						commit
						5af82a8ed4
					
				
					 3 changed files with 57 additions and 15 deletions
				
			
		|  | @ -219,8 +219,7 @@ u32 ShaderIR::DecodeMemory(BasicBlock& bb, u32 pc) { | ||||||
|         if (instr.texs.fp32_flag) { |         if (instr.texs.fp32_flag) { | ||||||
|             WriteTexsInstructionFloat(bb, instr, texture); |             WriteTexsInstructionFloat(bb, instr, texture); | ||||||
|         } else { |         } else { | ||||||
|             UNIMPLEMENTED(); |             WriteTexsInstructionHalfFloat(bb, instr, texture); | ||||||
|             // WriteTexsInstructionHalfFloat(bb, instr, texture);
 |  | ||||||
|         } |         } | ||||||
|         break; |         break; | ||||||
|     } |     } | ||||||
|  | @ -416,39 +415,52 @@ const Sampler& ShaderIR::GetSampler(const Tegra::Shader::Sampler& sampler, Textu | ||||||
|     return *used_samplers.emplace(entry).first; |     return *used_samplers.emplace(entry).first; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void ShaderIR::WriteTexsInstructionFloat(BasicBlock& bb, Tegra::Shader::Instruction instr, | void ShaderIR::WriteTexsInstructionFloat(BasicBlock& bb, Instruction instr, Node texture) { | ||||||
|                                          Node texture) { |  | ||||||
|     // TEXS has two destination registers and a swizzle. The first two elements in the swizzle
 |     // TEXS has two destination registers and a swizzle. The first two elements in the swizzle
 | ||||||
|     // go into gpr0+0 and gpr0+1, and the rest goes into gpr28+0 and gpr28+1
 |     // go into gpr0+0 and gpr0+1, and the rest goes into gpr28+0 and gpr28+1
 | ||||||
| 
 | 
 | ||||||
|     MetaComponents meta; |     MetaComponents meta; | ||||||
|     std::array<Node, 4> dest; |     std::array<Node, 4> dest; | ||||||
| 
 |  | ||||||
|     std::size_t written_components = 0; |  | ||||||
|     for (u32 component = 0; component < 4; ++component) { |     for (u32 component = 0; component < 4; ++component) { | ||||||
|         if (!instr.texs.IsComponentEnabled(component)) { |         if (!instr.texs.IsComponentEnabled(component)) { | ||||||
|             continue; |             continue; | ||||||
|         } |         } | ||||||
|         meta.components_map[written_components] = static_cast<u32>(component); |         meta.components_map[meta.count] = component; | ||||||
| 
 | 
 | ||||||
|         if (written_components < 2) { |         if (meta.count < 2) { | ||||||
|             // Write the first two swizzle components to gpr0 and gpr0+1
 |             // Write the first two swizzle components to gpr0 and gpr0+1
 | ||||||
|             dest[written_components] = GetRegister(instr.gpr0.Value() + written_components % 2); |             dest[meta.count] = GetRegister(instr.gpr0.Value() + meta.count % 2); | ||||||
|         } else { |         } else { | ||||||
|             ASSERT(instr.texs.HasTwoDestinations()); |             ASSERT(instr.texs.HasTwoDestinations()); | ||||||
|             // Write the rest of the swizzle components to gpr28 and gpr28+1
 |             // Write the rest of the swizzle components to gpr28 and gpr28+1
 | ||||||
|             dest[written_components] = GetRegister(instr.gpr28.Value() + written_components % 2); |             dest[meta.count] = GetRegister(instr.gpr28.Value() + meta.count % 2); | ||||||
|  |         } | ||||||
|  |         ++meta.count; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|         ++written_components; |     std::generate(dest.begin() + meta.count, dest.end(), [&]() { return GetRegister(RZ); }); | ||||||
|     } |  | ||||||
| 
 |  | ||||||
|     std::generate(dest.begin() + written_components, dest.end(), [&]() { return GetRegister(RZ); }); |  | ||||||
| 
 | 
 | ||||||
|     bb.push_back(Operation(OperationCode::AssignComposite, meta, texture, dest[0], dest[1], dest[2], |     bb.push_back(Operation(OperationCode::AssignComposite, meta, texture, dest[0], dest[1], dest[2], | ||||||
|                            dest[3])); |                            dest[3])); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void ShaderIR::WriteTexsInstructionHalfFloat(BasicBlock& bb, Instruction instr, Node texture) { | ||||||
|  |     // TEXS.F16 destionation registers are packed in two registers in pairs (just like any half
 | ||||||
|  |     // float instruction).
 | ||||||
|  | 
 | ||||||
|  |     MetaComponents meta; | ||||||
|  |     for (u32 component = 0; component < 4; ++component) { | ||||||
|  |         if (!instr.texs.IsComponentEnabled(component)) | ||||||
|  |             continue; | ||||||
|  |         meta.components_map[meta.count++] = component; | ||||||
|  |     } | ||||||
|  |     if (meta.count == 0) | ||||||
|  |         return; | ||||||
|  | 
 | ||||||
|  |     bb.push_back(Operation(OperationCode::AssignCompositeHalf, meta, texture, | ||||||
|  |                            GetRegister(instr.gpr0), GetRegister(instr.gpr28))); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| Node ShaderIR::GetTextureCode(Instruction instr, TextureType texture_type, | Node ShaderIR::GetTextureCode(Instruction instr, TextureType texture_type, | ||||||
|                               TextureProcessMode process_mode, bool depth_compare, bool is_array, |                               TextureProcessMode process_mode, bool depth_compare, bool is_array, | ||||||
|                               std::size_t array_offset, std::size_t bias_offset, |                               std::size_t array_offset, std::size_t bias_offset, | ||||||
|  |  | ||||||
|  | @ -785,6 +785,31 @@ private: | ||||||
|         return {}; |         return {}; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     std::string AssignCompositeHalf(Operation operation) { | ||||||
|  |         const auto& meta = std::get<MetaComponents>(operation.GetMeta()); | ||||||
|  | 
 | ||||||
|  |         const std::string composite = code.GenerateTemporal(); | ||||||
|  |         code.AddLine("vec4 " + composite + " = " + Visit(operation[0]) + ';'); | ||||||
|  | 
 | ||||||
|  |         const auto ReadComponent = [&](u32 component) { | ||||||
|  |             if (component < meta.count) { | ||||||
|  |                 return composite + '[' + std::to_string(meta.GetSourceComponent(component)) + ']'; | ||||||
|  |             } | ||||||
|  |             return std::string("0"); | ||||||
|  |         }; | ||||||
|  | 
 | ||||||
|  |         const auto dst1 = std::get<GprNode>(*operation[1]).GetIndex(); | ||||||
|  |         const std::string src1 = "vec2(" + ReadComponent(0) + ", " + ReadComponent(1) + ')'; | ||||||
|  |         code.AddLine(GetRegister(dst1) + " = utof(packHalf2x16(" + src1 + "))"); | ||||||
|  | 
 | ||||||
|  |         if (meta.count > 2) { | ||||||
|  |             const auto dst2 = std::get<GprNode>(*operation[2]).GetIndex(); | ||||||
|  |             const std::string src2 = "vec2(" + ReadComponent(2) + ", " + ReadComponent(3) + ')'; | ||||||
|  |             code.AddLine(GetRegister(dst2) + " = utof(packHalf2x16(" + src2 + "))"); | ||||||
|  |         } | ||||||
|  |         return {}; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|     std::string Composite(Operation operation) { |     std::string Composite(Operation operation) { | ||||||
|         std::string value = "vec4("; |         std::string value = "vec4("; | ||||||
|         for (std::size_t i = 0; i < 4; ++i) { |         for (std::size_t i = 0; i < 4; ++i) { | ||||||
|  | @ -1302,6 +1327,7 @@ private: | ||||||
|     static constexpr OperationDecompilersArray operation_decompilers = { |     static constexpr OperationDecompilersArray operation_decompilers = { | ||||||
|         &GLSLDecompiler::Assign, |         &GLSLDecompiler::Assign, | ||||||
|         &GLSLDecompiler::AssignComposite, |         &GLSLDecompiler::AssignComposite, | ||||||
|  |         &GLSLDecompiler::AssignCompositeHalf, | ||||||
| 
 | 
 | ||||||
|         &GLSLDecompiler::Composite, |         &GLSLDecompiler::Composite, | ||||||
|         &GLSLDecompiler::Select, |         &GLSLDecompiler::Select, | ||||||
|  |  | ||||||
|  | @ -46,6 +46,7 @@ constexpr u32 RZ = 0xff; | ||||||
| enum class OperationCode { | enum class OperationCode { | ||||||
|     Assign,              /// (float& dest, float src) -> void
 |     Assign,              /// (float& dest, float src) -> void
 | ||||||
|     AssignComposite,     /// (MetaComponents, float4 src, float&[4] dst) -> void
 |     AssignComposite,     /// (MetaComponents, float4 src, float&[4] dst) -> void
 | ||||||
|  |     AssignCompositeHalf, /// (MetaComponents, float4 src, float&[2] dst) -> void
 | ||||||
| 
 | 
 | ||||||
|     Composite, /// (float[4] values) -> float4
 |     Composite, /// (float[4] values) -> float4
 | ||||||
|     Select,    /// (MetaArithmetic, bool pred, float a, float b) -> float
 |     Select,    /// (MetaArithmetic, bool pred, float a, float b) -> float
 | ||||||
|  | @ -279,6 +280,7 @@ struct MetaTexture { | ||||||
| 
 | 
 | ||||||
| struct MetaComponents { | struct MetaComponents { | ||||||
|     std::array<u32, 4> components_map{}; |     std::array<u32, 4> components_map{}; | ||||||
|  |     u32 count{}; | ||||||
| 
 | 
 | ||||||
|     u32 GetSourceComponent(u32 dest_index) const { |     u32 GetSourceComponent(u32 dest_index) const { | ||||||
|         return components_map[dest_index]; |         return components_map[dest_index]; | ||||||
|  | @ -692,6 +694,8 @@ private: | ||||||
|                               Tegra::Shader::TextureType type, bool is_array, bool is_shadow); |                               Tegra::Shader::TextureType type, bool is_array, bool is_shadow); | ||||||
| 
 | 
 | ||||||
|     void WriteTexsInstructionFloat(BasicBlock& bb, Tegra::Shader::Instruction instr, Node texture); |     void WriteTexsInstructionFloat(BasicBlock& bb, Tegra::Shader::Instruction instr, Node texture); | ||||||
|  |     void WriteTexsInstructionHalfFloat(BasicBlock& bb, Tegra::Shader::Instruction instr, | ||||||
|  |                                        Node texture); | ||||||
| 
 | 
 | ||||||
|     Node GetTexCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, |     Node GetTexCode(Tegra::Shader::Instruction instr, Tegra::Shader::TextureType texture_type, | ||||||
|                     Tegra::Shader::TextureProcessMode process_mode, bool depth_compare, |                     Tegra::Shader::TextureProcessMode process_mode, bool depth_compare, | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 ReinUsesLisp
						ReinUsesLisp