forked from eden-emu/eden
		
	Video_core: Address feedback
This commit is contained in:
		
							parent
							
								
									62fc8bfe16
								
							
						
					
					
						commit
						1fdf24a081
					
				
					 20 changed files with 348 additions and 172 deletions
				
			
		|  | @ -60,7 +60,7 @@ private: | ||||||
|     using ConstIteratorType = typename MapType::const_iterator; |     using ConstIteratorType = typename MapType::const_iterator; | ||||||
| 
 | 
 | ||||||
|     size_t ContinousSizeInternal(KeyT address) const { |     size_t ContinousSizeInternal(KeyT address) const { | ||||||
|         const auto it = GetFirstElemnentBeforeOrOn(address); |         const auto it = GetFirstElementBeforeOrOn(address); | ||||||
|         if (it == container.end() || it->second == null_value) { |         if (it == container.end() || it->second == null_value) { | ||||||
|             return 0; |             return 0; | ||||||
|         } |         } | ||||||
|  | @ -72,14 +72,14 @@ private: | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     ValueT GetValueInternal(KeyT address) const { |     ValueT GetValueInternal(KeyT address) const { | ||||||
|         const auto it = GetFirstElemnentBeforeOrOn(address); |         const auto it = GetFirstElementBeforeOrOn(address); | ||||||
|         if (it == container.end()) { |         if (it == container.end()) { | ||||||
|             return null_value; |             return null_value; | ||||||
|         } |         } | ||||||
|         return it->second; |         return it->second; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     ConstIteratorType GetFirstElemnentBeforeOrOn(KeyT address) const { |     ConstIteratorType GetFirstElementBeforeOrOn(KeyT address) const { | ||||||
|         auto it = container.lower_bound(address); |         auto it = container.lower_bound(address); | ||||||
|         if (it == container.begin()) { |         if (it == container.begin()) { | ||||||
|             return it; |             return it; | ||||||
|  |  | ||||||
|  | @ -137,6 +137,15 @@ void EmitGetAttribute(EmitContext& ctx, IR::Inst& inst, IR::Attribute attr, Scal | ||||||
|     case IR::Attribute::VertexId: |     case IR::Attribute::VertexId: | ||||||
|         ctx.Add("MOV.F {}.x,{}.id;", inst, ctx.attrib_name); |         ctx.Add("MOV.F {}.x,{}.id;", inst, ctx.attrib_name); | ||||||
|         break; |         break; | ||||||
|  |     case IR::Attribute::BaseInstance: | ||||||
|  |         ctx.Add("MOV.F {}.x,{}.baseInstance;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|  |     case IR::Attribute::BaseVertex: | ||||||
|  |         ctx.Add("MOV.F {}.x,{}.baseVertex;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         ctx.Add("MOV.F {}.x,{}.draw.id;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|     case IR::Attribute::FrontFace: |     case IR::Attribute::FrontFace: | ||||||
|         ctx.Add("CMP.F {}.x,{}.facing.x,0,-1;", inst, ctx.attrib_name); |         ctx.Add("CMP.F {}.x,{}.facing.x,0,-1;", inst, ctx.attrib_name); | ||||||
|         break; |         break; | ||||||
|  | @ -156,6 +165,15 @@ void EmitGetAttributeU32(EmitContext& ctx, IR::Inst& inst, IR::Attribute attr, S | ||||||
|     case IR::Attribute::VertexId: |     case IR::Attribute::VertexId: | ||||||
|         ctx.Add("MOV.S {}.x,{}.id;", inst, ctx.attrib_name); |         ctx.Add("MOV.S {}.x,{}.id;", inst, ctx.attrib_name); | ||||||
|         break; |         break; | ||||||
|  |     case IR::Attribute::BaseInstance: | ||||||
|  |         ctx.Add("MOV.S {}.x,{}.baseInstance;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|  |     case IR::Attribute::BaseVertex: | ||||||
|  |         ctx.Add("MOV.S {}.x,{}.baseVertex;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         ctx.Add("MOV.S {}.x,{}.draw.id;", inst, ctx.attrib_name); | ||||||
|  |         break; | ||||||
|     default: |     default: | ||||||
|         throw NotImplementedException("Get U32 attribute {}", attr); |         throw NotImplementedException("Get U32 attribute {}", attr); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | @ -240,6 +240,9 @@ void EmitGetAttribute(EmitContext& ctx, IR::Inst& inst, IR::Attribute attr, | ||||||
|     case IR::Attribute::BaseVertex: |     case IR::Attribute::BaseVertex: | ||||||
|         ctx.AddF32("{}=itof(gl_BaseVertex);", inst); |         ctx.AddF32("{}=itof(gl_BaseVertex);", inst); | ||||||
|         break; |         break; | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         ctx.AddF32("{}=itof(gl_DrawID);", inst); | ||||||
|  |         break; | ||||||
|     default: |     default: | ||||||
|         throw NotImplementedException("Get attribute {}", attr); |         throw NotImplementedException("Get attribute {}", attr); | ||||||
|     } |     } | ||||||
|  | @ -262,6 +265,9 @@ void EmitGetAttributeU32(EmitContext& ctx, IR::Inst& inst, IR::Attribute attr, s | ||||||
|     case IR::Attribute::BaseVertex: |     case IR::Attribute::BaseVertex: | ||||||
|         ctx.AddU32("{}=uint(gl_BaseVertex);", inst); |         ctx.AddU32("{}=uint(gl_BaseVertex);", inst); | ||||||
|         break; |         break; | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         ctx.AddU32("{}=uint(gl_DrawID);", inst); | ||||||
|  |         break; | ||||||
|     default: |     default: | ||||||
|         throw NotImplementedException("Get U32 attribute {}", attr); |         throw NotImplementedException("Get U32 attribute {}", attr); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | @ -343,6 +343,8 @@ Id EmitGetAttribute(EmitContext& ctx, IR::Attribute attr, Id vertex) { | ||||||
|         return ctx.OpBitcast(ctx.F32[1], ctx.OpLoad(ctx.U32[1], ctx.base_instance)); |         return ctx.OpBitcast(ctx.F32[1], ctx.OpLoad(ctx.U32[1], ctx.base_instance)); | ||||||
|     case IR::Attribute::BaseVertex: |     case IR::Attribute::BaseVertex: | ||||||
|         return ctx.OpBitcast(ctx.F32[1], ctx.OpLoad(ctx.U32[1], ctx.base_vertex)); |         return ctx.OpBitcast(ctx.F32[1], ctx.OpLoad(ctx.U32[1], ctx.base_vertex)); | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         return ctx.OpBitcast(ctx.F32[1], ctx.OpLoad(ctx.U32[1], ctx.draw_index)); | ||||||
|     case IR::Attribute::FrontFace: |     case IR::Attribute::FrontFace: | ||||||
|         return ctx.OpSelect(ctx.F32[1], ctx.OpLoad(ctx.U1, ctx.front_face), |         return ctx.OpSelect(ctx.F32[1], ctx.OpLoad(ctx.U1, ctx.front_face), | ||||||
|                             ctx.OpBitcast(ctx.F32[1], ctx.Const(std::numeric_limits<u32>::max())), |                             ctx.OpBitcast(ctx.F32[1], ctx.Const(std::numeric_limits<u32>::max())), | ||||||
|  | @ -388,6 +390,8 @@ Id EmitGetAttributeU32(EmitContext& ctx, IR::Attribute attr, Id) { | ||||||
|         return ctx.OpLoad(ctx.U32[1], ctx.base_instance); |         return ctx.OpLoad(ctx.U32[1], ctx.base_instance); | ||||||
|     case IR::Attribute::BaseVertex: |     case IR::Attribute::BaseVertex: | ||||||
|         return ctx.OpLoad(ctx.U32[1], ctx.base_vertex); |         return ctx.OpLoad(ctx.U32[1], ctx.base_vertex); | ||||||
|  |     case IR::Attribute::DrawID: | ||||||
|  |         return ctx.OpLoad(ctx.U32[1], ctx.draw_index); | ||||||
|     default: |     default: | ||||||
|         throw NotImplementedException("Read U32 attribute {}", attr); |         throw NotImplementedException("Read U32 attribute {}", attr); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | @ -1402,6 +1402,9 @@ void EmitContext::DefineInputs(const IR::Program& program) { | ||||||
|     } else if (loads[IR::Attribute::BaseVertex]) { |     } else if (loads[IR::Attribute::BaseVertex]) { | ||||||
|         base_vertex = DefineInput(*this, U32[1], true, spv::BuiltIn::BaseVertex); |         base_vertex = DefineInput(*this, U32[1], true, spv::BuiltIn::BaseVertex); | ||||||
|     } |     } | ||||||
|  |     if (loads[IR::Attribute::DrawID]) { | ||||||
|  |         draw_index = DefineInput(*this, U32[1], true, spv::BuiltIn::DrawIndex); | ||||||
|  |     } | ||||||
|     if (loads[IR::Attribute::FrontFace]) { |     if (loads[IR::Attribute::FrontFace]) { | ||||||
|         front_face = DefineInput(*this, U1, true, spv::BuiltIn::FrontFacing); |         front_face = DefineInput(*this, U1, true, spv::BuiltIn::FrontFacing); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | @ -218,6 +218,7 @@ public: | ||||||
|     Id base_instance{}; |     Id base_instance{}; | ||||||
|     Id vertex_id{}; |     Id vertex_id{}; | ||||||
|     Id vertex_index{}; |     Id vertex_index{}; | ||||||
|  |     Id draw_index{}; | ||||||
|     Id base_vertex{}; |     Id base_vertex{}; | ||||||
|     Id front_face{}; |     Id front_face{}; | ||||||
|     Id point_coord{}; |     Id point_coord{}; | ||||||
|  |  | ||||||
|  | @ -450,6 +450,8 @@ std::string NameOf(Attribute attribute) { | ||||||
|         return "BaseInstance"; |         return "BaseInstance"; | ||||||
|     case Attribute::BaseVertex: |     case Attribute::BaseVertex: | ||||||
|         return "BaseVertex"; |         return "BaseVertex"; | ||||||
|  |     case Attribute::DrawID: | ||||||
|  |         return "DrawID"; | ||||||
|     } |     } | ||||||
|     return fmt::format("<reserved attribute {}>", static_cast<int>(attribute)); |     return fmt::format("<reserved attribute {}>", static_cast<int>(attribute)); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -223,6 +223,7 @@ enum class Attribute : u64 { | ||||||
|     // Implementation attributes
 |     // Implementation attributes
 | ||||||
|     BaseInstance = 256, |     BaseInstance = 256, | ||||||
|     BaseVertex = 257, |     BaseVertex = 257, | ||||||
|  |     DrawID = 258, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| constexpr size_t NUM_GENERICS = 32; | constexpr size_t NUM_GENERICS = 32; | ||||||
|  |  | ||||||
|  | @ -518,6 +518,7 @@ void FoldBitCast(IR::Inst& inst, IR::Opcode reverse) { | ||||||
|             case IR::Attribute::VertexId: |             case IR::Attribute::VertexId: | ||||||
|             case IR::Attribute::BaseVertex: |             case IR::Attribute::BaseVertex: | ||||||
|             case IR::Attribute::BaseInstance: |             case IR::Attribute::BaseInstance: | ||||||
|  |             case IR::Attribute::DrawID: | ||||||
|                 break; |                 break; | ||||||
|             default: |             default: | ||||||
|                 return; |                 return; | ||||||
|  | @ -665,6 +666,8 @@ void FoldConstBuffer(Environment& env, IR::Block& block, IR::Inst& inst) { | ||||||
|             return IR::Attribute::BaseInstance; |             return IR::Attribute::BaseInstance; | ||||||
|         case ReplaceConstant::BaseVertex: |         case ReplaceConstant::BaseVertex: | ||||||
|             return IR::Attribute::BaseVertex; |             return IR::Attribute::BaseVertex; | ||||||
|  |         case ReplaceConstant::DrawID: | ||||||
|  |             return IR::Attribute::DrawID; | ||||||
|         default: |         default: | ||||||
|             throw NotImplementedException("Not implemented replacement variable {}", *replacement); |             throw NotImplementedException("Not implemented replacement variable {}", *replacement); | ||||||
|         } |         } | ||||||
|  |  | ||||||
|  | @ -19,6 +19,7 @@ namespace Shader { | ||||||
| enum class ReplaceConstant : u32 { | enum class ReplaceConstant : u32 { | ||||||
|     BaseInstance, |     BaseInstance, | ||||||
|     BaseVertex, |     BaseVertex, | ||||||
|  |     DrawID, | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| enum class TextureType : u32 { | enum class TextureType : u32 { | ||||||
|  |  | ||||||
|  | @ -94,7 +94,7 @@ void DrawManager::DrawIndex(PrimitiveTopology topology, u32 index_first, u32 ind | ||||||
| void DrawManager::DrawArrayIndirect(PrimitiveTopology topology) { | void DrawManager::DrawArrayIndirect(PrimitiveTopology topology) { | ||||||
|     draw_state.topology = topology; |     draw_state.topology = topology; | ||||||
| 
 | 
 | ||||||
|     ProcessDrawIndirect(true); |     ProcessDrawIndirect(); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void DrawManager::DrawIndexedIndirect(PrimitiveTopology topology, u32 index_first, | void DrawManager::DrawIndexedIndirect(PrimitiveTopology topology, u32 index_first, | ||||||
|  | @ -105,7 +105,7 @@ void DrawManager::DrawIndexedIndirect(PrimitiveTopology topology, u32 index_firs | ||||||
|     draw_state.index_buffer.first = index_first; |     draw_state.index_buffer.first = index_first; | ||||||
|     draw_state.index_buffer.count = index_count; |     draw_state.index_buffer.count = index_count; | ||||||
| 
 | 
 | ||||||
|     ProcessDrawIndirect(true); |     ProcessDrawIndirect(); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void DrawManager::SetInlineIndexBuffer(u32 index) { | void DrawManager::SetInlineIndexBuffer(u32 index) { | ||||||
|  | @ -216,9 +216,12 @@ void DrawManager::ProcessDraw(bool draw_indexed, u32 instance_count) { | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void DrawManager::ProcessDrawIndirect(bool draw_indexed) { | void DrawManager::ProcessDrawIndirect() { | ||||||
|     LOG_TRACE(HW_GPU, "called, topology={}, count={}", draw_state.topology, |     LOG_TRACE( | ||||||
|               draw_indexed ? draw_state.index_buffer.count : draw_state.vertex_buffer.count); |         HW_GPU, | ||||||
|  |         "called, topology={}, is_indexed={}, includes_count={}, buffer_size={}, max_draw_count={}", | ||||||
|  |         draw_state.topology, indirect_state.is_indexed, indirect_state.include_count, | ||||||
|  |         indirect_state.buffer_size, indirect_state.max_draw_counts); | ||||||
| 
 | 
 | ||||||
|     UpdateTopology(); |     UpdateTopology(); | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -85,7 +85,7 @@ private: | ||||||
| 
 | 
 | ||||||
|     void ProcessDraw(bool draw_indexed, u32 instance_count); |     void ProcessDraw(bool draw_indexed, u32 instance_count); | ||||||
| 
 | 
 | ||||||
|     void ProcessDrawIndirect(bool draw_indexed); |     void ProcessDrawIndirect(); | ||||||
| 
 | 
 | ||||||
|     Maxwell3D* maxwell3d{}; |     Maxwell3D* maxwell3d{}; | ||||||
|     State draw_state{}; |     State draw_state{}; | ||||||
|  |  | ||||||
|  | @ -220,9 +220,6 @@ void Maxwell3D::ProcessMacro(u32 method, const u32* base_start, u32 amount, bool | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void Maxwell3D::RefreshParametersImpl() { | void Maxwell3D::RefreshParametersImpl() { | ||||||
|     if (!Settings::IsGPULevelHigh()) { |  | ||||||
|         return; |  | ||||||
|     } |  | ||||||
|     size_t current_index = 0; |     size_t current_index = 0; | ||||||
|     for (auto& segment : macro_segments) { |     for (auto& segment : macro_segments) { | ||||||
|         if (segment.first == 0) { |         if (segment.first == 0) { | ||||||
|  | @ -448,9 +445,11 @@ void Maxwell3D::CallMultiMethod(u32 method, const u32* base_start, u32 amount, | ||||||
|     case MAXWELL3D_REG_INDEX(const_buffer.buffer) + 15: |     case MAXWELL3D_REG_INDEX(const_buffer.buffer) + 15: | ||||||
|         ProcessCBMultiData(base_start, amount); |         ProcessCBMultiData(base_start, amount); | ||||||
|         break; |         break; | ||||||
|     case MAXWELL3D_REG_INDEX(inline_data): |     case MAXWELL3D_REG_INDEX(inline_data): { | ||||||
|  |         ASSERT(methods_pending == amount); | ||||||
|         upload_state.ProcessData(base_start, amount); |         upload_state.ProcessData(base_start, amount); | ||||||
|         return; |         return; | ||||||
|  |     } | ||||||
|     default: |     default: | ||||||
|         for (u32 i = 0; i < amount; i++) { |         for (u32 i = 0; i < amount; i++) { | ||||||
|             CallMethod(method, base_start[i], methods_pending - i <= 1); |             CallMethod(method, base_start[i], methods_pending - i <= 1); | ||||||
|  | @ -537,7 +536,7 @@ void Maxwell3D::ProcessQueryGet() { | ||||||
| void Maxwell3D::ProcessQueryCondition() { | void Maxwell3D::ProcessQueryCondition() { | ||||||
|     const GPUVAddr condition_address{regs.render_enable.Address()}; |     const GPUVAddr condition_address{regs.render_enable.Address()}; | ||||||
|     switch (regs.render_enable_override) { |     switch (regs.render_enable_override) { | ||||||
|     case Regs::RenderEnable::Override::AlwaysRender: { |     case Regs::RenderEnable::Override::AlwaysRender: | ||||||
|         execute_on = true; |         execute_on = true; | ||||||
|         break; |         break; | ||||||
|     case Regs::RenderEnable::Override::NeverRender: |     case Regs::RenderEnable::Override::NeverRender: | ||||||
|  | @ -586,7 +585,6 @@ void Maxwell3D::ProcessQueryCondition() { | ||||||
|         break; |         break; | ||||||
|     } |     } | ||||||
|     } |     } | ||||||
|     } |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void Maxwell3D::ProcessCounterReset() { | void Maxwell3D::ProcessCounterReset() { | ||||||
|  | @ -685,7 +683,8 @@ u32 Maxwell3D::GetRegisterValue(u32 method) const { | ||||||
|     return regs.reg_array[method]; |     return regs.reg_array[method]; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void Maxwell3D::setHLEReplacementName(u32 bank, u32 offset, HLEReplaceName name) { | void Maxwell3D::SetHLEReplacementAttributeType(u32 bank, u32 offset, | ||||||
|  |                                                HLEReplacementAttributeType name) { | ||||||
|     const u64 key = (static_cast<u64>(bank) << 32) | offset; |     const u64 key = (static_cast<u64>(bank) << 32) | offset; | ||||||
|     replace_table.emplace(key, name); |     replace_table.emplace(key, name); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -1218,12 +1218,12 @@ public: | ||||||
| 
 | 
 | ||||||
|         struct Window { |         struct Window { | ||||||
|             union { |             union { | ||||||
|                 u32 raw_1; |                 u32 raw_x; | ||||||
|                 BitField<0, 16, u32> x_min; |                 BitField<0, 16, u32> x_min; | ||||||
|                 BitField<16, 16, u32> x_max; |                 BitField<16, 16, u32> x_max; | ||||||
|             }; |             }; | ||||||
|             union { |             union { | ||||||
|                 u32 raw_2; |                 u32 raw_y; | ||||||
|                 BitField<0, 16, u32> y_min; |                 BitField<0, 16, u32> y_min; | ||||||
|                 BitField<16, 16, u32> y_max; |                 BitField<16, 16, u32> y_max; | ||||||
|             }; |             }; | ||||||
|  | @ -3031,14 +3031,15 @@ public: | ||||||
| 
 | 
 | ||||||
|     EngineHint engine_state{EngineHint::None}; |     EngineHint engine_state{EngineHint::None}; | ||||||
| 
 | 
 | ||||||
|     enum class HLEReplaceName : u32 { |     enum class HLEReplacementAttributeType : u32 { | ||||||
|         BaseVertex = 0x0, |         BaseVertex = 0x0, | ||||||
|         BaseInstance = 0x1, |         BaseInstance = 0x1, | ||||||
|  |         DrawID = 0x2, | ||||||
|     }; |     }; | ||||||
| 
 | 
 | ||||||
|     void setHLEReplacementName(u32 bank, u32 offset, HLEReplaceName name); |     void SetHLEReplacementAttributeType(u32 bank, u32 offset, HLEReplacementAttributeType name); | ||||||
| 
 | 
 | ||||||
|     std::unordered_map<u64, HLEReplaceName> replace_table; |     std::unordered_map<u64, HLEReplacementAttributeType> replace_table; | ||||||
| 
 | 
 | ||||||
|     static_assert(sizeof(Regs) == Regs::NUM_REGS * sizeof(u32), "Maxwell3D Regs has wrong size"); |     static_assert(sizeof(Regs) == Regs::NUM_REGS * sizeof(u32), "Maxwell3D Regs has wrong size"); | ||||||
|     static_assert(std::is_trivially_copyable_v<Regs>, "Maxwell3D Regs must be trivially copyable"); |     static_assert(std::is_trivially_copyable_v<Regs>, "Maxwell3D Regs must be trivially copyable"); | ||||||
|  | @ -3087,9 +3088,7 @@ public: | ||||||
|     std::unique_ptr<DrawManager> draw_manager; |     std::unique_ptr<DrawManager> draw_manager; | ||||||
|     friend class DrawManager; |     friend class DrawManager; | ||||||
| 
 | 
 | ||||||
|     std::vector<u8> inline_index_draw_indexes; |     GPUVAddr GetMacroAddress(size_t index) const { | ||||||
| 
 |  | ||||||
|     GPUVAddr getMacroAddress(size_t index) const { |  | ||||||
|         return macro_addresses[index]; |         return macro_addresses[index]; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  | @ -3100,7 +3099,7 @@ public: | ||||||
|         RefreshParametersImpl(); |         RefreshParametersImpl(); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     bool AnyParametersDirty() { |     bool AnyParametersDirty() const { | ||||||
|         return current_macro_dirty; |         return current_macro_dirty; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  | @ -3114,6 +3113,10 @@ public: | ||||||
|     /// Handles a write to the CB_BIND register.
 |     /// Handles a write to the CB_BIND register.
 | ||||||
|     void ProcessCBBind(size_t stage_index); |     void ProcessCBBind(size_t stage_index); | ||||||
| 
 | 
 | ||||||
|  |     /// Handles a write to the CB_DATA[i] register.
 | ||||||
|  |     void ProcessCBData(u32 value); | ||||||
|  |     void ProcessCBMultiData(const u32* start_base, u32 amount); | ||||||
|  | 
 | ||||||
| private: | private: | ||||||
|     void InitializeRegisterDefaults(); |     void InitializeRegisterDefaults(); | ||||||
| 
 | 
 | ||||||
|  | @ -3165,10 +3168,6 @@ private: | ||||||
|     /// Handles writes to syncing register.
 |     /// Handles writes to syncing register.
 | ||||||
|     void ProcessSyncPoint(); |     void ProcessSyncPoint(); | ||||||
| 
 | 
 | ||||||
|     /// Handles a write to the CB_DATA[i] register.
 |  | ||||||
|     void ProcessCBData(u32 value); |  | ||||||
|     void ProcessCBMultiData(const u32* start_base, u32 amount); |  | ||||||
| 
 |  | ||||||
|     /// Returns a query's value or an empty object if the value will be deferred through a cache.
 |     /// Returns a query's value or an empty object if the value will be deferred through a cache.
 | ||||||
|     std::optional<u64> GetQueryResult(); |     std::optional<u64> GetQueryResult(); | ||||||
| 
 | 
 | ||||||
|  | @ -3196,11 +3195,6 @@ private: | ||||||
| 
 | 
 | ||||||
|     bool execute_on{true}; |     bool execute_on{true}; | ||||||
| 
 | 
 | ||||||
|     std::array<bool, Regs::NUM_REGS> draw_command{}; |  | ||||||
|     std::vector<u32> deferred_draw_method; |  | ||||||
|     enum class DrawMode : u32 { General = 0, Instance, InlineIndex }; |  | ||||||
|     DrawMode draw_mode{DrawMode::General}; |  | ||||||
|     bool draw_indexed{}; |  | ||||||
|     std::vector<std::pair<GPUVAddr, size_t>> macro_segments; |     std::vector<std::pair<GPUVAddr, size_t>> macro_segments; | ||||||
|     std::vector<GPUVAddr> macro_addresses; |     std::vector<GPUVAddr> macro_addresses; | ||||||
|     bool current_macro_dirty{}; |     bool current_macro_dirty{}; | ||||||
|  |  | ||||||
|  | @ -23,7 +23,7 @@ | ||||||
| #include "video_core/macro/macro_jit_x64.h" | #include "video_core/macro/macro_jit_x64.h" | ||||||
| #endif | #endif | ||||||
| 
 | 
 | ||||||
| MICROPROFILE_DEFINE(MacroHLE, "GPU", "Execute macro hle", MP_RGB(128, 192, 192)); | MICROPROFILE_DEFINE(MacroHLE, "GPU", "Execute macro HLE", MP_RGB(128, 192, 192)); | ||||||
| 
 | 
 | ||||||
| namespace Tegra { | namespace Tegra { | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -1,5 +1,5 @@ | ||||||
| // SPDX-FileCopyrightText: Copyright 2020 yuzu Emulator Project
 | // SPDX-FileCopyrightText: Copyright 2023 yuzu Emulator Project
 | ||||||
| // SPDX-License-Identifier: GPL-2.0-or-later
 | // SPDX-License-Identifier: GPL-3.0-or-later
 | ||||||
| 
 | 
 | ||||||
| #include <array> | #include <array> | ||||||
| #include <vector> | #include <vector> | ||||||
|  | @ -15,28 +15,28 @@ | ||||||
| 
 | 
 | ||||||
| namespace Tegra { | namespace Tegra { | ||||||
| 
 | 
 | ||||||
| using Maxwell = Engines::Maxwell3D; | using Maxwell3D = Engines::Maxwell3D; | ||||||
| 
 | 
 | ||||||
| namespace { | namespace { | ||||||
| 
 | 
 | ||||||
| bool IsTopologySafe(Maxwell::Regs::PrimitiveTopology topology) { | bool IsTopologySafe(Maxwell3D::Regs::PrimitiveTopology topology) { | ||||||
|     switch (topology) { |     switch (topology) { | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Points: |     case Maxwell3D::Regs::PrimitiveTopology::Points: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Lines: |     case Maxwell3D::Regs::PrimitiveTopology::Lines: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::LineLoop: |     case Maxwell3D::Regs::PrimitiveTopology::LineLoop: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::LineStrip: |     case Maxwell3D::Regs::PrimitiveTopology::LineStrip: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Triangles: |     case Maxwell3D::Regs::PrimitiveTopology::Triangles: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::TriangleStrip: |     case Maxwell3D::Regs::PrimitiveTopology::TriangleStrip: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::TriangleFan: |     case Maxwell3D::Regs::PrimitiveTopology::TriangleFan: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::LinesAdjacency: |     case Maxwell3D::Regs::PrimitiveTopology::LinesAdjacency: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::LineStripAdjacency: |     case Maxwell3D::Regs::PrimitiveTopology::LineStripAdjacency: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::TrianglesAdjacency: |     case Maxwell3D::Regs::PrimitiveTopology::TrianglesAdjacency: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::TriangleStripAdjacency: |     case Maxwell3D::Regs::PrimitiveTopology::TriangleStripAdjacency: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Patches: |     case Maxwell3D::Regs::PrimitiveTopology::Patches: | ||||||
|         return true; |         return true; | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Quads: |     case Maxwell3D::Regs::PrimitiveTopology::Quads: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::QuadStrip: |     case Maxwell3D::Regs::PrimitiveTopology::QuadStrip: | ||||||
|     case Maxwell::Regs::PrimitiveTopology::Polygon: |     case Maxwell3D::Regs::PrimitiveTopology::Polygon: | ||||||
|     default: |     default: | ||||||
|         return false; |         return false; | ||||||
|     } |     } | ||||||
|  | @ -44,34 +44,55 @@ bool IsTopologySafe(Maxwell::Regs::PrimitiveTopology topology) { | ||||||
| 
 | 
 | ||||||
| class HLEMacroImpl : public CachedMacro { | class HLEMacroImpl : public CachedMacro { | ||||||
| public: | public: | ||||||
|     explicit HLEMacroImpl(Engines::Maxwell3D& maxwell3d_) : maxwell3d{maxwell3d_} {} |     explicit HLEMacroImpl(Maxwell3D& maxwell3d_) : maxwell3d{maxwell3d_} {} | ||||||
| 
 | 
 | ||||||
| protected: | protected: | ||||||
|     Engines::Maxwell3D& maxwell3d; |     Maxwell3D& maxwell3d; | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| class HLE_771BB18C62444DA0 final : public HLEMacroImpl { | class HLE_DrawArrays final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_771BB18C62444DA0(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_DrawArrays(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|         const u32 instance_count = parameters[2] & maxwell3d.GetRegisterValue(0xD1B); | 
 | ||||||
|         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |         auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[0]); | ||||||
|         maxwell3d.draw_manager->DrawIndex( |         maxwell3d.draw_manager->DrawArray(topology, parameters[1], parameters[2], | ||||||
|             static_cast<Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology>(parameters[0] & |                                           maxwell3d.regs.global_base_instance_index, 1); | ||||||
|                                                                             0x3ffffff), |  | ||||||
|             parameters[4], parameters[1], parameters[3], parameters[5], instance_count); |  | ||||||
|     } |     } | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| class HLE_DrawArraysIndirect final : public HLEMacroImpl { | class HLE_DrawIndexed final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_DrawArraysIndirect(Engines::Maxwell3D& maxwell3d_, bool extended_ = false) |     explicit HLE_DrawIndexed(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|         : HLEMacroImpl(maxwell3d_), extended(extended_) {} |  | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         auto topology = static_cast<Maxwell::Regs::PrimitiveTopology>(parameters[0]); |         maxwell3d.RefreshParameters(); | ||||||
|  |         maxwell3d.regs.index_buffer.start_addr_high = parameters[1]; | ||||||
|  |         maxwell3d.regs.index_buffer.start_addr_low = parameters[2]; | ||||||
|  |         maxwell3d.regs.index_buffer.format = | ||||||
|  |             static_cast<Engines::Maxwell3D::Regs::IndexFormat>(parameters[3]); | ||||||
|  |         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|  | 
 | ||||||
|  |         auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[0]); | ||||||
|  |         maxwell3d.draw_manager->DrawIndex(topology, 0, parameters[4], | ||||||
|  |                                           maxwell3d.regs.global_base_vertex_index, | ||||||
|  |                                           maxwell3d.regs.global_base_instance_index, 1); | ||||||
|  |     } | ||||||
|  | }; | ||||||
|  | 
 | ||||||
|  | /*
 | ||||||
|  |  * @note: these macros have two versions, a normal and extended version, with the extended version | ||||||
|  |  * also assigning the base vertex/instance. | ||||||
|  |  */ | ||||||
|  | template <bool extended> | ||||||
|  | class HLE_DrawArraysIndirect final : public HLEMacroImpl { | ||||||
|  | public: | ||||||
|  |     explicit HLE_DrawArraysIndirect(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|  | 
 | ||||||
|  |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|  |         auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[0]); | ||||||
|         if (!maxwell3d.AnyParametersDirty() || !IsTopologySafe(topology)) { |         if (!maxwell3d.AnyParametersDirty() || !IsTopologySafe(topology)) { | ||||||
|             Fallback(parameters); |             Fallback(parameters); | ||||||
|             return; |             return; | ||||||
|  | @ -81,20 +102,21 @@ public: | ||||||
|         params.is_indexed = false; |         params.is_indexed = false; | ||||||
|         params.include_count = false; |         params.include_count = false; | ||||||
|         params.count_start_address = 0; |         params.count_start_address = 0; | ||||||
|         params.indirect_start_address = maxwell3d.getMacroAddress(1); |         params.indirect_start_address = maxwell3d.GetMacroAddress(1); | ||||||
|         params.buffer_size = 4 * sizeof(u32); |         params.buffer_size = 4 * sizeof(u32); | ||||||
|         params.max_draw_counts = 1; |         params.max_draw_counts = 1; | ||||||
|         params.stride = 0; |         params.stride = 0; | ||||||
| 
 | 
 | ||||||
|         if (extended) { |         if constexpr (extended) { | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |             maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|             maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseInstance); |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|         } |         } | ||||||
| 
 | 
 | ||||||
|         maxwell3d.draw_manager->DrawArrayIndirect(topology); |         maxwell3d.draw_manager->DrawArrayIndirect(topology); | ||||||
| 
 | 
 | ||||||
|         if (extended) { |         if constexpr (extended) { | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::None; |             maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|             maxwell3d.replace_table.clear(); |             maxwell3d.replace_table.clear(); | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|  | @ -103,14 +125,14 @@ private: | ||||||
|     void Fallback(const std::vector<u32>& parameters) { |     void Fallback(const std::vector<u32>& parameters) { | ||||||
|         SCOPE_EXIT({ |         SCOPE_EXIT({ | ||||||
|             if (extended) { |             if (extended) { | ||||||
|                 maxwell3d.engine_state = Maxwell::EngineHint::None; |                 maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|                 maxwell3d.replace_table.clear(); |                 maxwell3d.replace_table.clear(); | ||||||
|             } |             } | ||||||
|         }); |         }); | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|         const u32 instance_count = (maxwell3d.GetRegisterValue(0xD1B) & parameters[2]); |         const u32 instance_count = (maxwell3d.GetRegisterValue(0xD1B) & parameters[2]); | ||||||
| 
 | 
 | ||||||
|         auto topology = static_cast<Maxwell::Regs::PrimitiveTopology>(parameters[0]); |         auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[0]); | ||||||
|         const u32 vertex_first = parameters[3]; |         const u32 vertex_first = parameters[3]; | ||||||
|         const u32 vertex_count = parameters[1]; |         const u32 vertex_count = parameters[1]; | ||||||
| 
 | 
 | ||||||
|  | @ -122,31 +144,35 @@ private: | ||||||
|         } |         } | ||||||
| 
 | 
 | ||||||
|         const u32 base_instance = parameters[4]; |         const u32 base_instance = parameters[4]; | ||||||
|         if (extended) { |         if constexpr (extended) { | ||||||
|             maxwell3d.regs.global_base_instance_index = base_instance; |             maxwell3d.regs.global_base_instance_index = base_instance; | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |             maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|             maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseInstance); |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|         } |         } | ||||||
| 
 | 
 | ||||||
|         maxwell3d.draw_manager->DrawArray(topology, vertex_first, vertex_count, base_instance, |         maxwell3d.draw_manager->DrawArray(topology, vertex_first, vertex_count, base_instance, | ||||||
|                                           instance_count); |                                           instance_count); | ||||||
| 
 | 
 | ||||||
|         if (extended) { |         if constexpr (extended) { | ||||||
|             maxwell3d.regs.global_base_instance_index = 0; |             maxwell3d.regs.global_base_instance_index = 0; | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::None; |             maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|             maxwell3d.replace_table.clear(); |             maxwell3d.replace_table.clear(); | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
| 
 |  | ||||||
|     bool extended; |  | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
|  | /*
 | ||||||
|  |  * @note: these macros have two versions, a normal and extended version, with the extended version | ||||||
|  |  * also assigning the base vertex/instance. | ||||||
|  |  */ | ||||||
|  | template <bool extended> | ||||||
| class HLE_DrawIndexedIndirect final : public HLEMacroImpl { | class HLE_DrawIndexedIndirect final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_DrawIndexedIndirect(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_DrawIndexedIndirect(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         auto topology = static_cast<Maxwell::Regs::PrimitiveTopology>(parameters[0]); |         auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[0]); | ||||||
|         if (!maxwell3d.AnyParametersDirty() || !IsTopologySafe(topology)) { |         if (!maxwell3d.AnyParametersDirty() || !IsTopologySafe(topology)) { | ||||||
|             Fallback(parameters); |             Fallback(parameters); | ||||||
|             return; |             return; | ||||||
|  | @ -159,24 +185,30 @@ public: | ||||||
|         maxwell3d.regs.global_base_vertex_index = element_base; |         maxwell3d.regs.global_base_vertex_index = element_base; | ||||||
|         maxwell3d.regs.global_base_instance_index = base_instance; |         maxwell3d.regs.global_base_instance_index = base_instance; | ||||||
|         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |         if constexpr (extended) { | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseVertex); |             maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x644, Maxwell::HLEReplaceName::BaseInstance); |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseVertex); | ||||||
|  |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x644, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|  |         } | ||||||
|         auto& params = maxwell3d.draw_manager->GetIndirectParams(); |         auto& params = maxwell3d.draw_manager->GetIndirectParams(); | ||||||
|         params.is_indexed = true; |         params.is_indexed = true; | ||||||
|         params.include_count = false; |         params.include_count = false; | ||||||
|         params.count_start_address = 0; |         params.count_start_address = 0; | ||||||
|         params.indirect_start_address = maxwell3d.getMacroAddress(1); |         params.indirect_start_address = maxwell3d.GetMacroAddress(1); | ||||||
|         params.buffer_size = 5 * sizeof(u32); |         params.buffer_size = 5 * sizeof(u32); | ||||||
|         params.max_draw_counts = 1; |         params.max_draw_counts = 1; | ||||||
|         params.stride = 0; |         params.stride = 0; | ||||||
|         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|         maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, estimate); |         maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, estimate); | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::None; |  | ||||||
|         maxwell3d.replace_table.clear(); |  | ||||||
|         maxwell3d.regs.vertex_id_base = 0x0; |         maxwell3d.regs.vertex_id_base = 0x0; | ||||||
|         maxwell3d.regs.global_base_vertex_index = 0x0; |         maxwell3d.regs.global_base_vertex_index = 0x0; | ||||||
|         maxwell3d.regs.global_base_instance_index = 0x0; |         maxwell3d.regs.global_base_instance_index = 0x0; | ||||||
|  |         if constexpr (extended) { | ||||||
|  |             maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|  |             maxwell3d.replace_table.clear(); | ||||||
|  |         } | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
| private: | private: | ||||||
|  | @ -189,31 +221,37 @@ private: | ||||||
|         maxwell3d.regs.global_base_vertex_index = element_base; |         maxwell3d.regs.global_base_vertex_index = element_base; | ||||||
|         maxwell3d.regs.global_base_instance_index = base_instance; |         maxwell3d.regs.global_base_instance_index = base_instance; | ||||||
|         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |         if constexpr (extended) { | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseVertex); |             maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x644, Maxwell::HLEReplaceName::BaseInstance); |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseVertex); | ||||||
|  |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x644, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|  |         } | ||||||
| 
 | 
 | ||||||
|         maxwell3d.draw_manager->DrawIndex( |         maxwell3d.draw_manager->DrawIndex( | ||||||
|             static_cast<Tegra::Engines::Maxwell3D::Regs::PrimitiveTopology>(parameters[0]), |             static_cast<Tegra::Maxwell3D::Regs::PrimitiveTopology>(parameters[0]), parameters[3], | ||||||
|             parameters[3], parameters[1], element_base, base_instance, instance_count); |             parameters[1], element_base, base_instance, instance_count); | ||||||
| 
 | 
 | ||||||
|         maxwell3d.regs.vertex_id_base = 0x0; |         maxwell3d.regs.vertex_id_base = 0x0; | ||||||
|         maxwell3d.regs.global_base_vertex_index = 0x0; |         maxwell3d.regs.global_base_vertex_index = 0x0; | ||||||
|         maxwell3d.regs.global_base_instance_index = 0x0; |         maxwell3d.regs.global_base_instance_index = 0x0; | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::None; |         if constexpr (extended) { | ||||||
|         maxwell3d.replace_table.clear(); |             maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|  |             maxwell3d.replace_table.clear(); | ||||||
|  |         } | ||||||
|     } |     } | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| class HLE_MultiLayerClear final : public HLEMacroImpl { | class HLE_MultiLayerClear final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_MultiLayerClear(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_MultiLayerClear(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|         ASSERT(parameters.size() == 1); |         ASSERT(parameters.size() == 1); | ||||||
| 
 | 
 | ||||||
|         const Engines::Maxwell3D::Regs::ClearSurface clear_params{parameters[0]}; |         const Maxwell3D::Regs::ClearSurface clear_params{parameters[0]}; | ||||||
|         const u32 rt_index = clear_params.RT; |         const u32 rt_index = clear_params.RT; | ||||||
|         const u32 num_layers = maxwell3d.regs.rt[rt_index].depth; |         const u32 num_layers = maxwell3d.regs.rt[rt_index].depth; | ||||||
|         ASSERT(clear_params.layer == 0); |         ASSERT(clear_params.layer == 0); | ||||||
|  | @ -225,11 +263,10 @@ public: | ||||||
| 
 | 
 | ||||||
| class HLE_MultiDrawIndexedIndirectCount final : public HLEMacroImpl { | class HLE_MultiDrawIndexedIndirectCount final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_MultiDrawIndexedIndirectCount(Engines::Maxwell3D& maxwell3d_) |     explicit HLE_MultiDrawIndexedIndirectCount(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|         : HLEMacroImpl(maxwell3d_) {} |  | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         const auto topology = static_cast<Maxwell::Regs::PrimitiveTopology>(parameters[2]); |         const auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[2]); | ||||||
|         if (!IsTopologySafe(topology)) { |         if (!IsTopologySafe(topology)) { | ||||||
|             Fallback(parameters); |             Fallback(parameters); | ||||||
|             return; |             return; | ||||||
|  | @ -253,27 +290,30 @@ public: | ||||||
|         auto& params = maxwell3d.draw_manager->GetIndirectParams(); |         auto& params = maxwell3d.draw_manager->GetIndirectParams(); | ||||||
|         params.is_indexed = true; |         params.is_indexed = true; | ||||||
|         params.include_count = true; |         params.include_count = true; | ||||||
|         params.count_start_address = maxwell3d.getMacroAddress(4); |         params.count_start_address = maxwell3d.GetMacroAddress(4); | ||||||
|         params.indirect_start_address = maxwell3d.getMacroAddress(5); |         params.indirect_start_address = maxwell3d.GetMacroAddress(5); | ||||||
|         params.buffer_size = stride * draw_count; |         params.buffer_size = stride * draw_count; | ||||||
|         params.max_draw_counts = draw_count; |         params.max_draw_counts = draw_count; | ||||||
|         params.stride = stride; |         params.stride = stride; | ||||||
|         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |         maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |         maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseVertex); |         maxwell3d.SetHLEReplacementAttributeType( | ||||||
|         maxwell3d.setHLEReplacementName(0, 0x644, Maxwell::HLEReplaceName::BaseInstance); |             0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseVertex); | ||||||
|  |         maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |             0, 0x644, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|  |         maxwell3d.SetHLEReplacementAttributeType(0, 0x648, | ||||||
|  |                                                  Maxwell3D::HLEReplacementAttributeType::DrawID); | ||||||
|         maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, estimate); |         maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, estimate); | ||||||
|         maxwell3d.engine_state = Maxwell::EngineHint::None; |         maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|         maxwell3d.replace_table.clear(); |         maxwell3d.replace_table.clear(); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
| private: | private: | ||||||
|     void Fallback(const std::vector<u32>& parameters) { |     void Fallback(const std::vector<u32>& parameters) { | ||||||
|         SCOPE_EXIT({ |         SCOPE_EXIT({ | ||||||
|             // Clean everything.
 |  | ||||||
|             // Clean everything.
 |             // Clean everything.
 | ||||||
|             maxwell3d.regs.vertex_id_base = 0x0; |             maxwell3d.regs.vertex_id_base = 0x0; | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::None; |             maxwell3d.engine_state = Maxwell3D::EngineHint::None; | ||||||
|             maxwell3d.replace_table.clear(); |             maxwell3d.replace_table.clear(); | ||||||
|         }); |         }); | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|  | @ -283,7 +323,7 @@ private: | ||||||
|             // Nothing to do.
 |             // Nothing to do.
 | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|         const auto topology = static_cast<Maxwell::Regs::PrimitiveTopology>(parameters[2]); |         const auto topology = static_cast<Maxwell3D::Regs::PrimitiveTopology>(parameters[2]); | ||||||
|         const u32 padding = parameters[3]; |         const u32 padding = parameters[3]; | ||||||
|         const std::size_t max_draws = parameters[4]; |         const std::size_t max_draws = parameters[4]; | ||||||
| 
 | 
 | ||||||
|  | @ -297,9 +337,13 @@ private: | ||||||
|             const u32 base_vertex = parameters[base + 3]; |             const u32 base_vertex = parameters[base + 3]; | ||||||
|             const u32 base_instance = parameters[base + 4]; |             const u32 base_instance = parameters[base + 4]; | ||||||
|             maxwell3d.regs.vertex_id_base = base_vertex; |             maxwell3d.regs.vertex_id_base = base_vertex; | ||||||
|             maxwell3d.engine_state = Maxwell::EngineHint::OnHLEMacro; |             maxwell3d.engine_state = Maxwell3D::EngineHint::OnHLEMacro; | ||||||
|             maxwell3d.setHLEReplacementName(0, 0x640, Maxwell::HLEReplaceName::BaseVertex); |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|             maxwell3d.setHLEReplacementName(0, 0x644, Maxwell::HLEReplaceName::BaseInstance); |                 0, 0x640, Maxwell3D::HLEReplacementAttributeType::BaseVertex); | ||||||
|  |             maxwell3d.SetHLEReplacementAttributeType( | ||||||
|  |                 0, 0x644, Maxwell3D::HLEReplacementAttributeType::BaseInstance); | ||||||
|  |             maxwell3d.CallMethod(0x8e3, 0x648, true); | ||||||
|  |             maxwell3d.CallMethod(0x8e4, static_cast<u32>(index), true); | ||||||
|             maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; |             maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true; | ||||||
|             maxwell3d.draw_manager->DrawIndex(topology, parameters[base + 2], parameters[base], |             maxwell3d.draw_manager->DrawIndex(topology, parameters[base + 2], parameters[base], | ||||||
|                                               base_vertex, base_instance, parameters[base + 1]); |                                               base_vertex, base_instance, parameters[base + 1]); | ||||||
|  | @ -309,7 +353,7 @@ private: | ||||||
| 
 | 
 | ||||||
| class HLE_C713C83D8F63CCF3 final : public HLEMacroImpl { | class HLE_C713C83D8F63CCF3 final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_C713C83D8F63CCF3(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_C713C83D8F63CCF3(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|  | @ -325,7 +369,7 @@ public: | ||||||
| 
 | 
 | ||||||
| class HLE_D7333D26E0A93EDE final : public HLEMacroImpl { | class HLE_D7333D26E0A93EDE final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_D7333D26E0A93EDE(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_D7333D26E0A93EDE(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|  | @ -341,7 +385,7 @@ public: | ||||||
| 
 | 
 | ||||||
| class HLE_BindShader final : public HLEMacroImpl { | class HLE_BindShader final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_BindShader(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_BindShader(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|  | @ -371,7 +415,7 @@ public: | ||||||
| 
 | 
 | ||||||
| class HLE_SetRasterBoundingBox final : public HLEMacroImpl { | class HLE_SetRasterBoundingBox final : public HLEMacroImpl { | ||||||
| public: | public: | ||||||
|     explicit HLE_SetRasterBoundingBox(Engines::Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} |     explicit HLE_SetRasterBoundingBox(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
| 
 | 
 | ||||||
|     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|         maxwell3d.RefreshParameters(); |         maxwell3d.RefreshParameters(); | ||||||
|  | @ -384,60 +428,156 @@ public: | ||||||
|     } |     } | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
|  | template <size_t base_size> | ||||||
|  | class HLE_ClearConstBuffer final : public HLEMacroImpl { | ||||||
|  | public: | ||||||
|  |     explicit HLE_ClearConstBuffer(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|  | 
 | ||||||
|  |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|  |         maxwell3d.RefreshParameters(); | ||||||
|  |         static constexpr std::array<u32, base_size> zeroes{}; | ||||||
|  |         auto& regs = maxwell3d.regs; | ||||||
|  |         regs.const_buffer.size = static_cast<u32>(base_size); | ||||||
|  |         regs.const_buffer.address_high = parameters[0]; | ||||||
|  |         regs.const_buffer.address_low = parameters[1]; | ||||||
|  |         regs.const_buffer.offset = 0; | ||||||
|  |         maxwell3d.ProcessCBMultiData(zeroes.data(), parameters[2] * 4); | ||||||
|  |     } | ||||||
|  | }; | ||||||
|  | 
 | ||||||
|  | class HLE_ClearMemory final : public HLEMacroImpl { | ||||||
|  | public: | ||||||
|  |     explicit HLE_ClearMemory(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|  | 
 | ||||||
|  |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|  |         maxwell3d.RefreshParameters(); | ||||||
|  | 
 | ||||||
|  |         const u32 needed_memory = parameters[2] / sizeof(u32); | ||||||
|  |         if (needed_memory > zero_memory.size()) { | ||||||
|  |             zero_memory.resize(needed_memory, 0); | ||||||
|  |         } | ||||||
|  |         auto& regs = maxwell3d.regs; | ||||||
|  |         regs.upload.line_length_in = parameters[2]; | ||||||
|  |         regs.upload.line_count = 1; | ||||||
|  |         regs.upload.dest.address_high = parameters[0]; | ||||||
|  |         regs.upload.dest.address_low = parameters[1]; | ||||||
|  |         maxwell3d.CallMethod(static_cast<size_t>(MAXWELL3D_REG_INDEX(launch_dma)), 0x1011, true); | ||||||
|  |         maxwell3d.CallMultiMethod(static_cast<size_t>(MAXWELL3D_REG_INDEX(inline_data)), | ||||||
|  |                                   zero_memory.data(), needed_memory, needed_memory); | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|  | private: | ||||||
|  |     std::vector<u32> zero_memory; | ||||||
|  | }; | ||||||
|  | 
 | ||||||
|  | class HLE_TransformFeedbackSetup final : public HLEMacroImpl { | ||||||
|  | public: | ||||||
|  |     explicit HLE_TransformFeedbackSetup(Maxwell3D& maxwell3d_) : HLEMacroImpl(maxwell3d_) {} | ||||||
|  | 
 | ||||||
|  |     void Execute(const std::vector<u32>& parameters, [[maybe_unused]] u32 method) override { | ||||||
|  |         maxwell3d.RefreshParameters(); | ||||||
|  | 
 | ||||||
|  |         auto& regs = maxwell3d.regs; | ||||||
|  |         regs.transform_feedback_enabled = 1; | ||||||
|  |         regs.transform_feedback.buffers[0].start_offset = 0; | ||||||
|  |         regs.transform_feedback.buffers[1].start_offset = 0; | ||||||
|  |         regs.transform_feedback.buffers[2].start_offset = 0; | ||||||
|  |         regs.transform_feedback.buffers[3].start_offset = 0; | ||||||
|  | 
 | ||||||
|  |         regs.upload.line_length_in = 4; | ||||||
|  |         regs.upload.line_count = 1; | ||||||
|  |         regs.upload.dest.address_high = parameters[0]; | ||||||
|  |         regs.upload.dest.address_low = parameters[1]; | ||||||
|  |         maxwell3d.CallMethod(static_cast<size_t>(MAXWELL3D_REG_INDEX(launch_dma)), 0x1011, true); | ||||||
|  |         maxwell3d.CallMethod(static_cast<size_t>(MAXWELL3D_REG_INDEX(inline_data)), | ||||||
|  |                              regs.transform_feedback.controls[0].stride, true); | ||||||
|  |     } | ||||||
|  | }; | ||||||
|  | 
 | ||||||
| } // Anonymous namespace
 | } // Anonymous namespace
 | ||||||
| 
 | 
 | ||||||
| HLEMacro::HLEMacro(Engines::Maxwell3D& maxwell3d_) : maxwell3d{maxwell3d_} { | HLEMacro::HLEMacro(Maxwell3D& maxwell3d_) : maxwell3d{maxwell3d_} { | ||||||
|     builders.emplace(0x771BB18C62444DA0ULL, |     builders.emplace(0xDD6A7FA92A7D2674ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_771BB18C62444DA0>(maxwell3d__); |                              return std::make_unique<HLE_DrawArrays>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0x0D61FC9FAAC9FCADULL, |     builders.emplace(0x0D61FC9FAAC9FCADULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_DrawArraysIndirect>(maxwell3d__); |                              return std::make_unique<HLE_DrawArraysIndirect<false>>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0x8A4D173EB99A8603ULL, |     builders.emplace(0x8A4D173EB99A8603ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_DrawArraysIndirect>(maxwell3d__, true); |                              return std::make_unique<HLE_DrawArraysIndirect<true>>(maxwell3d__); | ||||||
|  |                          })); | ||||||
|  |     builders.emplace(0x2DB33AADB741839CULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_DrawIndexed>(maxwell3d__); | ||||||
|  |                          })); | ||||||
|  |     builders.emplace(0x771BB18C62444DA0ULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_DrawIndexedIndirect<false>>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0x0217920100488FF7ULL, |     builders.emplace(0x0217920100488FF7ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_DrawIndexedIndirect>(maxwell3d__); |                              return std::make_unique<HLE_DrawIndexedIndirect<true>>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0x3F5E74B9C9A50164ULL, |     builders.emplace(0x3F5E74B9C9A50164ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_MultiDrawIndexedIndirectCount>( |                              return std::make_unique<HLE_MultiDrawIndexedIndirectCount>( | ||||||
|                                  maxwell3d__); |                                  maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0xEAD26C3E2109B06BULL, |     builders.emplace(0xEAD26C3E2109B06BULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_MultiLayerClear>(maxwell3d__); |                              return std::make_unique<HLE_MultiLayerClear>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0xC713C83D8F63CCF3ULL, |     builders.emplace(0xC713C83D8F63CCF3ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_C713C83D8F63CCF3>(maxwell3d__); |                              return std::make_unique<HLE_C713C83D8F63CCF3>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0xD7333D26E0A93EDEULL, |     builders.emplace(0xD7333D26E0A93EDEULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_D7333D26E0A93EDE>(maxwell3d__); |                              return std::make_unique<HLE_D7333D26E0A93EDE>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0xEB29B2A09AA06D38ULL, |     builders.emplace(0xEB29B2A09AA06D38ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_BindShader>(maxwell3d__); |                              return std::make_unique<HLE_BindShader>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|     builders.emplace(0xDB1341DBEB4C8AF7ULL, |     builders.emplace(0xDB1341DBEB4C8AF7ULL, | ||||||
|                      std::function<std::unique_ptr<CachedMacro>(Engines::Maxwell3D&)>( |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|                          [](Engines::Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|                              return std::make_unique<HLE_SetRasterBoundingBox>(maxwell3d__); |                              return std::make_unique<HLE_SetRasterBoundingBox>(maxwell3d__); | ||||||
|                          })); |                          })); | ||||||
|  |     builders.emplace(0x6C97861D891EDf7EULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_ClearConstBuffer<0x5F00>>(maxwell3d__); | ||||||
|  |                          })); | ||||||
|  |     builders.emplace(0xD246FDDF3A6173D7ULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_ClearConstBuffer<0x7000>>(maxwell3d__); | ||||||
|  |                          })); | ||||||
|  |     builders.emplace(0xEE4D0004BEC8ECF4ULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_ClearMemory>(maxwell3d__); | ||||||
|  |                          })); | ||||||
|  |     builders.emplace(0xFC0CF27F5FFAA661ULL, | ||||||
|  |                      std::function<std::unique_ptr<CachedMacro>(Maxwell3D&)>( | ||||||
|  |                          [](Maxwell3D& maxwell3d__) -> std::unique_ptr<CachedMacro> { | ||||||
|  |                              return std::make_unique<HLE_TransformFeedbackSetup>(maxwell3d__); | ||||||
|  |                          })); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| HLEMacro::~HLEMacro() = default; | HLEMacro::~HLEMacro() = default; | ||||||
|  |  | ||||||
|  | @ -357,21 +357,21 @@ void RasterizerOpenGL::FlushRegion(VAddr addr, u64 size, VideoCommon::CacheType | ||||||
|     if (addr == 0 || size == 0) { |     if (addr == 0 || size == 0) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         texture_cache.DownloadMemory(addr, size); |         texture_cache.DownloadMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::BufferCache))) { |     if ((True(which & VideoCommon::CacheType::BufferCache))) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         buffer_cache.DownloadMemory(addr, size); |         buffer_cache.DownloadMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::QueryCache))) { |     if ((True(which & VideoCommon::CacheType::QueryCache))) { | ||||||
|         query_cache.FlushRegion(addr, size); |         query_cache.FlushRegion(addr, size); | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| bool RasterizerOpenGL::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheType which) { | bool RasterizerOpenGL::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheType which) { | ||||||
|     if ((bool(which & VideoCommon::CacheType::BufferCache))) { |     if ((True(which & VideoCommon::CacheType::BufferCache))) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         if (buffer_cache.IsRegionGpuModified(addr, size)) { |         if (buffer_cache.IsRegionGpuModified(addr, size)) { | ||||||
|             return true; |             return true; | ||||||
|  | @ -380,7 +380,7 @@ bool RasterizerOpenGL::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheT | ||||||
|     if (!Settings::IsGPULevelHigh()) { |     if (!Settings::IsGPULevelHigh()) { | ||||||
|         return false; |         return false; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         return texture_cache.IsRegionGpuModified(addr, size); |         return texture_cache.IsRegionGpuModified(addr, size); | ||||||
|     } |     } | ||||||
|  | @ -392,18 +392,18 @@ void RasterizerOpenGL::InvalidateRegion(VAddr addr, u64 size, VideoCommon::Cache | ||||||
|     if (addr == 0 || size == 0) { |     if (addr == 0 || size == 0) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         texture_cache.WriteMemory(addr, size); |         texture_cache.WriteMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::BufferCache)) { |     if (True(which & VideoCommon::CacheType::BufferCache)) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         buffer_cache.WriteMemory(addr, size); |         buffer_cache.WriteMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::ShaderCache)) { |     if (True(which & VideoCommon::CacheType::ShaderCache)) { | ||||||
|         shader_cache.InvalidateRegion(addr, size); |         shader_cache.InvalidateRegion(addr, size); | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::QueryCache)) { |     if (True(which & VideoCommon::CacheType::QueryCache)) { | ||||||
|         query_cache.InvalidateRegion(addr, size); |         query_cache.InvalidateRegion(addr, size); | ||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
|  | @ -431,21 +431,21 @@ void RasterizerVulkan::FlushRegion(VAddr addr, u64 size, VideoCommon::CacheType | ||||||
|     if (addr == 0 || size == 0) { |     if (addr == 0 || size == 0) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         texture_cache.DownloadMemory(addr, size); |         texture_cache.DownloadMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::BufferCache))) { |     if ((True(which & VideoCommon::CacheType::BufferCache))) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         buffer_cache.DownloadMemory(addr, size); |         buffer_cache.DownloadMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::QueryCache))) { |     if ((True(which & VideoCommon::CacheType::QueryCache))) { | ||||||
|         query_cache.FlushRegion(addr, size); |         query_cache.FlushRegion(addr, size); | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| bool RasterizerVulkan::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheType which) { | bool RasterizerVulkan::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheType which) { | ||||||
|     if ((bool(which & VideoCommon::CacheType::BufferCache))) { |     if ((True(which & VideoCommon::CacheType::BufferCache))) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         if (buffer_cache.IsRegionGpuModified(addr, size)) { |         if (buffer_cache.IsRegionGpuModified(addr, size)) { | ||||||
|             return true; |             return true; | ||||||
|  | @ -454,7 +454,7 @@ bool RasterizerVulkan::MustFlushRegion(VAddr addr, u64 size, VideoCommon::CacheT | ||||||
|     if (!Settings::IsGPULevelHigh()) { |     if (!Settings::IsGPULevelHigh()) { | ||||||
|         return false; |         return false; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         return texture_cache.IsRegionGpuModified(addr, size); |         return texture_cache.IsRegionGpuModified(addr, size); | ||||||
|     } |     } | ||||||
|  | @ -465,18 +465,18 @@ void RasterizerVulkan::InvalidateRegion(VAddr addr, u64 size, VideoCommon::Cache | ||||||
|     if (addr == 0 || size == 0) { |     if (addr == 0 || size == 0) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     if (bool(which & VideoCommon::CacheType::TextureCache)) { |     if (True(which & VideoCommon::CacheType::TextureCache)) { | ||||||
|         std::scoped_lock lock{texture_cache.mutex}; |         std::scoped_lock lock{texture_cache.mutex}; | ||||||
|         texture_cache.WriteMemory(addr, size); |         texture_cache.WriteMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::BufferCache))) { |     if ((True(which & VideoCommon::CacheType::BufferCache))) { | ||||||
|         std::scoped_lock lock{buffer_cache.mutex}; |         std::scoped_lock lock{buffer_cache.mutex}; | ||||||
|         buffer_cache.WriteMemory(addr, size); |         buffer_cache.WriteMemory(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::QueryCache))) { |     if ((True(which & VideoCommon::CacheType::QueryCache))) { | ||||||
|         query_cache.InvalidateRegion(addr, size); |         query_cache.InvalidateRegion(addr, size); | ||||||
|     } |     } | ||||||
|     if ((bool(which & VideoCommon::CacheType::ShaderCache))) { |     if ((True(which & VideoCommon::CacheType::ShaderCache))) { | ||||||
|         pipeline_cache.InvalidateRegion(addr, size); |         pipeline_cache.InvalidateRegion(addr, size); | ||||||
|     } |     } | ||||||
| } | } | ||||||
|  | @ -1050,7 +1050,7 @@ void RasterizerVulkan::UpdateDepthBiasEnable(Tegra::Engines::Maxwell3D::Regs& re | ||||||
|     constexpr size_t POINT = 0; |     constexpr size_t POINT = 0; | ||||||
|     constexpr size_t LINE = 1; |     constexpr size_t LINE = 1; | ||||||
|     constexpr size_t POLYGON = 2; |     constexpr size_t POLYGON = 2; | ||||||
|     constexpr std::array POLYGON_OFFSET_ENABLE_LUT = { |     static constexpr std::array POLYGON_OFFSET_ENABLE_LUT = { | ||||||
|         POINT,   // Points
 |         POINT,   // Points
 | ||||||
|         LINE,    // Lines
 |         LINE,    // Lines
 | ||||||
|         LINE,    // LineLoop
 |         LINE,    // LineLoop
 | ||||||
|  | @ -1159,13 +1159,12 @@ void RasterizerVulkan::UpdateStencilOp(Tegra::Engines::Maxwell3D::Regs& regs) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void RasterizerVulkan::UpdateLogicOp(Tegra::Engines::Maxwell3D::Regs& regs) { | void RasterizerVulkan::UpdateLogicOp(Tegra::Engines::Maxwell3D::Regs& regs) { | ||||||
|     if (!regs.logic_op.enable) { |  | ||||||
|         return; |  | ||||||
|     } |  | ||||||
|     if (!state_tracker.TouchLogicOp()) { |     if (!state_tracker.TouchLogicOp()) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     auto op = static_cast<VkLogicOp>(static_cast<u32>(regs.logic_op.op) - 0x1500); |     const auto op_value = static_cast<u32>(regs.logic_op.op); | ||||||
|  |     auto op = op_value >= 0x1500 && op_value < 0x1510 ? static_cast<VkLogicOp>(op_value - 0x1500) | ||||||
|  |                                                       : VK_LOGIC_OP_NO_OP; | ||||||
|     scheduler.Record([op](vk::CommandBuffer cmdbuf) { cmdbuf.SetLogicOpEXT(op); }); |     scheduler.Record([op](vk::CommandBuffer cmdbuf) { cmdbuf.SetLogicOpEXT(op); }); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -351,12 +351,14 @@ std::optional<Shader::ReplaceConstant> GraphicsEnvironment::GetReplaceConstBuffe | ||||||
|     if (it == maxwell3d->replace_table.end()) { |     if (it == maxwell3d->replace_table.end()) { | ||||||
|         return std::nullopt; |         return std::nullopt; | ||||||
|     } |     } | ||||||
|     const auto converted_value = [](Tegra::Engines::Maxwell3D::HLEReplaceName name) { |     const auto converted_value = [](Tegra::Engines::Maxwell3D::HLEReplacementAttributeType name) { | ||||||
|         switch (name) { |         switch (name) { | ||||||
|         case Tegra::Engines::Maxwell3D::HLEReplaceName::BaseVertex: |         case Tegra::Engines::Maxwell3D::HLEReplacementAttributeType::BaseVertex: | ||||||
|             return Shader::ReplaceConstant::BaseVertex; |             return Shader::ReplaceConstant::BaseVertex; | ||||||
|         case Tegra::Engines::Maxwell3D::HLEReplaceName::BaseInstance: |         case Tegra::Engines::Maxwell3D::HLEReplacementAttributeType::BaseInstance: | ||||||
|             return Shader::ReplaceConstant::BaseInstance; |             return Shader::ReplaceConstant::BaseInstance; | ||||||
|  |         case Tegra::Engines::Maxwell3D::HLEReplacementAttributeType::DrawID: | ||||||
|  |             return Shader::ReplaceConstant::DrawID; | ||||||
|         default: |         default: | ||||||
|             UNREACHABLE(); |             UNREACHABLE(); | ||||||
|         } |         } | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 Fernando Sahmkow
						Fernando Sahmkow