forked from eden-emu/eden
		
	Introduce skeleton of the GPU Compute Engine.
This commit is contained in:
		
							parent
							
								
									86e8a9f978
								
							
						
					
					
						commit
						e42bf4f314
					
				
					 3 changed files with 202 additions and 8 deletions
				
			
		|  | @ -4,12 +4,21 @@ | ||||||
| 
 | 
 | ||||||
| #include "common/assert.h" | #include "common/assert.h" | ||||||
| #include "common/logging/log.h" | #include "common/logging/log.h" | ||||||
|  | #include "core/core.h" | ||||||
| #include "video_core/engines/kepler_compute.h" | #include "video_core/engines/kepler_compute.h" | ||||||
|  | #include "video_core/engines/maxwell_3d.h" | ||||||
| #include "video_core/memory_manager.h" | #include "video_core/memory_manager.h" | ||||||
|  | #include "video_core/rasterizer_interface.h" | ||||||
|  | #include "video_core/renderer_base.h" | ||||||
|  | #include "video_core/textures/decoders.h" | ||||||
| 
 | 
 | ||||||
| namespace Tegra::Engines { | namespace Tegra::Engines { | ||||||
| 
 | 
 | ||||||
| KeplerCompute::KeplerCompute(MemoryManager& memory_manager) : memory_manager{memory_manager} {} | KeplerCompute::KeplerCompute(Core::System& system, VideoCore::RasterizerInterface& rasterizer, | ||||||
|  |                              MemoryManager& memory_manager) | ||||||
|  |     : system{system}, rasterizer{rasterizer}, memory_manager{memory_manager}, upload_state{ | ||||||
|  |                                                                                   memory_manager, | ||||||
|  |                                                                                   regs.upload} {} | ||||||
| 
 | 
 | ||||||
| KeplerCompute::~KeplerCompute() = default; | KeplerCompute::~KeplerCompute() = default; | ||||||
| 
 | 
 | ||||||
|  | @ -20,14 +29,34 @@ void KeplerCompute::CallMethod(const GPU::MethodCall& method_call) { | ||||||
|     regs.reg_array[method_call.method] = method_call.argument; |     regs.reg_array[method_call.method] = method_call.argument; | ||||||
| 
 | 
 | ||||||
|     switch (method_call.method) { |     switch (method_call.method) { | ||||||
|  |     case KEPLER_COMPUTE_REG_INDEX(exec_upload): { | ||||||
|  |         upload_state.ProcessExec(regs.exec_upload.linear != 0); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     case KEPLER_COMPUTE_REG_INDEX(data_upload): { | ||||||
|  |         bool is_last_call = method_call.IsLastCall(); | ||||||
|  |         upload_state.ProcessData(method_call.argument, is_last_call); | ||||||
|  |         if (is_last_call) { | ||||||
|  |             system.GPU().Maxwell3D().dirty_flags.OnMemoryWrite(); | ||||||
|  |         } | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|     case KEPLER_COMPUTE_REG_INDEX(launch): |     case KEPLER_COMPUTE_REG_INDEX(launch): | ||||||
|         // Abort execution since compute shaders can be used to alter game memory (e.g. CUDA
 |         ProcessLaunch(); | ||||||
|         // kernels)
 |  | ||||||
|         UNREACHABLE_MSG("Compute shaders are not implemented"); |  | ||||||
|         break; |         break; | ||||||
|     default: |     default: | ||||||
|         break; |         break; | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | void KeplerCompute::ProcessLaunch() { | ||||||
|  | 
 | ||||||
|  |     const GPUVAddr launch_desc_loc = regs.launch_desc_loc.Address(); | ||||||
|  |     memory_manager.ReadBlockUnsafe(launch_desc_loc, &launch_description, | ||||||
|  |                                    LaunchParams::NUM_LAUNCH_PARAMETERS * sizeof(u32)); | ||||||
|  | 
 | ||||||
|  |     const GPUVAddr code_loc = regs.code_loc.Address() + launch_description.program_start; | ||||||
|  |     LOG_WARNING(HW_GPU, "Compute Kernel Execute at Address 0x{:016x}, STUBBED", code_loc); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| } // namespace Tegra::Engines
 | } // namespace Tegra::Engines
 | ||||||
|  |  | ||||||
|  | @ -6,14 +6,25 @@ | ||||||
| 
 | 
 | ||||||
| #include <array> | #include <array> | ||||||
| #include <cstddef> | #include <cstddef> | ||||||
|  | #include <vector> | ||||||
|  | #include "common/bit_field.h" | ||||||
| #include "common/common_funcs.h" | #include "common/common_funcs.h" | ||||||
| #include "common/common_types.h" | #include "common/common_types.h" | ||||||
|  | #include "video_core/engines/engine_upload.h" | ||||||
| #include "video_core/gpu.h" | #include "video_core/gpu.h" | ||||||
| 
 | 
 | ||||||
|  | namespace Core { | ||||||
|  | class System; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| namespace Tegra { | namespace Tegra { | ||||||
| class MemoryManager; | class MemoryManager; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | namespace VideoCore { | ||||||
|  | class RasterizerInterface; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| namespace Tegra::Engines { | namespace Tegra::Engines { | ||||||
| 
 | 
 | ||||||
| #define KEPLER_COMPUTE_REG_INDEX(field_name)                                                       \ | #define KEPLER_COMPUTE_REG_INDEX(field_name)                                                       \ | ||||||
|  | @ -21,7 +32,8 @@ namespace Tegra::Engines { | ||||||
| 
 | 
 | ||||||
| class KeplerCompute final { | class KeplerCompute final { | ||||||
| public: | public: | ||||||
|     explicit KeplerCompute(MemoryManager& memory_manager); |     explicit KeplerCompute(Core::System& system, VideoCore::RasterizerInterface& rasterizer, | ||||||
|  |                            MemoryManager& memory_manager); | ||||||
|     ~KeplerCompute(); |     ~KeplerCompute(); | ||||||
| 
 | 
 | ||||||
|     static constexpr std::size_t NumConstBuffers = 8; |     static constexpr std::size_t NumConstBuffers = 8; | ||||||
|  | @ -31,30 +43,183 @@ public: | ||||||
| 
 | 
 | ||||||
|         union { |         union { | ||||||
|             struct { |             struct { | ||||||
|                 INSERT_PADDING_WORDS(0xAF); |                 INSERT_PADDING_WORDS(0x60); | ||||||
|  | 
 | ||||||
|  |                 Upload::Data upload; | ||||||
|  | 
 | ||||||
|  |                 struct { | ||||||
|  |                     union { | ||||||
|  |                         BitField<0, 1, u32> linear; | ||||||
|  |                     }; | ||||||
|  |                 } exec_upload; | ||||||
|  | 
 | ||||||
|  |                 u32 data_upload; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x3F); | ||||||
|  | 
 | ||||||
|  |                 struct { | ||||||
|  |                     u32 address; | ||||||
|  |                     GPUVAddr Address() const { | ||||||
|  |                         return static_cast<GPUVAddr>((static_cast<GPUVAddr>(address) << 8)); | ||||||
|  |                     } | ||||||
|  |                 } launch_desc_loc; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x1); | ||||||
| 
 | 
 | ||||||
|                 u32 launch; |                 u32 launch; | ||||||
| 
 | 
 | ||||||
|                 INSERT_PADDING_WORDS(0xC48); |                 INSERT_PADDING_WORDS(0x4A7); | ||||||
|  | 
 | ||||||
|  |                 struct { | ||||||
|  |                     u32 address_high; | ||||||
|  |                     u32 address_low; | ||||||
|  |                     u32 limit; | ||||||
|  |                     GPUVAddr Address() const { | ||||||
|  |                         return static_cast<GPUVAddr>((static_cast<GPUVAddr>(address_high) << 32) | | ||||||
|  |                                                      address_low); | ||||||
|  |                     } | ||||||
|  |                 } tsc; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x3); | ||||||
|  | 
 | ||||||
|  |                 struct { | ||||||
|  |                     u32 address_high; | ||||||
|  |                     u32 address_low; | ||||||
|  |                     u32 limit; | ||||||
|  |                     GPUVAddr Address() const { | ||||||
|  |                         return static_cast<GPUVAddr>((static_cast<GPUVAddr>(address_high) << 32) | | ||||||
|  |                                                      address_low); | ||||||
|  |                     } | ||||||
|  |                 } tic; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x22); | ||||||
|  | 
 | ||||||
|  |                 struct { | ||||||
|  |                     u32 address_high; | ||||||
|  |                     u32 address_low; | ||||||
|  |                     GPUVAddr Address() const { | ||||||
|  |                         return static_cast<GPUVAddr>((static_cast<GPUVAddr>(address_high) << 32) | | ||||||
|  |                                                      address_low); | ||||||
|  |                     } | ||||||
|  |                 } code_loc; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x3FE); | ||||||
|  | 
 | ||||||
|  |                 u32 texture_const_buffer_index; | ||||||
|  | 
 | ||||||
|  |                 INSERT_PADDING_WORDS(0x374); | ||||||
|             }; |             }; | ||||||
|             std::array<u32, NUM_REGS> reg_array; |             std::array<u32, NUM_REGS> reg_array; | ||||||
|         }; |         }; | ||||||
|     } regs{}; |     } regs{}; | ||||||
|  | 
 | ||||||
|  |     struct LaunchParams { | ||||||
|  |         static constexpr std::size_t NUM_LAUNCH_PARAMETERS = 0x40; | ||||||
|  | 
 | ||||||
|  |         INSERT_PADDING_WORDS(0x8); | ||||||
|  | 
 | ||||||
|  |         u32 program_start; | ||||||
|  | 
 | ||||||
|  |         INSERT_PADDING_WORDS(0x2); | ||||||
|  | 
 | ||||||
|  |         BitField<30, 1, u32> linked_tsc; | ||||||
|  | 
 | ||||||
|  |         BitField<0, 31, u32> grid_dim_x; | ||||||
|  | 
 | ||||||
|  |         union { | ||||||
|  |             BitField<0, 16, u32> grid_dim_y; | ||||||
|  |             BitField<16, 16, u32> grid_dim_z; | ||||||
|  |         }; | ||||||
|  | 
 | ||||||
|  |         INSERT_PADDING_WORDS(0x3); | ||||||
|  | 
 | ||||||
|  |         BitField<0, 16, u32> shared_alloc; | ||||||
|  | 
 | ||||||
|  |         BitField<0, 31, u32> block_dim_x; | ||||||
|  | 
 | ||||||
|  |         union { | ||||||
|  |             BitField<0, 16, u32> block_dim_y; | ||||||
|  |             BitField<16, 16, u32> block_dim_z; | ||||||
|  |         }; | ||||||
|  | 
 | ||||||
|  |         union { | ||||||
|  |             BitField<0, 8, u32> const_buffer_enable_mask; | ||||||
|  |             BitField<29, 2, u32> cache_layout; | ||||||
|  |         } memory_config; | ||||||
|  | 
 | ||||||
|  |         INSERT_PADDING_WORDS(0x8); | ||||||
|  | 
 | ||||||
|  |         struct { | ||||||
|  |             u32 address_low; | ||||||
|  |             union { | ||||||
|  |                 BitField<0, 8, u32> address_high; | ||||||
|  |                 BitField<15, 17, u32> size; | ||||||
|  |             }; | ||||||
|  |             GPUVAddr Address() const { | ||||||
|  |                 return static_cast<GPUVAddr>((static_cast<GPUVAddr>(address_high.Value()) << 32) | | ||||||
|  |                                              address_low); | ||||||
|  |             } | ||||||
|  |         } const_buffer_config[8]; | ||||||
|  | 
 | ||||||
|  |         union { | ||||||
|  |             BitField<0, 20, u32> local_pos_alloc; | ||||||
|  |             BitField<27, 5, u32> barrier_alloc; | ||||||
|  |         }; | ||||||
|  | 
 | ||||||
|  |         union { | ||||||
|  |             BitField<0, 20, u32> local_neg_alloc; | ||||||
|  |             BitField<24, 5, u32> gpr_alloc; | ||||||
|  |         }; | ||||||
|  | 
 | ||||||
|  |         INSERT_PADDING_WORDS(0x11); | ||||||
|  |     } launch_description; | ||||||
|  | 
 | ||||||
|  |     struct { | ||||||
|  |         u32 write_offset = 0; | ||||||
|  |         u32 copy_size = 0; | ||||||
|  |         std::vector<u8> inner_buffer; | ||||||
|  |     } state{}; | ||||||
|  | 
 | ||||||
|     static_assert(sizeof(Regs) == Regs::NUM_REGS * sizeof(u32), |     static_assert(sizeof(Regs) == Regs::NUM_REGS * sizeof(u32), | ||||||
|                   "KeplerCompute Regs has wrong size"); |                   "KeplerCompute Regs has wrong size"); | ||||||
| 
 | 
 | ||||||
|  |     static_assert(sizeof(LaunchParams) == LaunchParams::NUM_LAUNCH_PARAMETERS * sizeof(u32), | ||||||
|  |                   "KeplerCompute LaunchParams has wrong size"); | ||||||
|  | 
 | ||||||
|     /// Write the value to the register identified by method.
 |     /// Write the value to the register identified by method.
 | ||||||
|     void CallMethod(const GPU::MethodCall& method_call); |     void CallMethod(const GPU::MethodCall& method_call); | ||||||
| 
 | 
 | ||||||
| private: | private: | ||||||
|  |     Core::System& system; | ||||||
|  |     VideoCore::RasterizerInterface& rasterizer; | ||||||
|     MemoryManager& memory_manager; |     MemoryManager& memory_manager; | ||||||
|  |     Upload::State upload_state; | ||||||
|  | 
 | ||||||
|  |     void ProcessLaunch(); | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| #define ASSERT_REG_POSITION(field_name, position)                                                  \ | #define ASSERT_REG_POSITION(field_name, position)                                                  \ | ||||||
|     static_assert(offsetof(KeplerCompute::Regs, field_name) == position * 4,                       \ |     static_assert(offsetof(KeplerCompute::Regs, field_name) == position * 4,                       \ | ||||||
|                   "Field " #field_name " has invalid position") |                   "Field " #field_name " has invalid position") | ||||||
| 
 | 
 | ||||||
|  | #define ASSERT_LAUNCH_PARAM_POSITION(field_name, position)                                         \ | ||||||
|  |     static_assert(offsetof(KeplerCompute::LaunchParams, field_name) == position * 4,               \ | ||||||
|  |                   "Field " #field_name " has invalid position") | ||||||
|  | 
 | ||||||
|  | ASSERT_REG_POSITION(upload, 0x60); | ||||||
|  | ASSERT_REG_POSITION(exec_upload, 0x6C); | ||||||
|  | ASSERT_REG_POSITION(data_upload, 0x6D); | ||||||
| ASSERT_REG_POSITION(launch, 0xAF); | ASSERT_REG_POSITION(launch, 0xAF); | ||||||
|  | ASSERT_REG_POSITION(tsc, 0x557); | ||||||
|  | ASSERT_REG_POSITION(tic, 0x55D); | ||||||
|  | ASSERT_REG_POSITION(code_loc, 0x582); | ||||||
|  | ASSERT_REG_POSITION(texture_const_buffer_index, 0x982); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(program_start, 0x8); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(grid_dim_x, 0xC); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(shared_alloc, 0x11); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(block_dim_x, 0x12); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(memory_config, 0x14); | ||||||
|  | ASSERT_LAUNCH_PARAM_POSITION(const_buffer_config, 0x1D); | ||||||
| 
 | 
 | ||||||
| #undef ASSERT_REG_POSITION | #undef ASSERT_REG_POSITION | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -35,7 +35,7 @@ GPU::GPU(Core::System& system, VideoCore::RendererBase& renderer) : renderer{ren | ||||||
|     dma_pusher = std::make_unique<Tegra::DmaPusher>(*this); |     dma_pusher = std::make_unique<Tegra::DmaPusher>(*this); | ||||||
|     maxwell_3d = std::make_unique<Engines::Maxwell3D>(system, rasterizer, *memory_manager); |     maxwell_3d = std::make_unique<Engines::Maxwell3D>(system, rasterizer, *memory_manager); | ||||||
|     fermi_2d = std::make_unique<Engines::Fermi2D>(rasterizer, *memory_manager); |     fermi_2d = std::make_unique<Engines::Fermi2D>(rasterizer, *memory_manager); | ||||||
|     kepler_compute = std::make_unique<Engines::KeplerCompute>(*memory_manager); |     kepler_compute = std::make_unique<Engines::KeplerCompute>(system, rasterizer, *memory_manager); | ||||||
|     maxwell_dma = std::make_unique<Engines::MaxwellDMA>(system, rasterizer, *memory_manager); |     maxwell_dma = std::make_unique<Engines::MaxwellDMA>(system, rasterizer, *memory_manager); | ||||||
|     kepler_memory = std::make_unique<Engines::KeplerMemory>(system, *memory_manager); |     kepler_memory = std::make_unique<Engines::KeplerMemory>(system, *memory_manager); | ||||||
| } | } | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 Fernando Sahmkow
						Fernando Sahmkow