forked from eden-emu/eden
		
	spirv: Replace Constant/ConstantComposite with Const helper
This commit is contained in:
		
							parent
							
								
									4a97dd4483
								
							
						
					
					
						commit
						688c89590c
					
				
					 12 changed files with 100 additions and 111 deletions
				
			
		|  | @ -131,13 +131,13 @@ Id DefineInput(EmitContext& ctx, Id type, bool per_invocation, | ||||||
|     case Stage::TessellationControl: |     case Stage::TessellationControl: | ||||||
|     case Stage::TessellationEval: |     case Stage::TessellationEval: | ||||||
|         if (per_invocation) { |         if (per_invocation) { | ||||||
|             type = ctx.TypeArray(type, ctx.Constant(ctx.U32[1], 32u)); |             type = ctx.TypeArray(type, ctx.Const(32u)); | ||||||
|         } |         } | ||||||
|         break; |         break; | ||||||
|     case Stage::Geometry: |     case Stage::Geometry: | ||||||
|         if (per_invocation) { |         if (per_invocation) { | ||||||
|             const u32 num_vertices{NumVertices(ctx.profile.input_topology)}; |             const u32 num_vertices{NumVertices(ctx.profile.input_topology)}; | ||||||
|             type = ctx.TypeArray(type, ctx.Constant(ctx.U32[1], num_vertices)); |             type = ctx.TypeArray(type, ctx.Const(num_vertices)); | ||||||
|         } |         } | ||||||
|         break; |         break; | ||||||
|     default: |     default: | ||||||
|  | @ -149,7 +149,7 @@ Id DefineInput(EmitContext& ctx, Id type, bool per_invocation, | ||||||
| Id DefineOutput(EmitContext& ctx, Id type, std::optional<u32> invocations, | Id DefineOutput(EmitContext& ctx, Id type, std::optional<u32> invocations, | ||||||
|                 std::optional<spv::BuiltIn> builtin = std::nullopt) { |                 std::optional<spv::BuiltIn> builtin = std::nullopt) { | ||||||
|     if (invocations && ctx.stage == Stage::TessellationControl) { |     if (invocations && ctx.stage == Stage::TessellationControl) { | ||||||
|         type = ctx.TypeArray(type, ctx.Constant(ctx.U32[1], *invocations)); |         type = ctx.TypeArray(type, ctx.Const(*invocations)); | ||||||
|     } |     } | ||||||
|     return DefineVariable(ctx, type, builtin, spv::StorageClass::Output); |     return DefineVariable(ctx, type, builtin, spv::StorageClass::Output); | ||||||
| } | } | ||||||
|  | @ -224,7 +224,7 @@ std::optional<AttrInfo> AttrTypes(EmitContext& ctx, u32 index) { | ||||||
| 
 | 
 | ||||||
| void DefineConstBuffers(EmitContext& ctx, const Info& info, Id UniformDefinitions::*member_type, | void DefineConstBuffers(EmitContext& ctx, const Info& info, Id UniformDefinitions::*member_type, | ||||||
|                         u32 binding, Id type, char type_char, u32 element_size) { |                         u32 binding, Id type, char type_char, u32 element_size) { | ||||||
|     const Id array_type{ctx.TypeArray(type, ctx.Constant(ctx.U32[1], 65536U / element_size))}; |     const Id array_type{ctx.TypeArray(type, ctx.Const(65536U / element_size))}; | ||||||
|     ctx.Decorate(array_type, spv::Decoration::ArrayStride, element_size); |     ctx.Decorate(array_type, spv::Decoration::ArrayStride, element_size); | ||||||
| 
 | 
 | ||||||
|     const Id struct_type{ctx.TypeStruct(array_type)}; |     const Id struct_type{ctx.TypeStruct(array_type)}; | ||||||
|  | @ -328,7 +328,7 @@ Id CasLoop(EmitContext& ctx, Operation operation, Id array_pointer, Id element_p | ||||||
|     const bool is_struct{!is_shared || ctx.profile.support_explicit_workgroup_layout}; |     const bool is_struct{!is_shared || ctx.profile.support_explicit_workgroup_layout}; | ||||||
|     const Id cas_func{CasFunction(ctx, operation, value_type)}; |     const Id cas_func{CasFunction(ctx, operation, value_type)}; | ||||||
|     const Id zero{ctx.u32_zero_value}; |     const Id zero{ctx.u32_zero_value}; | ||||||
|     const Id scope_id{ctx.Constant(ctx.U32[1], static_cast<u32>(scope))}; |     const Id scope_id{ctx.Const(static_cast<u32>(scope))}; | ||||||
| 
 | 
 | ||||||
|     const Id loop_header{ctx.OpLabel()}; |     const Id loop_header{ctx.OpLabel()}; | ||||||
|     const Id continue_block{ctx.OpLabel()}; |     const Id continue_block{ctx.OpLabel()}; | ||||||
|  | @ -428,11 +428,11 @@ Id EmitContext::Def(const IR::Value& value) { | ||||||
|     case IR::Type::U1: |     case IR::Type::U1: | ||||||
|         return value.U1() ? true_value : false_value; |         return value.U1() ? true_value : false_value; | ||||||
|     case IR::Type::U32: |     case IR::Type::U32: | ||||||
|         return Constant(U32[1], value.U32()); |         return Const(value.U32()); | ||||||
|     case IR::Type::U64: |     case IR::Type::U64: | ||||||
|         return Constant(U64, value.U64()); |         return Constant(U64, value.U64()); | ||||||
|     case IR::Type::F32: |     case IR::Type::F32: | ||||||
|         return Constant(F32[1], value.F32()); |         return Const(value.F32()); | ||||||
|     case IR::Type::F64: |     case IR::Type::F64: | ||||||
|         return Constant(F64[1], value.F64()); |         return Constant(F64[1], value.F64()); | ||||||
|     case IR::Type::Label: |     case IR::Type::Label: | ||||||
|  | @ -486,8 +486,8 @@ void EmitContext::DefineCommonTypes(const Info& info) { | ||||||
| void EmitContext::DefineCommonConstants() { | void EmitContext::DefineCommonConstants() { | ||||||
|     true_value = ConstantTrue(U1); |     true_value = ConstantTrue(U1); | ||||||
|     false_value = ConstantFalse(U1); |     false_value = ConstantFalse(U1); | ||||||
|     u32_zero_value = Constant(U32[1], 0U); |     u32_zero_value = Const(0U); | ||||||
|     f32_zero_value = Constant(F32[1], 0.0f); |     f32_zero_value = Const(0.0f); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void EmitContext::DefineInterfaces(const IR::Program& program) { | void EmitContext::DefineInterfaces(const IR::Program& program) { | ||||||
|  | @ -500,7 +500,7 @@ void EmitContext::DefineLocalMemory(const IR::Program& program) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     const u32 num_elements{Common::DivCeil(program.local_memory_size, 4U)}; |     const u32 num_elements{Common::DivCeil(program.local_memory_size, 4U)}; | ||||||
|     const Id type{TypeArray(U32[1], Constant(U32[1], num_elements))}; |     const Id type{TypeArray(U32[1], Const(num_elements))}; | ||||||
|     const Id pointer{TypePointer(spv::StorageClass::Private, type)}; |     const Id pointer{TypePointer(spv::StorageClass::Private, type)}; | ||||||
|     local_memory = AddGlobalVariable(pointer, spv::StorageClass::Private); |     local_memory = AddGlobalVariable(pointer, spv::StorageClass::Private); | ||||||
|     if (profile.supported_spirv >= 0x00010400) { |     if (profile.supported_spirv >= 0x00010400) { | ||||||
|  | @ -514,7 +514,7 @@ void EmitContext::DefineSharedMemory(const IR::Program& program) { | ||||||
|     } |     } | ||||||
|     const auto make{[&](Id element_type, u32 element_size) { |     const auto make{[&](Id element_type, u32 element_size) { | ||||||
|         const u32 num_elements{Common::DivCeil(program.shared_memory_size, element_size)}; |         const u32 num_elements{Common::DivCeil(program.shared_memory_size, element_size)}; | ||||||
|         const Id array_type{TypeArray(element_type, Constant(U32[1], num_elements))}; |         const Id array_type{TypeArray(element_type, Const(num_elements))}; | ||||||
|         Decorate(array_type, spv::Decoration::ArrayStride, element_size); |         Decorate(array_type, spv::Decoration::ArrayStride, element_size); | ||||||
| 
 | 
 | ||||||
|         const Id struct_type{TypeStruct(array_type)}; |         const Id struct_type{TypeStruct(array_type)}; | ||||||
|  | @ -549,7 +549,7 @@ void EmitContext::DefineSharedMemory(const IR::Program& program) { | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     const u32 num_elements{Common::DivCeil(program.shared_memory_size, 4U)}; |     const u32 num_elements{Common::DivCeil(program.shared_memory_size, 4U)}; | ||||||
|     const Id type{TypeArray(U32[1], Constant(U32[1], num_elements))}; |     const Id type{TypeArray(U32[1], Const(num_elements))}; | ||||||
|     shared_memory_u32_type = TypePointer(spv::StorageClass::Workgroup, type); |     shared_memory_u32_type = TypePointer(spv::StorageClass::Workgroup, type); | ||||||
| 
 | 
 | ||||||
|     shared_u32 = TypePointer(spv::StorageClass::Workgroup, U32[1]); |     shared_u32 = TypePointer(spv::StorageClass::Workgroup, U32[1]); | ||||||
|  | @ -569,10 +569,10 @@ void EmitContext::DefineSharedMemory(const IR::Program& program) { | ||||||
|         OpBranch(loop_header); |         OpBranch(loop_header); | ||||||
| 
 | 
 | ||||||
|         AddLabel(loop_header); |         AddLabel(loop_header); | ||||||
|         const Id word_offset{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))}; |         const Id word_offset{OpShiftRightArithmetic(U32[1], offset, Const(2U))}; | ||||||
|         const Id shift_offset{OpShiftLeftLogical(U32[1], offset, Constant(U32[1], 3U))}; |         const Id shift_offset{OpShiftLeftLogical(U32[1], offset, Const(3U))}; | ||||||
|         const Id bit_offset{OpBitwiseAnd(U32[1], shift_offset, Constant(U32[1], mask))}; |         const Id bit_offset{OpBitwiseAnd(U32[1], shift_offset, Const(mask))}; | ||||||
|         const Id count{Constant(U32[1], size)}; |         const Id count{Const(size)}; | ||||||
|         OpLoopMerge(merge_block, continue_block, spv::LoopControlMask::MaskNone); |         OpLoopMerge(merge_block, continue_block, spv::LoopControlMask::MaskNone); | ||||||
|         OpBranch(continue_block); |         OpBranch(continue_block); | ||||||
| 
 | 
 | ||||||
|  | @ -580,9 +580,8 @@ void EmitContext::DefineSharedMemory(const IR::Program& program) { | ||||||
|         const Id word_pointer{OpAccessChain(shared_u32, shared_memory_u32, word_offset)}; |         const Id word_pointer{OpAccessChain(shared_u32, shared_memory_u32, word_offset)}; | ||||||
|         const Id old_value{OpLoad(U32[1], word_pointer)}; |         const Id old_value{OpLoad(U32[1], word_pointer)}; | ||||||
|         const Id new_value{OpBitFieldInsert(U32[1], old_value, insert_value, bit_offset, count)}; |         const Id new_value{OpBitFieldInsert(U32[1], old_value, insert_value, bit_offset, count)}; | ||||||
|         const Id atomic_res{OpAtomicCompareExchange(U32[1], word_pointer, Constant(U32[1], 1U), |         const Id atomic_res{OpAtomicCompareExchange(U32[1], word_pointer, Const(1U), u32_zero_value, | ||||||
|                                                     u32_zero_value, u32_zero_value, new_value, |                                                     u32_zero_value, new_value, old_value)}; | ||||||
|                                                     old_value)}; |  | ||||||
|         const Id success{OpIEqual(U1, atomic_res, old_value)}; |         const Id success{OpIEqual(U1, atomic_res, old_value)}; | ||||||
|         OpBranchConditional(success, merge_block, loop_header); |         OpBranchConditional(success, merge_block, loop_header); | ||||||
| 
 | 
 | ||||||
|  | @ -623,9 +622,9 @@ void EmitContext::DefineAttributeMemAccess(const Info& info) { | ||||||
|         const Id vertex{is_array ? OpFunctionParameter(U32[1]) : Id{}}; |         const Id vertex{is_array ? OpFunctionParameter(U32[1]) : Id{}}; | ||||||
| 
 | 
 | ||||||
|         AddLabel(); |         AddLabel(); | ||||||
|         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))}; |         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Const(2U))}; | ||||||
|         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Constant(U32[1], 3U))}; |         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Const(3U))}; | ||||||
|         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Constant(U32[1], 2U))}; |         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Const(2U))}; | ||||||
|         std::vector<Sirit::Literal> literals; |         std::vector<Sirit::Literal> literals; | ||||||
|         std::vector<Id> labels; |         std::vector<Id> labels; | ||||||
|         if (info.loads_position) { |         if (info.loads_position) { | ||||||
|  | @ -643,7 +642,7 @@ void EmitContext::DefineAttributeMemAccess(const Info& info) { | ||||||
|         OpSelectionMerge(end_block, spv::SelectionControlMask::MaskNone); |         OpSelectionMerge(end_block, spv::SelectionControlMask::MaskNone); | ||||||
|         OpSwitch(compare_index, default_label, literals, labels); |         OpSwitch(compare_index, default_label, literals, labels); | ||||||
|         AddLabel(default_label); |         AddLabel(default_label); | ||||||
|         OpReturnValue(Constant(F32[1], 0.0f)); |         OpReturnValue(Const(0.0f)); | ||||||
|         size_t label_index{0}; |         size_t label_index{0}; | ||||||
|         if (info.loads_position) { |         if (info.loads_position) { | ||||||
|             AddLabel(labels[label_index]); |             AddLabel(labels[label_index]); | ||||||
|  | @ -661,7 +660,7 @@ void EmitContext::DefineAttributeMemAccess(const Info& info) { | ||||||
|             AddLabel(labels[label_index]); |             AddLabel(labels[label_index]); | ||||||
|             const auto type{AttrTypes(*this, static_cast<u32>(i))}; |             const auto type{AttrTypes(*this, static_cast<u32>(i))}; | ||||||
|             if (!type) { |             if (!type) { | ||||||
|                 OpReturnValue(Constant(F32[1], 0.0f)); |                 OpReturnValue(Const(0.0f)); | ||||||
|                 ++label_index; |                 ++label_index; | ||||||
|                 continue; |                 continue; | ||||||
|             } |             } | ||||||
|  | @ -688,9 +687,9 @@ void EmitContext::DefineAttributeMemAccess(const Info& info) { | ||||||
|         const Id offset{OpFunctionParameter(U32[1])}; |         const Id offset{OpFunctionParameter(U32[1])}; | ||||||
|         const Id store_value{OpFunctionParameter(F32[1])}; |         const Id store_value{OpFunctionParameter(F32[1])}; | ||||||
|         AddLabel(); |         AddLabel(); | ||||||
|         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))}; |         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Const(2U))}; | ||||||
|         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Constant(U32[1], 3U))}; |         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Const(3U))}; | ||||||
|         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Constant(U32[1], 2U))}; |         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Const(2U))}; | ||||||
|         std::vector<Sirit::Literal> literals; |         std::vector<Sirit::Literal> literals; | ||||||
|         std::vector<Id> labels; |         std::vector<Id> labels; | ||||||
|         if (info.stores_position) { |         if (info.stores_position) { | ||||||
|  | @ -744,7 +743,7 @@ void EmitContext::DefineAttributeMemAccess(const Info& info) { | ||||||
|             OpReturn(); |             OpReturn(); | ||||||
|             ++label_index; |             ++label_index; | ||||||
|             AddLabel(labels[label_index]); |             AddLabel(labels[label_index]); | ||||||
|             const Id fixed_index{OpIAdd(U32[1], masked_index, Constant(U32[1], 4))}; |             const Id fixed_index{OpIAdd(U32[1], masked_index, Const(4U))}; | ||||||
|             const Id pointer2{OpAccessChain(output_f32, clip_distances, fixed_index)}; |             const Id pointer2{OpAccessChain(output_f32, clip_distances, fixed_index)}; | ||||||
|             OpStore(pointer2, store_value); |             OpStore(pointer2, store_value); | ||||||
|             OpReturn(); |             OpReturn(); | ||||||
|  | @ -1018,9 +1017,9 @@ void EmitContext::DefineInputs(const Info& info) { | ||||||
|             DefineInput(*this, U32[1], false, spv::BuiltIn::SubgroupLocalInvocationId); |             DefineInput(*this, U32[1], false, spv::BuiltIn::SubgroupLocalInvocationId); | ||||||
|     } |     } | ||||||
|     if (info.uses_fswzadd) { |     if (info.uses_fswzadd) { | ||||||
|         const Id f32_one{Constant(F32[1], 1.0f)}; |         const Id f32_one{Const(1.0f)}; | ||||||
|         const Id f32_minus_one{Constant(F32[1], -1.0f)}; |         const Id f32_minus_one{Const(-1.0f)}; | ||||||
|         const Id f32_zero{Constant(F32[1], 0.0f)}; |         const Id f32_zero{Const(0.0f)}; | ||||||
|         fswzadd_lut_a = ConstantComposite(F32[4], f32_minus_one, f32_one, f32_minus_one, f32_zero); |         fswzadd_lut_a = ConstantComposite(F32[4], f32_minus_one, f32_one, f32_minus_one, f32_zero); | ||||||
|         fswzadd_lut_b = |         fswzadd_lut_b = | ||||||
|             ConstantComposite(F32[4], f32_minus_one, f32_minus_one, f32_one, f32_minus_one); |             ConstantComposite(F32[4], f32_minus_one, f32_minus_one, f32_one, f32_minus_one); | ||||||
|  | @ -1118,7 +1117,7 @@ void EmitContext::DefineOutputs(const IR::Program& program) { | ||||||
|         if (stage == Stage::Fragment) { |         if (stage == Stage::Fragment) { | ||||||
|             throw NotImplementedException("Storing ClipDistance in fragment stage"); |             throw NotImplementedException("Storing ClipDistance in fragment stage"); | ||||||
|         } |         } | ||||||
|         const Id type{TypeArray(F32[1], Constant(U32[1], 8U))}; |         const Id type{TypeArray(F32[1], Const(8U))}; | ||||||
|         clip_distances = DefineOutput(*this, type, invocations, spv::BuiltIn::ClipDistance); |         clip_distances = DefineOutput(*this, type, invocations, spv::BuiltIn::ClipDistance); | ||||||
|     } |     } | ||||||
|     if (info.stores_layer && |     if (info.stores_layer && | ||||||
|  | @ -1136,7 +1135,7 @@ void EmitContext::DefineOutputs(const IR::Program& program) { | ||||||
|         viewport_index = DefineOutput(*this, U32[1], invocations, spv::BuiltIn::ViewportIndex); |         viewport_index = DefineOutput(*this, U32[1], invocations, spv::BuiltIn::ViewportIndex); | ||||||
|     } |     } | ||||||
|     if (info.stores_viewport_mask && profile.support_viewport_mask) { |     if (info.stores_viewport_mask && profile.support_viewport_mask) { | ||||||
|         viewport_mask = DefineOutput(*this, TypeArray(U32[1], Constant(U32[1], 1u)), std::nullopt); |         viewport_mask = DefineOutput(*this, TypeArray(U32[1], Const(1u)), std::nullopt); | ||||||
|     } |     } | ||||||
|     for (size_t index = 0; index < info.stores_generics.size(); ++index) { |     for (size_t index = 0; index < info.stores_generics.size(); ++index) { | ||||||
|         if (info.stores_generics[index]) { |         if (info.stores_generics[index]) { | ||||||
|  | @ -1146,13 +1145,13 @@ void EmitContext::DefineOutputs(const IR::Program& program) { | ||||||
|     switch (stage) { |     switch (stage) { | ||||||
|     case Stage::TessellationControl: |     case Stage::TessellationControl: | ||||||
|         if (info.stores_tess_level_outer) { |         if (info.stores_tess_level_outer) { | ||||||
|             const Id type{TypeArray(F32[1], Constant(U32[1], 4))}; |             const Id type{TypeArray(F32[1], Const(4U))}; | ||||||
|             output_tess_level_outer = |             output_tess_level_outer = | ||||||
|                 DefineOutput(*this, type, std::nullopt, spv::BuiltIn::TessLevelOuter); |                 DefineOutput(*this, type, std::nullopt, spv::BuiltIn::TessLevelOuter); | ||||||
|             Decorate(output_tess_level_outer, spv::Decoration::Patch); |             Decorate(output_tess_level_outer, spv::Decoration::Patch); | ||||||
|         } |         } | ||||||
|         if (info.stores_tess_level_inner) { |         if (info.stores_tess_level_inner) { | ||||||
|             const Id type{TypeArray(F32[1], Constant(U32[1], 2))}; |             const Id type{TypeArray(F32[1], Const(2U))}; | ||||||
|             output_tess_level_inner = |             output_tess_level_inner = | ||||||
|                 DefineOutput(*this, type, std::nullopt, spv::BuiltIn::TessLevelInner); |                 DefineOutput(*this, type, std::nullopt, spv::BuiltIn::TessLevelInner); | ||||||
|             Decorate(output_tess_level_inner, spv::Decoration::Patch); |             Decorate(output_tess_level_inner, spv::Decoration::Patch); | ||||||
|  |  | ||||||
|  | @ -114,7 +114,7 @@ public: | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     Id Const(u32 element_1, u32 element_2, u32 element_3, u32 element_4) { |     Id Const(u32 element_1, u32 element_2, u32 element_3, u32 element_4) { | ||||||
|         return ConstantComposite(U32[2], Const(element_1), Const(element_2), Const(element_3), |         return ConstantComposite(U32[4], Const(element_1), Const(element_2), Const(element_3), | ||||||
|                                  Const(element_4)); |                                  Const(element_4)); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -7,10 +7,10 @@ | ||||||
| namespace Shader::Backend::SPIRV { | namespace Shader::Backend::SPIRV { | ||||||
| namespace { | namespace { | ||||||
| Id SharedPointer(EmitContext& ctx, Id offset, u32 index_offset = 0) { | Id SharedPointer(EmitContext& ctx, Id offset, u32 index_offset = 0) { | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift_id{ctx.Const(2U)}; | ||||||
|     Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     if (index_offset > 0) { |     if (index_offset > 0) { | ||||||
|         index = ctx.OpIAdd(ctx.U32[1], index, ctx.Constant(ctx.U32[1], index_offset)); |         index = ctx.OpIAdd(ctx.U32[1], index, ctx.Const(index_offset)); | ||||||
|     } |     } | ||||||
|     return ctx.profile.support_explicit_workgroup_layout |     return ctx.profile.support_explicit_workgroup_layout | ||||||
|                ? ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, ctx.u32_zero_value, index) |                ? ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, ctx.u32_zero_value, index) | ||||||
|  | @ -20,14 +20,14 @@ Id SharedPointer(EmitContext& ctx, Id offset, u32 index_offset = 0) { | ||||||
| Id StorageIndex(EmitContext& ctx, const IR::Value& offset, size_t element_size) { | Id StorageIndex(EmitContext& ctx, const IR::Value& offset, size_t element_size) { | ||||||
|     if (offset.IsImmediate()) { |     if (offset.IsImmediate()) { | ||||||
|         const u32 imm_offset{static_cast<u32>(offset.U32() / element_size)}; |         const u32 imm_offset{static_cast<u32>(offset.U32() / element_size)}; | ||||||
|         return ctx.Constant(ctx.U32[1], imm_offset); |         return ctx.Const(imm_offset); | ||||||
|     } |     } | ||||||
|     const u32 shift{static_cast<u32>(std::countr_zero(element_size))}; |     const u32 shift{static_cast<u32>(std::countr_zero(element_size))}; | ||||||
|     const Id index{ctx.Def(offset)}; |     const Id index{ctx.Def(offset)}; | ||||||
|     if (shift == 0) { |     if (shift == 0) { | ||||||
|         return index; |         return index; | ||||||
|     } |     } | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], shift)}; |     const Id shift_id{ctx.Const(shift)}; | ||||||
|     return ctx.OpShiftRightLogical(ctx.U32[1], index, shift_id); |     return ctx.OpShiftRightLogical(ctx.U32[1], index, shift_id); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | @ -43,7 +43,7 @@ Id StoragePointer(EmitContext& ctx, const StorageTypeDefinition& type_def, | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| std::pair<Id, Id> AtomicArgs(EmitContext& ctx) { | std::pair<Id, Id> AtomicArgs(EmitContext& ctx) { | ||||||
|     const Id scope{ctx.Constant(ctx.U32[1], static_cast<u32>(spv::Scope::Device))}; |     const Id scope{ctx.Const(static_cast<u32>(spv::Scope::Device))}; | ||||||
|     const Id semantics{ctx.u32_zero_value}; |     const Id semantics{ctx.u32_zero_value}; | ||||||
|     return {scope, semantics}; |     return {scope, semantics}; | ||||||
| } | } | ||||||
|  | @ -103,13 +103,13 @@ Id EmitSharedAtomicUMax32(EmitContext& ctx, Id offset, Id value) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitSharedAtomicInc32(EmitContext& ctx, Id offset, Id value) { | Id EmitSharedAtomicInc32(EmitContext& ctx, Id offset, Id value) { | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift_id{ctx.Const(2U)}; | ||||||
|     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     return ctx.OpFunctionCall(ctx.U32[1], ctx.increment_cas_shared, index, value); |     return ctx.OpFunctionCall(ctx.U32[1], ctx.increment_cas_shared, index, value); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitSharedAtomicDec32(EmitContext& ctx, Id offset, Id value) { | Id EmitSharedAtomicDec32(EmitContext& ctx, Id offset, Id value) { | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift_id{ctx.Const(2U)}; | ||||||
|     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     return ctx.OpFunctionCall(ctx.U32[1], ctx.decrement_cas_shared, index, value); |     return ctx.OpFunctionCall(ctx.U32[1], ctx.decrement_cas_shared, index, value); | ||||||
| } | } | ||||||
|  | @ -132,7 +132,7 @@ Id EmitSharedAtomicExchange32(EmitContext& ctx, Id offset, Id value) { | ||||||
| 
 | 
 | ||||||
| Id EmitSharedAtomicExchange64(EmitContext& ctx, Id offset, Id value) { | Id EmitSharedAtomicExchange64(EmitContext& ctx, Id offset, Id value) { | ||||||
|     if (ctx.profile.support_int64_atomics && ctx.profile.support_explicit_workgroup_layout) { |     if (ctx.profile.support_int64_atomics && ctx.profile.support_explicit_workgroup_layout) { | ||||||
|         const Id shift_id{ctx.Constant(ctx.U32[1], 3U)}; |         const Id shift_id{ctx.Const(3U)}; | ||||||
|         const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |         const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|         const Id pointer{ |         const Id pointer{ | ||||||
|             ctx.OpAccessChain(ctx.shared_u64, ctx.shared_memory_u64, ctx.u32_zero_value, index)}; |             ctx.OpAccessChain(ctx.shared_u64, ctx.shared_memory_u64, ctx.u32_zero_value, index)}; | ||||||
|  |  | ||||||
|  | @ -12,8 +12,7 @@ void MemoryBarrier(EmitContext& ctx, spv::Scope scope) { | ||||||
|         spv::MemorySemanticsMask::AcquireRelease | spv::MemorySemanticsMask::UniformMemory | |         spv::MemorySemanticsMask::AcquireRelease | spv::MemorySemanticsMask::UniformMemory | | ||||||
|         spv::MemorySemanticsMask::WorkgroupMemory | spv::MemorySemanticsMask::AtomicCounterMemory | |         spv::MemorySemanticsMask::WorkgroupMemory | spv::MemorySemanticsMask::AtomicCounterMemory | | ||||||
|         spv::MemorySemanticsMask::ImageMemory}; |         spv::MemorySemanticsMask::ImageMemory}; | ||||||
|     ctx.OpMemoryBarrier(ctx.Constant(ctx.U32[1], static_cast<u32>(scope)), |     ctx.OpMemoryBarrier(ctx.Const(static_cast<u32>(scope)), ctx.Const(static_cast<u32>(semantics))); | ||||||
|                         ctx.Constant(ctx.U32[1], static_cast<u32>(semantics))); |  | ||||||
| } | } | ||||||
| } // Anonymous namespace
 | } // Anonymous namespace
 | ||||||
| 
 | 
 | ||||||
|  | @ -22,9 +21,9 @@ void EmitBarrier(EmitContext& ctx) { | ||||||
|     const auto memory{spv::Scope::Workgroup}; |     const auto memory{spv::Scope::Workgroup}; | ||||||
|     const auto memory_semantics{spv::MemorySemanticsMask::AcquireRelease | |     const auto memory_semantics{spv::MemorySemanticsMask::AcquireRelease | | ||||||
|                                 spv::MemorySemanticsMask::WorkgroupMemory}; |                                 spv::MemorySemanticsMask::WorkgroupMemory}; | ||||||
|     ctx.OpControlBarrier(ctx.Constant(ctx.U32[1], static_cast<u32>(execution)), |     ctx.OpControlBarrier(ctx.Const(static_cast<u32>(execution)), | ||||||
|                          ctx.Constant(ctx.U32[1], static_cast<u32>(memory)), |                          ctx.Const(static_cast<u32>(memory)), | ||||||
|                          ctx.Constant(ctx.U32[1], static_cast<u32>(memory_semantics))); |                          ctx.Const(static_cast<u32>(memory_semantics))); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void EmitWorkgroupMemoryBarrier(EmitContext& ctx) { | void EmitWorkgroupMemoryBarrier(EmitContext& ctx) { | ||||||
|  |  | ||||||
|  | @ -69,7 +69,7 @@ std::optional<OutAttr> OutputAttrPointer(EmitContext& ctx, IR::Attribute attr) { | ||||||
|             return info.id; |             return info.id; | ||||||
|         } else { |         } else { | ||||||
|             const u32 index_element{element - info.first_element}; |             const u32 index_element{element - info.first_element}; | ||||||
|             const Id index_id{ctx.Constant(ctx.U32[1], index_element)}; |             const Id index_id{ctx.Const(index_element)}; | ||||||
|             return OutputAccessChain(ctx, ctx.output_f32, info.id, index_id); |             return OutputAccessChain(ctx, ctx.output_f32, info.id, index_id); | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|  | @ -81,7 +81,7 @@ std::optional<OutAttr> OutputAttrPointer(EmitContext& ctx, IR::Attribute attr) { | ||||||
|     case IR::Attribute::PositionZ: |     case IR::Attribute::PositionZ: | ||||||
|     case IR::Attribute::PositionW: { |     case IR::Attribute::PositionW: { | ||||||
|         const u32 element{static_cast<u32>(attr) % 4}; |         const u32 element{static_cast<u32>(attr) % 4}; | ||||||
|         const Id element_id{ctx.Constant(ctx.U32[1], element)}; |         const Id element_id{ctx.Const(element)}; | ||||||
|         return OutputAccessChain(ctx, ctx.output_f32, ctx.output_position, element_id); |         return OutputAccessChain(ctx, ctx.output_f32, ctx.output_position, element_id); | ||||||
|     } |     } | ||||||
|     case IR::Attribute::ClipDistance0: |     case IR::Attribute::ClipDistance0: | ||||||
|  | @ -94,7 +94,7 @@ std::optional<OutAttr> OutputAttrPointer(EmitContext& ctx, IR::Attribute attr) { | ||||||
|     case IR::Attribute::ClipDistance7: { |     case IR::Attribute::ClipDistance7: { | ||||||
|         const u32 base{static_cast<u32>(IR::Attribute::ClipDistance0)}; |         const u32 base{static_cast<u32>(IR::Attribute::ClipDistance0)}; | ||||||
|         const u32 index{static_cast<u32>(attr) - base}; |         const u32 index{static_cast<u32>(attr) - base}; | ||||||
|         const Id clip_num{ctx.Constant(ctx.U32[1], index)}; |         const Id clip_num{ctx.Const(index)}; | ||||||
|         return OutputAccessChain(ctx, ctx.output_f32, ctx.clip_distances, clip_num); |         return OutputAccessChain(ctx, ctx.output_f32, ctx.clip_distances, clip_num); | ||||||
|     } |     } | ||||||
|     case IR::Attribute::Layer: |     case IR::Attribute::Layer: | ||||||
|  | @ -131,7 +131,7 @@ Id GetCbuf(EmitContext& ctx, Id result_type, Id UniformDefinitions::*member_ptr, | ||||||
|         Id index{ctx.Def(offset)}; |         Id index{ctx.Def(offset)}; | ||||||
|         if (element_size > 1) { |         if (element_size > 1) { | ||||||
|             const u32 log2_element_size{static_cast<u32>(std::countr_zero(element_size))}; |             const u32 log2_element_size{static_cast<u32>(std::countr_zero(element_size))}; | ||||||
|             const Id shift{ctx.Constant(ctx.U32[1], log2_element_size)}; |             const Id shift{ctx.Const(log2_element_size)}; | ||||||
|             index = ctx.OpShiftRightArithmetic(ctx.U32[1], ctx.Def(offset), shift); |             index = ctx.OpShiftRightArithmetic(ctx.U32[1], ctx.Def(offset), shift); | ||||||
|         } |         } | ||||||
|         const Id access_chain{ctx.OpAccessChain(uniform_type, cbuf, ctx.u32_zero_value, index)}; |         const Id access_chain{ctx.OpAccessChain(uniform_type, cbuf, ctx.u32_zero_value, index)}; | ||||||
|  | @ -140,7 +140,7 @@ Id GetCbuf(EmitContext& ctx, Id result_type, Id UniformDefinitions::*member_ptr, | ||||||
|     if (offset.U32() % element_size != 0) { |     if (offset.U32() % element_size != 0) { | ||||||
|         throw NotImplementedException("Unaligned immediate constant buffer load"); |         throw NotImplementedException("Unaligned immediate constant buffer load"); | ||||||
|     } |     } | ||||||
|     const Id imm_offset{ctx.Constant(ctx.U32[1], offset.U32() / element_size)}; |     const Id imm_offset{ctx.Const(offset.U32() / element_size)}; | ||||||
|     const Id access_chain{ctx.OpAccessChain(uniform_type, cbuf, ctx.u32_zero_value, imm_offset)}; |     const Id access_chain{ctx.OpAccessChain(uniform_type, cbuf, ctx.u32_zero_value, imm_offset)}; | ||||||
|     return ctx.OpLoad(result_type, access_chain); |     return ctx.OpLoad(result_type, access_chain); | ||||||
| } | } | ||||||
|  | @ -212,13 +212,13 @@ Id EmitGetCbufU32x2(EmitContext& ctx, const IR::Value& binding, const IR::Value& | ||||||
| 
 | 
 | ||||||
| Id EmitGetAttribute(EmitContext& ctx, IR::Attribute attr, Id vertex) { | Id EmitGetAttribute(EmitContext& ctx, IR::Attribute attr, Id vertex) { | ||||||
|     const u32 element{static_cast<u32>(attr) % 4}; |     const u32 element{static_cast<u32>(attr) % 4}; | ||||||
|     const auto element_id{[&] { return ctx.Constant(ctx.U32[1], element); }}; |     const auto element_id{[&] { return ctx.Const(element); }}; | ||||||
|     if (IR::IsGeneric(attr)) { |     if (IR::IsGeneric(attr)) { | ||||||
|         const u32 index{IR::GenericAttributeIndex(attr)}; |         const u32 index{IR::GenericAttributeIndex(attr)}; | ||||||
|         const std::optional<AttrInfo> type{AttrTypes(ctx, index)}; |         const std::optional<AttrInfo> type{AttrTypes(ctx, index)}; | ||||||
|         if (!type) { |         if (!type) { | ||||||
|             // Attribute is disabled
 |             // Attribute is disabled
 | ||||||
|             return ctx.Constant(ctx.F32[1], 0.0f); |             return ctx.Const(0.0f); | ||||||
|         } |         } | ||||||
|         const Id generic_id{ctx.input_generics.at(index)}; |         const Id generic_id{ctx.input_generics.at(index)}; | ||||||
|         const Id pointer{AttrPointer(ctx, type->pointer, vertex, generic_id, element_id())}; |         const Id pointer{AttrPointer(ctx, type->pointer, vertex, generic_id, element_id())}; | ||||||
|  | @ -252,20 +252,19 @@ Id EmitGetAttribute(EmitContext& ctx, IR::Attribute attr, Id vertex) { | ||||||
|         } |         } | ||||||
|     case IR::Attribute::FrontFace: |     case IR::Attribute::FrontFace: | ||||||
|         return ctx.OpSelect(ctx.U32[1], ctx.OpLoad(ctx.U1, ctx.front_face), |         return ctx.OpSelect(ctx.U32[1], ctx.OpLoad(ctx.U1, ctx.front_face), | ||||||
|                             ctx.Constant(ctx.U32[1], std::numeric_limits<u32>::max()), |                             ctx.Const(std::numeric_limits<u32>::max()), ctx.u32_zero_value); | ||||||
|                             ctx.u32_zero_value); |  | ||||||
|     case IR::Attribute::PointSpriteS: |     case IR::Attribute::PointSpriteS: | ||||||
|         return ctx.OpLoad(ctx.F32[1], |         return ctx.OpLoad(ctx.F32[1], | ||||||
|                           ctx.OpAccessChain(ctx.input_f32, ctx.point_coord, ctx.u32_zero_value)); |                           ctx.OpAccessChain(ctx.input_f32, ctx.point_coord, ctx.u32_zero_value)); | ||||||
|     case IR::Attribute::PointSpriteT: |     case IR::Attribute::PointSpriteT: | ||||||
|         return ctx.OpLoad(ctx.F32[1], ctx.OpAccessChain(ctx.input_f32, ctx.point_coord, |         return ctx.OpLoad(ctx.F32[1], | ||||||
|                                                         ctx.Constant(ctx.U32[1], 1U))); |                           ctx.OpAccessChain(ctx.input_f32, ctx.point_coord, ctx.Const(1U))); | ||||||
|     case IR::Attribute::TessellationEvaluationPointU: |     case IR::Attribute::TessellationEvaluationPointU: | ||||||
|         return ctx.OpLoad(ctx.F32[1], |         return ctx.OpLoad(ctx.F32[1], | ||||||
|                           ctx.OpAccessChain(ctx.input_f32, ctx.tess_coord, ctx.u32_zero_value)); |                           ctx.OpAccessChain(ctx.input_f32, ctx.tess_coord, ctx.u32_zero_value)); | ||||||
|     case IR::Attribute::TessellationEvaluationPointV: |     case IR::Attribute::TessellationEvaluationPointV: | ||||||
|         return ctx.OpLoad(ctx.F32[1], ctx.OpAccessChain(ctx.input_f32, ctx.tess_coord, |         return ctx.OpLoad(ctx.F32[1], | ||||||
|                                                         ctx.Constant(ctx.U32[1], 1U))); |                           ctx.OpAccessChain(ctx.input_f32, ctx.tess_coord, ctx.Const(1U))); | ||||||
| 
 | 
 | ||||||
|     default: |     default: | ||||||
|         throw NotImplementedException("Read attribute {}", attr); |         throw NotImplementedException("Read attribute {}", attr); | ||||||
|  | @ -303,7 +302,7 @@ Id EmitGetPatch(EmitContext& ctx, IR::Patch patch) { | ||||||
|         throw NotImplementedException("Non-generic patch load"); |         throw NotImplementedException("Non-generic patch load"); | ||||||
|     } |     } | ||||||
|     const u32 index{IR::GenericPatchIndex(patch)}; |     const u32 index{IR::GenericPatchIndex(patch)}; | ||||||
|     const Id element{ctx.Constant(ctx.U32[1], IR::GenericPatchElement(patch))}; |     const Id element{ctx.Const(IR::GenericPatchElement(patch))}; | ||||||
|     const Id pointer{ctx.OpAccessChain(ctx.input_f32, ctx.patches.at(index), element)}; |     const Id pointer{ctx.OpAccessChain(ctx.input_f32, ctx.patches.at(index), element)}; | ||||||
|     return ctx.OpLoad(ctx.F32[1], pointer); |     return ctx.OpLoad(ctx.F32[1], pointer); | ||||||
| } | } | ||||||
|  | @ -312,7 +311,7 @@ void EmitSetPatch(EmitContext& ctx, IR::Patch patch, Id value) { | ||||||
|     const Id pointer{[&] { |     const Id pointer{[&] { | ||||||
|         if (IR::IsGeneric(patch)) { |         if (IR::IsGeneric(patch)) { | ||||||
|             const u32 index{IR::GenericPatchIndex(patch)}; |             const u32 index{IR::GenericPatchIndex(patch)}; | ||||||
|             const Id element{ctx.Constant(ctx.U32[1], IR::GenericPatchElement(patch))}; |             const Id element{ctx.Const(IR::GenericPatchElement(patch))}; | ||||||
|             return ctx.OpAccessChain(ctx.output_f32, ctx.patches.at(index), element); |             return ctx.OpAccessChain(ctx.output_f32, ctx.patches.at(index), element); | ||||||
|         } |         } | ||||||
|         switch (patch) { |         switch (patch) { | ||||||
|  | @ -321,15 +320,14 @@ void EmitSetPatch(EmitContext& ctx, IR::Patch patch, Id value) { | ||||||
|         case IR::Patch::TessellationLodTop: |         case IR::Patch::TessellationLodTop: | ||||||
|         case IR::Patch::TessellationLodBottom: { |         case IR::Patch::TessellationLodBottom: { | ||||||
|             const u32 index{static_cast<u32>(patch) - u32(IR::Patch::TessellationLodLeft)}; |             const u32 index{static_cast<u32>(patch) - u32(IR::Patch::TessellationLodLeft)}; | ||||||
|             const Id index_id{ctx.Constant(ctx.U32[1], index)}; |             const Id index_id{ctx.Const(index)}; | ||||||
|             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_outer, index_id); |             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_outer, index_id); | ||||||
|         } |         } | ||||||
|         case IR::Patch::TessellationLodInteriorU: |         case IR::Patch::TessellationLodInteriorU: | ||||||
|             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_inner, |             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_inner, | ||||||
|                                      ctx.u32_zero_value); |                                      ctx.u32_zero_value); | ||||||
|         case IR::Patch::TessellationLodInteriorV: |         case IR::Patch::TessellationLodInteriorV: | ||||||
|             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_inner, |             return ctx.OpAccessChain(ctx.output_f32, ctx.output_tess_level_inner, ctx.Const(1u)); | ||||||
|                                      ctx.Constant(ctx.U32[1], 1u)); |  | ||||||
|         default: |         default: | ||||||
|             throw NotImplementedException("Patch {}", patch); |             throw NotImplementedException("Patch {}", patch); | ||||||
|         } |         } | ||||||
|  | @ -338,7 +336,7 @@ void EmitSetPatch(EmitContext& ctx, IR::Patch patch, Id value) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void EmitSetFragColor(EmitContext& ctx, u32 index, u32 component, Id value) { | void EmitSetFragColor(EmitContext& ctx, u32 index, u32 component, Id value) { | ||||||
|     const Id component_id{ctx.Constant(ctx.U32[1], component)}; |     const Id component_id{ctx.Const(component)}; | ||||||
|     const Id pointer{ctx.OpAccessChain(ctx.output_f32, ctx.frag_color.at(index), component_id)}; |     const Id pointer{ctx.OpAccessChain(ctx.output_f32, ctx.frag_color.at(index), component_id)}; | ||||||
|     ctx.OpStore(pointer, value); |     ctx.OpStore(pointer, value); | ||||||
| } | } | ||||||
|  | @ -404,7 +402,7 @@ Id EmitIsHelperInvocation(EmitContext& ctx) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitYDirection(EmitContext& ctx) { | Id EmitYDirection(EmitContext& ctx) { | ||||||
|     return ctx.Constant(ctx.F32[1], ctx.profile.y_negate ? -1.0f : 1.0f); |     return ctx.Const(ctx.profile.y_negate ? -1.0f : 1.0f); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitLoadLocal(EmitContext& ctx, Id word_offset) { | Id EmitLoadLocal(EmitContext& ctx, Id word_offset) { | ||||||
|  |  | ||||||
|  | @ -117,7 +117,7 @@ Id EmitFPLog2(EmitContext& ctx, Id value) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitFPRecip32(EmitContext& ctx, Id value) { | Id EmitFPRecip32(EmitContext& ctx, Id value) { | ||||||
|     return ctx.OpFDiv(ctx.F32[1], ctx.Constant(ctx.F32[1], 1.0f), value); |     return ctx.OpFDiv(ctx.F32[1], ctx.Const(1.0f), value); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitFPRecip64(EmitContext& ctx, Id value) { | Id EmitFPRecip64(EmitContext& ctx, Id value) { | ||||||
|  | @ -143,8 +143,8 @@ Id EmitFPSaturate16(EmitContext& ctx, Id value) { | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitFPSaturate32(EmitContext& ctx, Id value) { | Id EmitFPSaturate32(EmitContext& ctx, Id value) { | ||||||
|     const Id zero{ctx.Constant(ctx.F32[1], f32{0.0})}; |     const Id zero{ctx.Const(f32{0.0})}; | ||||||
|     const Id one{ctx.Constant(ctx.F32[1], f32{1.0})}; |     const Id one{ctx.Const(f32{1.0})}; | ||||||
|     return Clamp(ctx, ctx.F32[1], value, zero, one); |     return Clamp(ctx, ctx.F32[1], value, zero, one); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -45,16 +45,12 @@ public: | ||||||
|         if (opcode != values[1]->GetOpcode() || opcode != IR::Opcode::CompositeConstructU32x4) { |         if (opcode != values[1]->GetOpcode() || opcode != IR::Opcode::CompositeConstructU32x4) { | ||||||
|             throw LogicError("Invalid PTP arguments"); |             throw LogicError("Invalid PTP arguments"); | ||||||
|         } |         } | ||||||
|         auto read{[&](unsigned int a, unsigned int b) { |         auto read{[&](unsigned int a, unsigned int b) { return values[a]->Arg(b).U32(); }}; | ||||||
|             return ctx.Constant(ctx.U32[1], values[a]->Arg(b).U32()); |  | ||||||
|         }}; |  | ||||||
| 
 | 
 | ||||||
|         const Id offsets{ |         const Id offsets{ctx.ConstantComposite( | ||||||
|             ctx.ConstantComposite(ctx.TypeArray(ctx.U32[2], ctx.Constant(ctx.U32[1], 4)), |             ctx.TypeArray(ctx.U32[2], ctx.Const(4U)), ctx.Const(read(0, 0), read(0, 1)), | ||||||
|                                   ctx.ConstantComposite(ctx.U32[2], read(0, 0), read(0, 1)), |             ctx.Const(read(0, 2), read(0, 3)), ctx.Const(read(1, 0), read(1, 1)), | ||||||
|                                   ctx.ConstantComposite(ctx.U32[2], read(0, 2), read(0, 3)), |             ctx.Const(read(1, 2), read(1, 3)))}; | ||||||
|                                   ctx.ConstantComposite(ctx.U32[2], read(1, 0), read(1, 1)), |  | ||||||
|                                   ctx.ConstantComposite(ctx.U32[2], read(1, 2), read(1, 3)))}; |  | ||||||
|         Add(spv::ImageOperandsMask::ConstOffsets, offsets); |         Add(spv::ImageOperandsMask::ConstOffsets, offsets); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  | @ -108,7 +104,7 @@ private: | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|         if (offset.IsImmediate()) { |         if (offset.IsImmediate()) { | ||||||
|             Add(spv::ImageOperandsMask::ConstOffset, ctx.Constant(ctx.U32[1], offset.U32())); |             Add(spv::ImageOperandsMask::ConstOffset, ctx.Const(offset.U32())); | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|         IR::Inst* const inst{offset.InstRecursive()}; |         IR::Inst* const inst{offset.InstRecursive()}; | ||||||
|  | @ -361,9 +357,8 @@ Id EmitImageGather(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id | ||||||
|     const auto info{inst->Flags<IR::TextureInstInfo>()}; |     const auto info{inst->Flags<IR::TextureInstInfo>()}; | ||||||
|     const ImageOperands operands(ctx, offset, offset2); |     const ImageOperands operands(ctx, offset, offset2); | ||||||
|     return Emit(&EmitContext::OpImageSparseGather, &EmitContext::OpImageGather, ctx, inst, |     return Emit(&EmitContext::OpImageSparseGather, &EmitContext::OpImageGather, ctx, inst, | ||||||
|                 ctx.F32[4], Texture(ctx, index), coords, |                 ctx.F32[4], Texture(ctx, index), coords, ctx.Const(info.gather_component), | ||||||
|                 ctx.Constant(ctx.U32[1], info.gather_component.Value()), operands.Mask(), |                 operands.Mask(), operands.Span()); | ||||||
|                 operands.Span()); |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitImageGatherDref(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | Id EmitImageGatherDref(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||||
|  |  | ||||||
|  | @ -44,7 +44,7 @@ Id EmitIAdd32(EmitContext& ctx, IR::Inst* inst, Id a, Id b) { | ||||||
|         // https://stackoverflow.com/questions/55468823/how-to-detect-integer-overflow-in-c
 |         // https://stackoverflow.com/questions/55468823/how-to-detect-integer-overflow-in-c
 | ||||||
|         constexpr u32 s32_max{static_cast<u32>(std::numeric_limits<s32>::max())}; |         constexpr u32 s32_max{static_cast<u32>(std::numeric_limits<s32>::max())}; | ||||||
|         const Id is_positive{ctx.OpSGreaterThanEqual(ctx.U1, a, ctx.u32_zero_value)}; |         const Id is_positive{ctx.OpSGreaterThanEqual(ctx.U1, a, ctx.u32_zero_value)}; | ||||||
|         const Id sub_a{ctx.OpISub(ctx.U32[1], ctx.Constant(ctx.U32[1], s32_max), a)}; |         const Id sub_a{ctx.OpISub(ctx.U32[1], ctx.Const(s32_max), a)}; | ||||||
| 
 | 
 | ||||||
|         const Id positive_test{ctx.OpSGreaterThan(ctx.U1, b, sub_a)}; |         const Id positive_test{ctx.OpSGreaterThan(ctx.U1, b, sub_a)}; | ||||||
|         const Id negative_test{ctx.OpSLessThan(ctx.U1, b, sub_a)}; |         const Id negative_test{ctx.OpSLessThan(ctx.U1, b, sub_a)}; | ||||||
|  |  | ||||||
|  | @ -11,14 +11,14 @@ namespace { | ||||||
| Id StorageIndex(EmitContext& ctx, const IR::Value& offset, size_t element_size) { | Id StorageIndex(EmitContext& ctx, const IR::Value& offset, size_t element_size) { | ||||||
|     if (offset.IsImmediate()) { |     if (offset.IsImmediate()) { | ||||||
|         const u32 imm_offset{static_cast<u32>(offset.U32() / element_size)}; |         const u32 imm_offset{static_cast<u32>(offset.U32() / element_size)}; | ||||||
|         return ctx.Constant(ctx.U32[1], imm_offset); |         return ctx.Const(imm_offset); | ||||||
|     } |     } | ||||||
|     const u32 shift{static_cast<u32>(std::countr_zero(element_size))}; |     const u32 shift{static_cast<u32>(std::countr_zero(element_size))}; | ||||||
|     const Id index{ctx.Def(offset)}; |     const Id index{ctx.Def(offset)}; | ||||||
|     if (shift == 0) { |     if (shift == 0) { | ||||||
|         return index; |         return index; | ||||||
|     } |     } | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], shift)}; |     const Id shift_id{ctx.Const(shift)}; | ||||||
|     return ctx.OpShiftRightLogical(ctx.U32[1], index, shift_id); |     return ctx.OpShiftRightLogical(ctx.U32[1], index, shift_id); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -7,22 +7,22 @@ | ||||||
| namespace Shader::Backend::SPIRV { | namespace Shader::Backend::SPIRV { | ||||||
| namespace { | namespace { | ||||||
| Id Pointer(EmitContext& ctx, Id pointer_type, Id array, Id offset, u32 shift) { | Id Pointer(EmitContext& ctx, Id pointer_type, Id array, Id offset, u32 shift) { | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], shift)}; |     const Id shift_id{ctx.Const(shift)}; | ||||||
|     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     return ctx.OpAccessChain(pointer_type, array, ctx.u32_zero_value, index); |     return ctx.OpAccessChain(pointer_type, array, ctx.u32_zero_value, index); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id Word(EmitContext& ctx, Id offset) { | Id Word(EmitContext& ctx, Id offset) { | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift_id{ctx.Const(2U)}; | ||||||
|     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     const Id index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; |     const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; | ||||||
|     return ctx.OpLoad(ctx.U32[1], pointer); |     return ctx.OpLoad(ctx.U32[1], pointer); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| std::pair<Id, Id> ExtractArgs(EmitContext& ctx, Id offset, u32 mask, u32 count) { | std::pair<Id, Id> ExtractArgs(EmitContext& ctx, Id offset, u32 mask, u32 count) { | ||||||
|     const Id shift{ctx.OpShiftLeftLogical(ctx.U32[1], offset, ctx.Constant(ctx.U32[1], 3U))}; |     const Id shift{ctx.OpShiftLeftLogical(ctx.U32[1], offset, ctx.Const(3U))}; | ||||||
|     const Id bit{ctx.OpBitwiseAnd(ctx.U32[1], shift, ctx.Constant(ctx.U32[1], mask))}; |     const Id bit{ctx.OpBitwiseAnd(ctx.U32[1], shift, ctx.Const(mask))}; | ||||||
|     const Id count_id{ctx.Constant(ctx.U32[1], count)}; |     const Id count_id{ctx.Const(count)}; | ||||||
|     return {bit, count_id}; |     return {bit, count_id}; | ||||||
| } | } | ||||||
| } // Anonymous namespace
 | } // Anonymous namespace
 | ||||||
|  | @ -83,9 +83,9 @@ Id EmitLoadSharedU64(EmitContext& ctx, Id offset) { | ||||||
|         const Id pointer{Pointer(ctx, ctx.shared_u32x2, ctx.shared_memory_u32x2, offset, 3)}; |         const Id pointer{Pointer(ctx, ctx.shared_u32x2, ctx.shared_memory_u32x2, offset, 3)}; | ||||||
|         return ctx.OpLoad(ctx.U32[2], pointer); |         return ctx.OpLoad(ctx.U32[2], pointer); | ||||||
|     } else { |     } else { | ||||||
|         const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |         const Id shift_id{ctx.Const(2U)}; | ||||||
|         const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |         const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|         const Id next_index{ctx.OpIAdd(ctx.U32[1], base_index, ctx.Constant(ctx.U32[1], 1U))}; |         const Id next_index{ctx.OpIAdd(ctx.U32[1], base_index, ctx.Const(1U))}; | ||||||
|         const Id lhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, base_index)}; |         const Id lhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, base_index)}; | ||||||
|         const Id rhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, next_index)}; |         const Id rhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, next_index)}; | ||||||
|         return ctx.OpCompositeConstruct(ctx.U32[2], ctx.OpLoad(ctx.U32[1], lhs_pointer), |         return ctx.OpCompositeConstruct(ctx.U32[2], ctx.OpLoad(ctx.U32[1], lhs_pointer), | ||||||
|  | @ -98,12 +98,11 @@ Id EmitLoadSharedU128(EmitContext& ctx, Id offset) { | ||||||
|         const Id pointer{Pointer(ctx, ctx.shared_u32x4, ctx.shared_memory_u32x4, offset, 4)}; |         const Id pointer{Pointer(ctx, ctx.shared_u32x4, ctx.shared_memory_u32x4, offset, 4)}; | ||||||
|         return ctx.OpLoad(ctx.U32[4], pointer); |         return ctx.OpLoad(ctx.U32[4], pointer); | ||||||
|     } |     } | ||||||
|     const Id shift_id{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift_id{ctx.Const(2U)}; | ||||||
|     const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; |     const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift_id)}; | ||||||
|     std::array<Id, 4> values{}; |     std::array<Id, 4> values{}; | ||||||
|     for (u32 i = 0; i < 4; ++i) { |     for (u32 i = 0; i < 4; ++i) { | ||||||
|         const Id index{i == 0 ? base_index |         const Id index{i == 0 ? base_index : ctx.OpIAdd(ctx.U32[1], base_index, ctx.Const(i))}; | ||||||
|                               : ctx.OpIAdd(ctx.U32[1], base_index, ctx.Constant(ctx.U32[1], i))}; |  | ||||||
|         const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; |         const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; | ||||||
|         values[i] = ctx.OpLoad(ctx.U32[1], pointer); |         values[i] = ctx.OpLoad(ctx.U32[1], pointer); | ||||||
|     } |     } | ||||||
|  | @ -134,7 +133,7 @@ void EmitWriteSharedU32(EmitContext& ctx, Id offset, Id value) { | ||||||
|     if (ctx.profile.support_explicit_workgroup_layout) { |     if (ctx.profile.support_explicit_workgroup_layout) { | ||||||
|         pointer = Pointer(ctx, ctx.shared_u32, ctx.shared_memory_u32, offset, 2); |         pointer = Pointer(ctx, ctx.shared_u32, ctx.shared_memory_u32, offset, 2); | ||||||
|     } else { |     } else { | ||||||
|         const Id shift{ctx.Constant(ctx.U32[1], 2U)}; |         const Id shift{ctx.Const(2U)}; | ||||||
|         const Id word_offset{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; |         const Id word_offset{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; | ||||||
|         pointer = ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, word_offset); |         pointer = ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, word_offset); | ||||||
|     } |     } | ||||||
|  | @ -147,9 +146,9 @@ void EmitWriteSharedU64(EmitContext& ctx, Id offset, Id value) { | ||||||
|         ctx.OpStore(pointer, value); |         ctx.OpStore(pointer, value); | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     const Id shift{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift{ctx.Const(2U)}; | ||||||
|     const Id word_offset{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; |     const Id word_offset{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; | ||||||
|     const Id next_offset{ctx.OpIAdd(ctx.U32[1], word_offset, ctx.Constant(ctx.U32[1], 1U))}; |     const Id next_offset{ctx.OpIAdd(ctx.U32[1], word_offset, ctx.Const(1U))}; | ||||||
|     const Id lhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, word_offset)}; |     const Id lhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, word_offset)}; | ||||||
|     const Id rhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, next_offset)}; |     const Id rhs_pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, next_offset)}; | ||||||
|     ctx.OpStore(lhs_pointer, ctx.OpCompositeExtract(ctx.U32[1], value, 0U)); |     ctx.OpStore(lhs_pointer, ctx.OpCompositeExtract(ctx.U32[1], value, 0U)); | ||||||
|  | @ -162,11 +161,10 @@ void EmitWriteSharedU128(EmitContext& ctx, Id offset, Id value) { | ||||||
|         ctx.OpStore(pointer, value); |         ctx.OpStore(pointer, value); | ||||||
|         return; |         return; | ||||||
|     } |     } | ||||||
|     const Id shift{ctx.Constant(ctx.U32[1], 2U)}; |     const Id shift{ctx.Const(2U)}; | ||||||
|     const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; |     const Id base_index{ctx.OpShiftRightArithmetic(ctx.U32[1], offset, shift)}; | ||||||
|     for (u32 i = 0; i < 4; ++i) { |     for (u32 i = 0; i < 4; ++i) { | ||||||
|         const Id index{i == 0 ? base_index |         const Id index{i == 0 ? base_index : ctx.OpIAdd(ctx.U32[1], base_index, ctx.Const(i))}; | ||||||
|                               : ctx.OpIAdd(ctx.U32[1], base_index, ctx.Constant(ctx.U32[1], i))}; |  | ||||||
|         const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; |         const Id pointer{ctx.OpAccessChain(ctx.shared_u32, ctx.shared_memory_u32, index)}; | ||||||
|         ctx.OpStore(pointer, ctx.OpCompositeExtract(ctx.U32[1], value, i)); |         ctx.OpStore(pointer, ctx.OpCompositeExtract(ctx.U32[1], value, i)); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | @ -19,7 +19,7 @@ void ConvertDepthMode(EmitContext& ctx) { | ||||||
| void SetFixedPipelinePointSize(EmitContext& ctx) { | void SetFixedPipelinePointSize(EmitContext& ctx) { | ||||||
|     if (ctx.profile.fixed_state_point_size) { |     if (ctx.profile.fixed_state_point_size) { | ||||||
|         const float point_size{*ctx.profile.fixed_state_point_size}; |         const float point_size{*ctx.profile.fixed_state_point_size}; | ||||||
|         ctx.OpStore(ctx.output_point_size, ctx.Constant(ctx.F32[1], point_size)); |         ctx.OpStore(ctx.output_point_size, ctx.Const(point_size)); | ||||||
|     } |     } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | @ -75,7 +75,7 @@ void AlphaTest(EmitContext& ctx) { | ||||||
| 
 | 
 | ||||||
|     const Id true_label{ctx.OpLabel()}; |     const Id true_label{ctx.OpLabel()}; | ||||||
|     const Id discard_label{ctx.OpLabel()}; |     const Id discard_label{ctx.OpLabel()}; | ||||||
|     const Id alpha_reference{ctx.Constant(ctx.F32[1], ctx.profile.alpha_test_reference)}; |     const Id alpha_reference{ctx.Const(ctx.profile.alpha_test_reference)}; | ||||||
|     const Id condition{ComparisonFunction(ctx, comparison, alpha, alpha_reference)}; |     const Id condition{ComparisonFunction(ctx, comparison, alpha, alpha_reference)}; | ||||||
| 
 | 
 | ||||||
|     ctx.OpSelectionMerge(true_label, spv::SelectionControlMask::MaskNone); |     ctx.OpSelectionMerge(true_label, spv::SelectionControlMask::MaskNone); | ||||||
|  | @ -88,8 +88,8 @@ void AlphaTest(EmitContext& ctx) { | ||||||
| 
 | 
 | ||||||
| void EmitPrologue(EmitContext& ctx) { | void EmitPrologue(EmitContext& ctx) { | ||||||
|     if (ctx.stage == Stage::VertexB) { |     if (ctx.stage == Stage::VertexB) { | ||||||
|         const Id zero{ctx.Constant(ctx.F32[1], 0.0f)}; |         const Id zero{ctx.Const(0.0f)}; | ||||||
|         const Id one{ctx.Constant(ctx.F32[1], 1.0f)}; |         const Id one{ctx.Const(1.0f)}; | ||||||
|         const Id default_vector{ctx.ConstantComposite(ctx.F32[4], zero, zero, zero, one)}; |         const Id default_vector{ctx.ConstantComposite(ctx.F32[4], zero, zero, zero, one)}; | ||||||
|         ctx.OpStore(ctx.output_position, default_vector); |         ctx.OpStore(ctx.output_position, default_vector); | ||||||
|         for (const auto& info : ctx.output_generics) { |         for (const auto& info : ctx.output_generics) { | ||||||
|  |  | ||||||
|  | @ -54,7 +54,7 @@ Id EmitLaneId(EmitContext& ctx) { | ||||||
|     if (!ctx.profile.warp_size_potentially_larger_than_guest) { |     if (!ctx.profile.warp_size_potentially_larger_than_guest) { | ||||||
|         return id; |         return id; | ||||||
|     } |     } | ||||||
|     return ctx.OpBitwiseAnd(ctx.U32[1], id, ctx.Constant(ctx.U32[1], 31U)); |     return ctx.OpBitwiseAnd(ctx.U32[1], id, ctx.Const(31U)); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitVoteAll(EmitContext& ctx, Id pred) { | Id EmitVoteAll(EmitContext& ctx, Id pred) { | ||||||
|  | @ -168,10 +168,10 @@ Id EmitShuffleButterfly(EmitContext& ctx, IR::Inst* inst, Id value, Id index, Id | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| Id EmitFSwizzleAdd(EmitContext& ctx, Id op_a, Id op_b, Id swizzle) { | Id EmitFSwizzleAdd(EmitContext& ctx, Id op_a, Id op_b, Id swizzle) { | ||||||
|     const Id three{ctx.Constant(ctx.U32[1], 3)}; |     const Id three{ctx.Const(3U)}; | ||||||
|     Id mask{ctx.OpLoad(ctx.U32[1], ctx.subgroup_local_invocation_id)}; |     Id mask{ctx.OpLoad(ctx.U32[1], ctx.subgroup_local_invocation_id)}; | ||||||
|     mask = ctx.OpBitwiseAnd(ctx.U32[1], mask, three); |     mask = ctx.OpBitwiseAnd(ctx.U32[1], mask, three); | ||||||
|     mask = ctx.OpShiftLeftLogical(ctx.U32[1], mask, ctx.Constant(ctx.U32[1], 1)); |     mask = ctx.OpShiftLeftLogical(ctx.U32[1], mask, ctx.Const(1U)); | ||||||
|     mask = ctx.OpShiftRightLogical(ctx.U32[1], swizzle, mask); |     mask = ctx.OpShiftRightLogical(ctx.U32[1], swizzle, mask); | ||||||
|     mask = ctx.OpBitwiseAnd(ctx.U32[1], mask, three); |     mask = ctx.OpBitwiseAnd(ctx.U32[1], mask, three); | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 ameerj
						ameerj