forked from eden-emu/eden
		
	
		
			
				
	
	
		
			1117 lines
		
	
	
	
		
			47 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			1117 lines
		
	
	
	
		
			47 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // Copyright 2021 yuzu Emulator Project
 | |
| // Licensed under GPLv2 or any later version
 | |
| // Refer to the license.txt file included.
 | |
| 
 | |
| #include <algorithm>
 | |
| #include <array>
 | |
| #include <climits>
 | |
| #include <string_view>
 | |
| 
 | |
| #include <fmt/format.h>
 | |
| 
 | |
| #include "common/common_types.h"
 | |
| #include "common/div_ceil.h"
 | |
| #include "shader_recompiler/backend/spirv/emit_context.h"
 | |
| 
 | |
| namespace Shader::Backend::SPIRV {
 | |
| namespace {
 | |
// Value-combining operations for which CasFunction (below) can emit a helper function.
// The helper receives the current value (a) and the operand (b) and returns the new value.
| enum class Operation {
 | |
// Yields 0 when a >= b, otherwise a + 1.
|     Increment,
 | |
// Yields b when a == 0 or a > b, otherwise a - 1.
|     Decrement,
 | |
// Yields OpFAdd(a, b).
|     FPAdd,
 | |
// Yields OpFMin(a, b).
|     FPMin,
 | |
// Yields OpFMax(a, b).
|     FPMax,
 | |
| };
 | |
| 
 | |
// Describes how one generic input attribute is accessed; produced by AttrTypes (below).
| struct AttrInfo {
 | |
// Pointer type used as the result type of the OpAccessChain addressing a component.
|     Id pointer;
 | |
// Scalar type the component is loaded as.
|     Id id;
 | |
// True when the loaded value has to be bitcast to f32 before it is returned.
|     bool needs_cast;
 | |
| };
 | |
| 
 | |
| Id ImageType(EmitContext& ctx, const TextureDescriptor& desc) {
 | |
|     const spv::ImageFormat format{spv::ImageFormat::Unknown};
 | |
|     const Id type{ctx.F32[1]};
 | |
|     const bool depth{desc.is_depth};
 | |
|     switch (desc.type) {
 | |
|     case TextureType::Color1D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim1D, depth, false, false, 1, format);
 | |
|     case TextureType::ColorArray1D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim1D, depth, true, false, 1, format);
 | |
|     case TextureType::Color2D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim2D, depth, false, false, 1, format);
 | |
|     case TextureType::ColorArray2D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim2D, depth, true, false, 1, format);
 | |
|     case TextureType::Color3D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim3D, depth, false, false, 1, format);
 | |
|     case TextureType::ColorCube:
 | |
|         return ctx.TypeImage(type, spv::Dim::Cube, depth, false, false, 1, format);
 | |
|     case TextureType::ColorArrayCube:
 | |
|         return ctx.TypeImage(type, spv::Dim::Cube, depth, true, false, 1, format);
 | |
|     case TextureType::Buffer:
 | |
|         break;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid texture type {}", desc.type);
 | |
| }
 | |
| 
 | |
| spv::ImageFormat GetImageFormat(ImageFormat format) {
 | |
|     switch (format) {
 | |
|     case ImageFormat::Typeless:
 | |
|         return spv::ImageFormat::Unknown;
 | |
|     case ImageFormat::R8_UINT:
 | |
|         return spv::ImageFormat::R8ui;
 | |
|     case ImageFormat::R8_SINT:
 | |
|         return spv::ImageFormat::R8i;
 | |
|     case ImageFormat::R16_UINT:
 | |
|         return spv::ImageFormat::R16ui;
 | |
|     case ImageFormat::R16_SINT:
 | |
|         return spv::ImageFormat::R16i;
 | |
|     case ImageFormat::R32_UINT:
 | |
|         return spv::ImageFormat::R32ui;
 | |
|     case ImageFormat::R32G32_UINT:
 | |
|         return spv::ImageFormat::Rg32ui;
 | |
|     case ImageFormat::R32G32B32A32_UINT:
 | |
|         return spv::ImageFormat::Rgba32ui;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid image format {}", format);
 | |
| }
 | |
| 
 | |
| Id ImageType(EmitContext& ctx, const ImageDescriptor& desc) {
 | |
|     const spv::ImageFormat format{GetImageFormat(desc.format)};
 | |
|     const Id type{ctx.U32[1]};
 | |
|     switch (desc.type) {
 | |
|     case TextureType::Color1D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim1D, false, false, false, 2, format);
 | |
|     case TextureType::ColorArray1D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim1D, false, true, false, 2, format);
 | |
|     case TextureType::Color2D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim2D, false, false, false, 2, format);
 | |
|     case TextureType::ColorArray2D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim2D, false, true, false, 2, format);
 | |
|     case TextureType::Color3D:
 | |
|         return ctx.TypeImage(type, spv::Dim::Dim3D, false, false, false, 2, format);
 | |
|     case TextureType::Buffer:
 | |
|         throw NotImplementedException("Image buffer");
 | |
|     default:
 | |
|         break;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid texture type {}", desc.type);
 | |
| }
 | |
| 
 | |
| Id DefineVariable(EmitContext& ctx, Id type, std::optional<spv::BuiltIn> builtin,
 | |
|                   spv::StorageClass storage_class) {
 | |
|     const Id pointer_type{ctx.TypePointer(storage_class, type)};
 | |
|     const Id id{ctx.AddGlobalVariable(pointer_type, storage_class)};
 | |
|     if (builtin) {
 | |
|         ctx.Decorate(id, spv::Decoration::BuiltIn, *builtin);
 | |
|     }
 | |
|     ctx.interfaces.push_back(id);
 | |
|     return id;
 | |
| }
 | |
| 
 | |
| u32 NumVertices(InputTopology input_topology) {
 | |
|     switch (input_topology) {
 | |
|     case InputTopology::Points:
 | |
|         return 1;
 | |
|     case InputTopology::Lines:
 | |
|         return 2;
 | |
|     case InputTopology::LinesAdjacency:
 | |
|         return 4;
 | |
|     case InputTopology::Triangles:
 | |
|         return 3;
 | |
|     case InputTopology::TrianglesAdjacency:
 | |
|         return 6;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid input topology {}", input_topology);
 | |
| }
 | |
| 
 | |
| Id DefineInput(EmitContext& ctx, Id type, std::optional<spv::BuiltIn> builtin = std::nullopt) {
 | |
|     if (ctx.stage == Stage::Geometry) {
 | |
|         const u32 num_vertices{NumVertices(ctx.profile.input_topology)};
 | |
|         type = ctx.TypeArray(type, ctx.Constant(ctx.U32[1], num_vertices));
 | |
|     }
 | |
|     return DefineVariable(ctx, type, builtin, spv::StorageClass::Input);
 | |
| }
 | |
| 
 | |
| Id DefineOutput(EmitContext& ctx, Id type, std::optional<spv::BuiltIn> builtin = std::nullopt) {
 | |
|     return DefineVariable(ctx, type, builtin, spv::StorageClass::Output);
 | |
| }
 | |
| 
 | |
| void DefineGenericOutput(EmitContext& ctx, size_t index) {
 | |
|     static constexpr std::string_view swizzle{"xyzw"};
 | |
|     const size_t base_attr_index{static_cast<size_t>(IR::Attribute::Generic0X) + index * 4};
 | |
|     u32 element{0};
 | |
|     while (element < 4) {
 | |
|         const u32 remainder{4 - element};
 | |
|         const TransformFeedbackVarying* xfb_varying{};
 | |
|         if (!ctx.profile.xfb_varyings.empty()) {
 | |
|             xfb_varying = &ctx.profile.xfb_varyings[base_attr_index + element];
 | |
|             xfb_varying = xfb_varying && xfb_varying->components > 0 ? xfb_varying : nullptr;
 | |
|         }
 | |
|         const u32 num_components{xfb_varying ? xfb_varying->components : remainder};
 | |
| 
 | |
|         const Id id{DefineOutput(ctx, ctx.F32[num_components])};
 | |
|         ctx.Decorate(id, spv::Decoration::Location, static_cast<u32>(index));
 | |
|         if (element > 0) {
 | |
|             ctx.Decorate(id, spv::Decoration::Component, element);
 | |
|         }
 | |
|         if (xfb_varying) {
 | |
|             ctx.Decorate(id, spv::Decoration::XfbBuffer, xfb_varying->buffer);
 | |
|             ctx.Decorate(id, spv::Decoration::XfbStride, xfb_varying->stride);
 | |
|             ctx.Decorate(id, spv::Decoration::Offset, xfb_varying->offset);
 | |
|         }
 | |
|         if (num_components < 4 || element > 0) {
 | |
|             ctx.Name(id, fmt::format("out_attr{}", index));
 | |
|         } else {
 | |
|             const std::string_view subswizzle{swizzle.substr(element, num_components)};
 | |
|             ctx.Name(id, fmt::format("out_attr{}_{}", index, subswizzle));
 | |
|         }
 | |
|         const GenericElementInfo info{
 | |
|             .id = id,
 | |
|             .first_element = element,
 | |
|             .num_components = num_components,
 | |
|         };
 | |
|         std::fill_n(ctx.output_generics[index].begin(), num_components, info);
 | |
|         element += num_components;
 | |
|     }
 | |
| }
 | |
| 
 | |
| Id GetAttributeType(EmitContext& ctx, AttributeType type) {
 | |
|     switch (type) {
 | |
|     case AttributeType::Float:
 | |
|         return ctx.F32[4];
 | |
|     case AttributeType::SignedInt:
 | |
|         return ctx.TypeVector(ctx.TypeInt(32, true), 4);
 | |
|     case AttributeType::UnsignedInt:
 | |
|         return ctx.U32[4];
 | |
|     case AttributeType::Disabled:
 | |
|         break;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid attribute type {}", type);
 | |
| }
 | |
| 
 | |
| std::optional<AttrInfo> AttrTypes(EmitContext& ctx, u32 index) {
 | |
|     const AttributeType type{ctx.profile.generic_input_types.at(index)};
 | |
|     switch (type) {
 | |
|     case AttributeType::Float:
 | |
|         return AttrInfo{ctx.input_f32, ctx.F32[1], false};
 | |
|     case AttributeType::UnsignedInt:
 | |
|         return AttrInfo{ctx.input_u32, ctx.U32[1], true};
 | |
|     case AttributeType::SignedInt:
 | |
|         return AttrInfo{ctx.input_s32, ctx.TypeInt(32, true), true};
 | |
|     case AttributeType::Disabled:
 | |
|         return std::nullopt;
 | |
|     }
 | |
|     throw InvalidArgument("Invalid attribute type {}", type);
 | |
| }
 | |
| 
 | |
| void DefineConstBuffers(EmitContext& ctx, const Info& info, Id UniformDefinitions::*member_type,
 | |
|                         u32 binding, Id type, char type_char, u32 element_size) {
 | |
|     const Id array_type{ctx.TypeArray(type, ctx.Constant(ctx.U32[1], 65536U / element_size))};
 | |
|     ctx.Decorate(array_type, spv::Decoration::ArrayStride, element_size);
 | |
| 
 | |
|     const Id struct_type{ctx.TypeStruct(array_type)};
 | |
|     ctx.Name(struct_type, fmt::format("cbuf_block_{}{}", type_char, element_size * CHAR_BIT));
 | |
|     ctx.Decorate(struct_type, spv::Decoration::Block);
 | |
|     ctx.MemberName(struct_type, 0, "data");
 | |
|     ctx.MemberDecorate(struct_type, 0, spv::Decoration::Offset, 0U);
 | |
| 
 | |
|     const Id struct_pointer_type{ctx.TypePointer(spv::StorageClass::Uniform, struct_type)};
 | |
|     const Id uniform_type{ctx.TypePointer(spv::StorageClass::Uniform, type)};
 | |
|     ctx.uniform_types.*member_type = uniform_type;
 | |
| 
 | |
|     for (const ConstantBufferDescriptor& desc : info.constant_buffer_descriptors) {
 | |
|         const Id id{ctx.AddGlobalVariable(struct_pointer_type, spv::StorageClass::Uniform)};
 | |
|         ctx.Decorate(id, spv::Decoration::Binding, binding);
 | |
|         ctx.Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         ctx.Name(id, fmt::format("c{}", desc.index));
 | |
|         for (size_t i = 0; i < desc.count; ++i) {
 | |
|             ctx.cbufs[desc.index + i].*member_type = id;
 | |
|         }
 | |
|         if (ctx.profile.supported_spirv >= 0x00010400) {
 | |
|             ctx.interfaces.push_back(id);
 | |
|         }
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void DefineSsbos(EmitContext& ctx, StorageTypeDefinition& type_def,
 | |
|                  Id StorageDefinitions::*member_type, const Info& info, u32 binding, Id type,
 | |
|                  u32 stride) {
 | |
|     const Id array_type{ctx.TypeRuntimeArray(type)};
 | |
|     ctx.Decorate(array_type, spv::Decoration::ArrayStride, stride);
 | |
| 
 | |
|     const Id struct_type{ctx.TypeStruct(array_type)};
 | |
|     ctx.Decorate(struct_type, spv::Decoration::Block);
 | |
|     ctx.MemberDecorate(struct_type, 0, spv::Decoration::Offset, 0U);
 | |
| 
 | |
|     const Id struct_pointer{ctx.TypePointer(spv::StorageClass::StorageBuffer, struct_type)};
 | |
|     type_def.array = struct_pointer;
 | |
|     type_def.element = ctx.TypePointer(spv::StorageClass::StorageBuffer, type);
 | |
| 
 | |
|     u32 index{};
 | |
|     for (const StorageBufferDescriptor& desc : info.storage_buffers_descriptors) {
 | |
|         const Id id{ctx.AddGlobalVariable(struct_pointer, spv::StorageClass::StorageBuffer)};
 | |
|         ctx.Decorate(id, spv::Decoration::Binding, binding);
 | |
|         ctx.Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         ctx.Name(id, fmt::format("ssbo{}", index));
 | |
|         if (ctx.profile.supported_spirv >= 0x00010400) {
 | |
|             ctx.interfaces.push_back(id);
 | |
|         }
 | |
|         for (size_t i = 0; i < desc.count; ++i) {
 | |
|             ctx.ssbos[index + i].*member_type = id;
 | |
|         }
 | |
|         index += desc.count;
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| Id CasFunction(EmitContext& ctx, Operation operation, Id value_type) {
 | |
|     const Id func_type{ctx.TypeFunction(value_type, value_type, value_type)};
 | |
|     const Id func{ctx.OpFunction(value_type, spv::FunctionControlMask::MaskNone, func_type)};
 | |
|     const Id op_a{ctx.OpFunctionParameter(value_type)};
 | |
|     const Id op_b{ctx.OpFunctionParameter(value_type)};
 | |
|     ctx.AddLabel();
 | |
|     Id result{};
 | |
|     switch (operation) {
 | |
|     case Operation::Increment: {
 | |
|         const Id pred{ctx.OpUGreaterThanEqual(ctx.U1, op_a, op_b)};
 | |
|         const Id incr{ctx.OpIAdd(value_type, op_a, ctx.Constant(value_type, 1))};
 | |
|         result = ctx.OpSelect(value_type, pred, ctx.u32_zero_value, incr);
 | |
|         break;
 | |
|     }
 | |
|     case Operation::Decrement: {
 | |
|         const Id lhs{ctx.OpIEqual(ctx.U1, op_a, ctx.Constant(value_type, 0u))};
 | |
|         const Id rhs{ctx.OpUGreaterThan(ctx.U1, op_a, op_b)};
 | |
|         const Id pred{ctx.OpLogicalOr(ctx.U1, lhs, rhs)};
 | |
|         const Id decr{ctx.OpISub(value_type, op_a, ctx.Constant(value_type, 1))};
 | |
|         result = ctx.OpSelect(value_type, pred, op_b, decr);
 | |
|         break;
 | |
|     }
 | |
|     case Operation::FPAdd:
 | |
|         result = ctx.OpFAdd(value_type, op_a, op_b);
 | |
|         break;
 | |
|     case Operation::FPMin:
 | |
|         result = ctx.OpFMin(value_type, op_a, op_b);
 | |
|         break;
 | |
|     case Operation::FPMax:
 | |
|         result = ctx.OpFMax(value_type, op_a, op_b);
 | |
|         break;
 | |
|     default:
 | |
|         break;
 | |
|     }
 | |
|     ctx.OpReturnValue(result);
 | |
|     ctx.OpFunctionEnd();
 | |
|     return func;
 | |
| }
 | |
| 
 | |
// Emits a SPIR-V function that applies `operation` to one buffer element through a
// compare-and-swap retry loop, and returns the function's Id.
//
// ctx             - emit context the types and instructions are added to.
// operation       - forwarded to CasFunction to build the value-combining helper.
// array_pointer   - pointer type of the buffer; only used as the type of the third function
//                   parameter when `scope` is not Workgroup.
// element_pointer - result type of the OpAccessChain addressing the element.
// value_type      - type of the operand and of the function's return value.
// memory_type     - type the element is loaded as; bitcast to/from value_type when different.
// scope           - scope operand of the atomic; Workgroup selects the shared-memory variant,
//                   which addresses ctx.shared_memory_u32 instead of taking a buffer parameter.
//
// Parameters of the emitted function: (u32 index, value_type operand[, array_pointer base]).
| Id CasLoop(EmitContext& ctx, Operation operation, Id array_pointer, Id element_pointer,
 | |
|            Id value_type, Id memory_type, spv::Scope scope) {
 | |
|     const bool is_shared{scope == spv::Scope::Workgroup};
 | |
// The array is addressed through an enclosing struct (extra leading zero index in the access
// chain) unless this is shared memory without explicit workgroup layout support.
|     const bool is_struct{!is_shared || ctx.profile.support_explicit_workgroup_layout};
 | |
|     const Id cas_func{CasFunction(ctx, operation, value_type)};
 | |
|     const Id zero{ctx.u32_zero_value};
 | |
|     const Id scope_id{ctx.Constant(ctx.U32[1], static_cast<u32>(scope))};
 | |
| 
 | |
|     const Id loop_header{ctx.OpLabel()};
 | |
|     const Id continue_block{ctx.OpLabel()};
 | |
|     const Id merge_block{ctx.OpLabel()};
 | |
|     const Id func_type{is_shared
 | |
|                            ? ctx.TypeFunction(value_type, ctx.U32[1], value_type)
 | |
|                            : ctx.TypeFunction(value_type, ctx.U32[1], value_type, array_pointer)};
 | |
| 
 | |
|     const Id func{ctx.OpFunction(value_type, spv::FunctionControlMask::MaskNone, func_type)};
 | |
|     const Id index{ctx.OpFunctionParameter(ctx.U32[1])};
 | |
|     const Id op_b{ctx.OpFunctionParameter(value_type)};
 | |
|     const Id base{is_shared ? ctx.shared_memory_u32 : ctx.OpFunctionParameter(array_pointer)};
 | |
|     ctx.AddLabel();
 | |
|     ctx.OpBranch(loop_header);
 | |
|     ctx.AddLabel(loop_header);
 | |
| 
 | |
|     ctx.OpLoopMerge(merge_block, continue_block, spv::LoopControlMask::MaskNone);
 | |
|     ctx.OpBranch(continue_block);
 | |
| 
 | |
// The whole loop body lives in the continue block.
|     ctx.AddLabel(continue_block);
 | |
|     const Id word_pointer{is_struct ? ctx.OpAccessChain(element_pointer, base, zero, index)
 | |
|                                     : ctx.OpAccessChain(element_pointer, base, index)};
 | |
// Two-component f32 values are kept in memory as one u32 holding two packed halves:
// unpack the loaded word, combine, and repack before the exchange.
|     if (value_type.value == ctx.F32[2].value) {
 | |
|         const Id u32_value{ctx.OpLoad(ctx.U32[1], word_pointer)};
 | |
|         const Id value{ctx.OpUnpackHalf2x16(ctx.F32[2], u32_value)};
 | |
|         const Id new_value{ctx.OpFunctionCall(value_type, cas_func, value, op_b)};
 | |
|         const Id u32_new_value{ctx.OpPackHalf2x16(ctx.U32[1], new_value)};
 | |
|         const Id atomic_res{ctx.OpAtomicCompareExchange(ctx.U32[1], word_pointer, scope_id, zero,
 | |
|                                                         zero, u32_new_value, u32_value)};
 | |
// Retry from the loop header when the atomic's result differs from the word loaded above.
|         const Id success{ctx.OpIEqual(ctx.U1, atomic_res, u32_value)};
 | |
|         ctx.OpBranchConditional(success, merge_block, loop_header);
 | |
| 
 | |
// The function returns the atomic's result (unpacked), not the newly computed value.
|         ctx.AddLabel(merge_block);
 | |
|         ctx.OpReturnValue(ctx.OpUnpackHalf2x16(ctx.F32[2], atomic_res));
 | |
|     } else {
 | |
|         const Id value{ctx.OpLoad(memory_type, word_pointer)};
 | |
|         const bool matching_type{value_type.value == memory_type.value};
 | |
|         const Id bitcast_value{matching_type ? value : ctx.OpBitcast(value_type, value)};
 | |
|         const Id cal_res{ctx.OpFunctionCall(value_type, cas_func, bitcast_value, op_b)};
 | |
|         const Id new_value{matching_type ? cal_res : ctx.OpBitcast(memory_type, cal_res)};
 | |
// NOTE(review): the atomic's result type is hard-coded to u32 although the element was loaded
// as memory_type, and the final OpBitcast below is emitted even when value_type equals
// memory_type — confirm both are intended for every caller.
|         const Id atomic_res{ctx.OpAtomicCompareExchange(ctx.U32[1], word_pointer, scope_id, zero,
 | |
|                                                         zero, new_value, value)};
 | |
// Retry from the loop header when the atomic's result differs from the value loaded above.
|         const Id success{ctx.OpIEqual(ctx.U1, atomic_res, value)};
 | |
|         ctx.OpBranchConditional(success, merge_block, loop_header);
 | |
| 
 | |
// The function returns the atomic's result converted to value_type.
|         ctx.AddLabel(merge_block);
 | |
|         ctx.OpReturnValue(ctx.OpBitcast(value_type, atomic_res));
 | |
|     }
 | |
|     ctx.OpFunctionEnd();
 | |
|     return func;
 | |
| }
 | |
| } // Anonymous namespace
 | |
| 
 | |
| void VectorTypes::Define(Sirit::Module& sirit_ctx, Id base_type, std::string_view name) {
 | |
|     defs[0] = sirit_ctx.Name(base_type, name);
 | |
| 
 | |
|     std::array<char, 6> def_name;
 | |
|     for (int i = 1; i < 4; ++i) {
 | |
|         const std::string_view def_name_view(
 | |
|             def_name.data(),
 | |
|             fmt::format_to_n(def_name.data(), def_name.size(), "{}x{}", name, i + 1).size);
 | |
|         defs[static_cast<size_t>(i)] =
 | |
|             sirit_ctx.Name(sirit_ctx.TypeVector(base_type, i + 1), def_name_view);
 | |
|     }
 | |
| }
 | |
| 
 | |
// Builds the emit context for one shader program.
//
// profile_ - stored by the context; its supported_spirv value is forwarded to the
//            Sirit::Module base constructor.
// program  - IR program whose stage is recorded and whose info drives the definitions below.
// binding  - taken by reference and handed to each resource definition step.
//            NOTE(review): presumably each step advances it past the bindings it used —
//            confirm against the Define* member functions.
//
// The Shader capability is added first, then common types and constants, interfaces,
// local/shared memory, resources, attribute access helpers and labels are defined in the
// order written here.
| EmitContext::EmitContext(const Profile& profile_, IR::Program& program, u32& binding)
 | |
|     : Sirit::Module(profile_.supported_spirv), profile{profile_}, stage{program.stage} {
 | |
|     AddCapability(spv::Capability::Shader);
 | |
|     DefineCommonTypes(program.info);
 | |
|     DefineCommonConstants();
 | |
|     DefineInterfaces(program.info);
 | |
|     DefineLocalMemory(program);
 | |
|     DefineSharedMemory(program);
 | |
// Uses the shared memory types defined by the previous step.
|     DefineSharedMemoryFunctions(program);
 | |
|     DefineConstantBuffers(program.info, binding);
 | |
|     DefineStorageBuffers(program.info, binding);
 | |
|     DefineTextureBuffers(program.info, binding);
 | |
|     DefineImageBuffers(program.info, binding);
 | |
|     DefineTextures(program.info, binding);
 | |
|     DefineImages(program.info, binding);
 | |
|     DefineAttributeMemAccess(program.info);
 | |
|     DefineLabels(program);
 | |
| }
 | |
| 
 | |
// Destructor, defaulted in this translation unit rather than in the class definition.
// NOTE(review): presumably so member types only need to be complete here — confirm.
| EmitContext::~EmitContext() = default;
 | |
| 
 | |
| Id EmitContext::Def(const IR::Value& value) {
 | |
|     if (!value.IsImmediate()) {
 | |
|         return value.InstRecursive()->Definition<Id>();
 | |
|     }
 | |
|     switch (value.Type()) {
 | |
|     case IR::Type::Void:
 | |
|         // Void instructions are used for optional arguments (e.g. texture offsets)
 | |
|         // They are not meant to be used in the SPIR-V module
 | |
|         return Id{};
 | |
|     case IR::Type::U1:
 | |
|         return value.U1() ? true_value : false_value;
 | |
|     case IR::Type::U32:
 | |
|         return Constant(U32[1], value.U32());
 | |
|     case IR::Type::U64:
 | |
|         return Constant(U64, value.U64());
 | |
|     case IR::Type::F32:
 | |
|         return Constant(F32[1], value.F32());
 | |
|     case IR::Type::F64:
 | |
|         return Constant(F64[1], value.F64());
 | |
|     case IR::Type::Label:
 | |
|         return value.Label()->Definition<Id>();
 | |
|     default:
 | |
|         throw NotImplementedException("Immediate type {}", value.Type());
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineCommonTypes(const Info& info) {
 | |
|     void_id = TypeVoid();
 | |
| 
 | |
|     U1 = Name(TypeBool(), "u1");
 | |
| 
 | |
|     F32.Define(*this, TypeFloat(32), "f32");
 | |
|     U32.Define(*this, TypeInt(32, false), "u32");
 | |
| 
 | |
|     private_u32 = Name(TypePointer(spv::StorageClass::Private, U32[1]), "private_u32");
 | |
| 
 | |
|     input_f32 = Name(TypePointer(spv::StorageClass::Input, F32[1]), "input_f32");
 | |
|     input_u32 = Name(TypePointer(spv::StorageClass::Input, U32[1]), "input_u32");
 | |
|     input_s32 = Name(TypePointer(spv::StorageClass::Input, TypeInt(32, true)), "input_s32");
 | |
| 
 | |
|     output_f32 = Name(TypePointer(spv::StorageClass::Output, F32[1]), "output_f32");
 | |
| 
 | |
|     if (info.uses_int8) {
 | |
|         AddCapability(spv::Capability::Int8);
 | |
|         U8 = Name(TypeInt(8, false), "u8");
 | |
|         S8 = Name(TypeInt(8, true), "s8");
 | |
|     }
 | |
|     if (info.uses_int16) {
 | |
|         AddCapability(spv::Capability::Int16);
 | |
|         U16 = Name(TypeInt(16, false), "u16");
 | |
|         S16 = Name(TypeInt(16, true), "s16");
 | |
|     }
 | |
|     if (info.uses_int64) {
 | |
|         AddCapability(spv::Capability::Int64);
 | |
|         U64 = Name(TypeInt(64, false), "u64");
 | |
|     }
 | |
|     if (info.uses_fp16) {
 | |
|         AddCapability(spv::Capability::Float16);
 | |
|         F16.Define(*this, TypeFloat(16), "f16");
 | |
|     }
 | |
|     if (info.uses_fp64) {
 | |
|         AddCapability(spv::Capability::Float64);
 | |
|         F64.Define(*this, TypeFloat(64), "f64");
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineCommonConstants() {
 | |
|     true_value = ConstantTrue(U1);
 | |
|     false_value = ConstantFalse(U1);
 | |
|     u32_zero_value = Constant(U32[1], 0U);
 | |
|     f32_zero_value = Constant(F32[1], 0.0f);
 | |
| }
 | |
| 
 | |
// Declares the shader's interface variables: inputs first, then outputs, both driven by `info`.
| void EmitContext::DefineInterfaces(const Info& info) {
 | |
|     DefineInputs(info);
 | |
|     DefineOutputs(info);
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineLocalMemory(const IR::Program& program) {
 | |
|     if (program.local_memory_size == 0) {
 | |
|         return;
 | |
|     }
 | |
|     const u32 num_elements{Common::DivCeil(program.local_memory_size, 4U)};
 | |
|     const Id type{TypeArray(U32[1], Constant(U32[1], num_elements))};
 | |
|     const Id pointer{TypePointer(spv::StorageClass::Private, type)};
 | |
|     local_memory = AddGlobalVariable(pointer, spv::StorageClass::Private);
 | |
|     if (profile.supported_spirv >= 0x00010400) {
 | |
|         interfaces.push_back(local_memory);
 | |
|     }
 | |
| }
 | |
| 
 | |
// Declares the Workgroup-class storage backing the program's shared memory.
//
// Nothing is declared when program.shared_memory_size is zero.
//
// With profile.support_explicit_workgroup_layout, one aliased Block-decorated struct variable
// is declared per element width (u8/u16/u64 only when the program uses those widths, plus
// u32, u32x2 and u32x4), so each width can be accessed directly.
//
// Without it, a single u32 array is declared and, when the program uses 8- or 16-bit
// integers, helper functions are emitted that store a narrow value into its containing word
// with a compare-and-swap loop.
| void EmitContext::DefineSharedMemory(const IR::Program& program) {
 | |
|     if (program.shared_memory_size == 0) {
 | |
|         return;
 | |
|     }
 | |
// Declares one aliased view of shared memory as struct { element_type data[]; } and returns
// (variable, pointer-to-element type, pointer-to-struct type).
|     const auto make{[&](Id element_type, u32 element_size) {
 | |
|         const u32 num_elements{Common::DivCeil(program.shared_memory_size, element_size)};
 | |
|         const Id array_type{TypeArray(element_type, Constant(U32[1], num_elements))};
 | |
|         Decorate(array_type, spv::Decoration::ArrayStride, element_size);
 | |
| 
 | |
|         const Id struct_type{TypeStruct(array_type)};
 | |
|         MemberDecorate(struct_type, 0U, spv::Decoration::Offset, 0U);
 | |
|         Decorate(struct_type, spv::Decoration::Block);
 | |
| 
 | |
|         const Id pointer{TypePointer(spv::StorageClass::Workgroup, struct_type)};
 | |
|         const Id element_pointer{TypePointer(spv::StorageClass::Workgroup, element_type)};
 | |
|         const Id variable{AddGlobalVariable(pointer, spv::StorageClass::Workgroup)};
 | |
|         Decorate(variable, spv::Decoration::Aliased);
 | |
|         interfaces.push_back(variable);
 | |
| 
 | |
|         return std::make_tuple(variable, element_pointer, pointer);
 | |
|     }};
 | |
|     if (profile.support_explicit_workgroup_layout) {
 | |
|         AddExtension("SPV_KHR_workgroup_memory_explicit_layout");
 | |
|         AddCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
 | |
|         if (program.info.uses_int8) {
 | |
|             AddCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
 | |
|             std::tie(shared_memory_u8, shared_u8, std::ignore) = make(U8, 1);
 | |
|         }
 | |
|         if (program.info.uses_int16) {
 | |
|             AddCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
 | |
|             std::tie(shared_memory_u16, shared_u16, std::ignore) = make(U16, 2);
 | |
|         }
 | |
|         if (program.info.uses_int64) {
 | |
|             std::tie(shared_memory_u64, shared_u64, std::ignore) = make(U64, 8);
 | |
|         }
 | |
// Only the u32 view keeps its struct pointer type; CasLoop callers pass it as array_pointer.
|         std::tie(shared_memory_u32, shared_u32, shared_memory_u32_type) = make(U32[1], 4);
 | |
|         std::tie(shared_memory_u32x2, shared_u32x2, std::ignore) = make(U32[2], 8);
 | |
|         std::tie(shared_memory_u32x4, shared_u32x4, std::ignore) = make(U32[4], 16);
 | |
|         return;
 | |
|     }
 | |
// Fallback: a plain u32 array without struct wrapper or layout decorations.
|     const u32 num_elements{Common::DivCeil(program.shared_memory_size, 4U)};
 | |
|     const Id type{TypeArray(U32[1], Constant(U32[1], num_elements))};
 | |
|     shared_memory_u32_type = TypePointer(spv::StorageClass::Workgroup, type);
 | |
| 
 | |
|     shared_u32 = TypePointer(spv::StorageClass::Workgroup, U32[1]);
 | |
|     shared_memory_u32 = AddGlobalVariable(shared_memory_u32_type, spv::StorageClass::Workgroup);
 | |
|     interfaces.push_back(shared_memory_u32);
 | |
| 
 | |
// Emits `void f(u32 offset, u32 insert_value)`, which writes the low `size` bits of
// insert_value into the word containing byte `offset`. `mask` limits the bit position inside
// the word (24 for byte stores, 16 for halfword stores, per the calls below).
|     const Id func_type{TypeFunction(void_id, U32[1], U32[1])};
 | |
|     const auto make_function{[&](u32 mask, u32 size) {
 | |
|         const Id loop_header{OpLabel()};
 | |
|         const Id continue_block{OpLabel()};
 | |
|         const Id merge_block{OpLabel()};
 | |
| 
 | |
|         const Id func{OpFunction(void_id, spv::FunctionControlMask::MaskNone, func_type)};
 | |
|         const Id offset{OpFunctionParameter(U32[1])};
 | |
|         const Id insert_value{OpFunctionParameter(U32[1])};
 | |
|         AddLabel();
 | |
|         OpBranch(loop_header);
 | |
| 
 | |
|         AddLabel(loop_header);
 | |
// word_offset = offset >> 2 (word index); bit_offset = (offset << 3) & mask (bit position).
|         const Id word_offset{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))};
 | |
|         const Id shift_offset{OpShiftLeftLogical(U32[1], offset, Constant(U32[1], 3U))};
 | |
|         const Id bit_offset{OpBitwiseAnd(U32[1], shift_offset, Constant(U32[1], mask))};
 | |
|         const Id count{Constant(U32[1], size)};
 | |
|         OpLoopMerge(merge_block, continue_block, spv::LoopControlMask::MaskNone);
 | |
|         OpBranch(continue_block);
 | |
| 
 | |
|         AddLabel(continue_block);
 | |
|         const Id word_pointer{OpAccessChain(shared_u32, shared_memory_u32, word_offset)};
 | |
|         const Id old_value{OpLoad(U32[1], word_pointer)};
 | |
|         const Id new_value{OpBitFieldInsert(U32[1], old_value, insert_value, bit_offset, count)};
 | |
// NOTE(review): the scope operand is the literal 1U here, whereas CasLoop derives it from a
// spv::Scope value — confirm which scope 1 denotes and that it is the intended one.
|         const Id atomic_res{OpAtomicCompareExchange(U32[1], word_pointer, Constant(U32[1], 1U),
 | |
|                                                     u32_zero_value, u32_zero_value, new_value,
 | |
|                                                     old_value)};
 | |
// Retry from the loop header when the atomic's result differs from the word loaded above.
|         const Id success{OpIEqual(U1, atomic_res, old_value)};
 | |
|         OpBranchConditional(success, merge_block, loop_header);
 | |
| 
 | |
|         AddLabel(merge_block);
 | |
|         OpReturn();
 | |
|         OpFunctionEnd();
 | |
|         return func;
 | |
|     }};
 | |
|     if (program.info.uses_int8) {
 | |
|         shared_store_u8_func = make_function(24, 8);
 | |
|     }
 | |
|     if (program.info.uses_int16) {
 | |
|         shared_store_u16_func = make_function(16, 16);
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineSharedMemoryFunctions(const IR::Program& program) {
 | |
|     if (program.info.uses_shared_increment) {
 | |
|         increment_cas_shared = CasLoop(*this, Operation::Increment, shared_memory_u32_type,
 | |
|                                        shared_u32, U32[1], U32[1], spv::Scope::Workgroup);
 | |
|     }
 | |
|     if (program.info.uses_shared_decrement) {
 | |
|         decrement_cas_shared = CasLoop(*this, Operation::Decrement, shared_memory_u32_type,
 | |
|                                        shared_u32, U32[1], U32[1], spv::Scope::Workgroup);
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineAttributeMemAccess(const Info& info) {
 | |
|     const auto make_load{[&] {
 | |
|         const bool is_array{stage == Stage::Geometry};
 | |
|         const Id end_block{OpLabel()};
 | |
|         const Id default_label{OpLabel()};
 | |
| 
 | |
|         const Id func_type_load{is_array ? TypeFunction(F32[1], U32[1], U32[1])
 | |
|                                          : TypeFunction(F32[1], U32[1])};
 | |
|         const Id func{OpFunction(F32[1], spv::FunctionControlMask::MaskNone, func_type_load)};
 | |
|         const Id offset{OpFunctionParameter(U32[1])};
 | |
|         const Id vertex{is_array ? OpFunctionParameter(U32[1]) : Id{}};
 | |
| 
 | |
|         AddLabel();
 | |
|         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))};
 | |
|         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Constant(U32[1], 3U))};
 | |
|         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Constant(U32[1], 2U))};
 | |
|         std::vector<Sirit::Literal> literals;
 | |
|         std::vector<Id> labels;
 | |
|         if (info.loads_position) {
 | |
|             literals.push_back(static_cast<u32>(IR::Attribute::PositionX) >> 2);
 | |
|             labels.push_back(OpLabel());
 | |
|         }
 | |
|         const u32 base_attribute_value = static_cast<u32>(IR::Attribute::Generic0X) >> 2;
 | |
|         for (u32 i = 0; i < info.input_generics.size(); ++i) {
 | |
|             if (!info.input_generics[i].used) {
 | |
|                 continue;
 | |
|             }
 | |
|             literals.push_back(base_attribute_value + i);
 | |
|             labels.push_back(OpLabel());
 | |
|         }
 | |
|         OpSelectionMerge(end_block, spv::SelectionControlMask::MaskNone);
 | |
|         OpSwitch(compare_index, default_label, literals, labels);
 | |
|         AddLabel(default_label);
 | |
|         OpReturnValue(Constant(F32[1], 0.0f));
 | |
|         size_t label_index{0};
 | |
|         if (info.loads_position) {
 | |
|             AddLabel(labels[label_index]);
 | |
|             const Id pointer{is_array
 | |
|                                  ? OpAccessChain(input_f32, input_position, vertex, masked_index)
 | |
|                                  : OpAccessChain(input_f32, input_position, masked_index)};
 | |
|             const Id result{OpLoad(F32[1], pointer)};
 | |
|             OpReturnValue(result);
 | |
|             ++label_index;
 | |
|         }
 | |
|         for (size_t i = 0; i < info.input_generics.size(); i++) {
 | |
|             if (!info.input_generics[i].used) {
 | |
|                 continue;
 | |
|             }
 | |
|             AddLabel(labels[label_index]);
 | |
|             const auto type{AttrTypes(*this, static_cast<u32>(i))};
 | |
|             if (!type) {
 | |
|                 OpReturnValue(Constant(F32[1], 0.0f));
 | |
|                 ++label_index;
 | |
|                 continue;
 | |
|             }
 | |
|             const Id generic_id{input_generics.at(i)};
 | |
|             const Id pointer{is_array
 | |
|                                  ? OpAccessChain(type->pointer, generic_id, vertex, masked_index)
 | |
|                                  : OpAccessChain(type->pointer, generic_id, masked_index)};
 | |
|             const Id value{OpLoad(type->id, pointer)};
 | |
|             const Id result{type->needs_cast ? OpBitcast(F32[1], value) : value};
 | |
|             OpReturnValue(result);
 | |
|             ++label_index;
 | |
|         }
 | |
|         AddLabel(end_block);
 | |
|         OpUnreachable();
 | |
|         OpFunctionEnd();
 | |
|         return func;
 | |
|     }};
 | |
|     const auto make_store{[&] {
 | |
|         const Id end_block{OpLabel()};
 | |
|         const Id default_label{OpLabel()};
 | |
| 
 | |
|         const Id func_type_store{TypeFunction(void_id, U32[1], F32[1])};
 | |
|         const Id func{OpFunction(void_id, spv::FunctionControlMask::MaskNone, func_type_store)};
 | |
|         const Id offset{OpFunctionParameter(U32[1])};
 | |
|         const Id store_value{OpFunctionParameter(F32[1])};
 | |
|         AddLabel();
 | |
|         const Id base_index{OpShiftRightArithmetic(U32[1], offset, Constant(U32[1], 2U))};
 | |
|         const Id masked_index{OpBitwiseAnd(U32[1], base_index, Constant(U32[1], 3U))};
 | |
|         const Id compare_index{OpShiftRightArithmetic(U32[1], base_index, Constant(U32[1], 2U))};
 | |
|         std::vector<Sirit::Literal> literals;
 | |
|         std::vector<Id> labels;
 | |
|         if (info.stores_position) {
 | |
|             literals.push_back(static_cast<u32>(IR::Attribute::PositionX) >> 2);
 | |
|             labels.push_back(OpLabel());
 | |
|         }
 | |
|         const u32 base_attribute_value = static_cast<u32>(IR::Attribute::Generic0X) >> 2;
 | |
|         for (size_t i = 0; i < info.stores_generics.size(); i++) {
 | |
|             if (!info.stores_generics[i]) {
 | |
|                 continue;
 | |
|             }
 | |
|             literals.push_back(base_attribute_value + static_cast<u32>(i));
 | |
|             labels.push_back(OpLabel());
 | |
|         }
 | |
|         if (info.stores_clip_distance) {
 | |
|             literals.push_back(static_cast<u32>(IR::Attribute::ClipDistance0) >> 2);
 | |
|             labels.push_back(OpLabel());
 | |
|             literals.push_back(static_cast<u32>(IR::Attribute::ClipDistance4) >> 2);
 | |
|             labels.push_back(OpLabel());
 | |
|         }
 | |
|         OpSelectionMerge(end_block, spv::SelectionControlMask::MaskNone);
 | |
|         OpSwitch(compare_index, default_label, literals, labels);
 | |
|         AddLabel(default_label);
 | |
|         OpReturn();
 | |
|         size_t label_index{0};
 | |
|         if (info.stores_position) {
 | |
|             AddLabel(labels[label_index]);
 | |
|             const Id pointer{OpAccessChain(output_f32, output_position, masked_index)};
 | |
|             OpStore(pointer, store_value);
 | |
|             OpReturn();
 | |
|             ++label_index;
 | |
|         }
 | |
|         for (size_t i = 0; i < info.stores_generics.size(); ++i) {
 | |
|             if (!info.stores_generics[i]) {
 | |
|                 continue;
 | |
|             }
 | |
|             if (output_generics[i][0].num_components != 4) {
 | |
|                 throw NotImplementedException("Physical stores and transform feedbacks");
 | |
|             }
 | |
|             AddLabel(labels[label_index]);
 | |
|             const Id generic_id{output_generics[i][0].id};
 | |
|             const Id pointer{OpAccessChain(output_f32, generic_id, masked_index)};
 | |
|             OpStore(pointer, store_value);
 | |
|             OpReturn();
 | |
|             ++label_index;
 | |
|         }
 | |
|         if (info.stores_clip_distance) {
 | |
|             AddLabel(labels[label_index]);
 | |
|             const Id pointer{OpAccessChain(output_f32, clip_distances, masked_index)};
 | |
|             OpStore(pointer, store_value);
 | |
|             OpReturn();
 | |
|             ++label_index;
 | |
|             AddLabel(labels[label_index]);
 | |
|             const Id fixed_index{OpIAdd(U32[1], masked_index, Constant(U32[1], 4))};
 | |
|             const Id pointer2{OpAccessChain(output_f32, clip_distances, fixed_index)};
 | |
|             OpStore(pointer2, store_value);
 | |
|             OpReturn();
 | |
|             ++label_index;
 | |
|         }
 | |
|         AddLabel(end_block);
 | |
|         OpUnreachable();
 | |
|         OpFunctionEnd();
 | |
|         return func;
 | |
|     }};
 | |
|     if (info.loads_indexed_attributes) {
 | |
|         indexed_load_func = make_load();
 | |
|     }
 | |
|     if (info.stores_indexed_attributes) {
 | |
|         indexed_store_func = make_store();
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineConstantBuffers(const Info& info, u32& binding) {
 | |
|     if (info.constant_buffer_descriptors.empty()) {
 | |
|         return;
 | |
|     }
 | |
|     if (True(info.used_constant_buffer_types & IR::Type::U8)) {
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::U8, binding, U8, 'u', sizeof(u8));
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::S8, binding, S8, 's', sizeof(s8));
 | |
|     }
 | |
|     if (True(info.used_constant_buffer_types & IR::Type::U16)) {
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::U16, binding, U16, 'u', sizeof(u16));
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::S16, binding, S16, 's', sizeof(s16));
 | |
|     }
 | |
|     if (True(info.used_constant_buffer_types & IR::Type::U32)) {
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::U32, binding, U32[1], 'u',
 | |
|                            sizeof(u32));
 | |
|     }
 | |
|     if (True(info.used_constant_buffer_types & IR::Type::F32)) {
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::F32, binding, F32[1], 'f',
 | |
|                            sizeof(f32));
 | |
|     }
 | |
|     if (True(info.used_constant_buffer_types & IR::Type::U32x2)) {
 | |
|         DefineConstBuffers(*this, info, &UniformDefinitions::U32x2, binding, U32[2], 'u',
 | |
|                            sizeof(u32[2]));
 | |
|     }
 | |
|     for (const ConstantBufferDescriptor& desc : info.constant_buffer_descriptors) {
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineStorageBuffers(const Info& info, u32& binding) {
 | |
|     if (info.storage_buffers_descriptors.empty()) {
 | |
|         return;
 | |
|     }
 | |
|     AddExtension("SPV_KHR_storage_buffer_storage_class");
 | |
| 
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U8)) {
 | |
|         DefineSsbos(*this, storage_types.U8, &StorageDefinitions::U8, info, binding, U8,
 | |
|                     sizeof(u8));
 | |
|         DefineSsbos(*this, storage_types.S8, &StorageDefinitions::S8, info, binding, S8,
 | |
|                     sizeof(u8));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U16)) {
 | |
|         DefineSsbos(*this, storage_types.U16, &StorageDefinitions::U16, info, binding, U16,
 | |
|                     sizeof(u16));
 | |
|         DefineSsbos(*this, storage_types.S16, &StorageDefinitions::S16, info, binding, S16,
 | |
|                     sizeof(u16));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U32)) {
 | |
|         DefineSsbos(*this, storage_types.U32, &StorageDefinitions::U32, info, binding, U32[1],
 | |
|                     sizeof(u32));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::F32)) {
 | |
|         DefineSsbos(*this, storage_types.F32, &StorageDefinitions::F32, info, binding, F32[1],
 | |
|                     sizeof(f32));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U64)) {
 | |
|         DefineSsbos(*this, storage_types.U64, &StorageDefinitions::U64, info, binding, U64,
 | |
|                     sizeof(u64));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U32x2)) {
 | |
|         DefineSsbos(*this, storage_types.U32x2, &StorageDefinitions::U32x2, info, binding, U32[2],
 | |
|                     sizeof(u32[2]));
 | |
|     }
 | |
|     if (True(info.used_storage_buffer_types & IR::Type::U32x4)) {
 | |
|         DefineSsbos(*this, storage_types.U32x4, &StorageDefinitions::U32x4, info, binding, U32[4],
 | |
|                     sizeof(u32[4]));
 | |
|     }
 | |
|     for (const StorageBufferDescriptor& desc : info.storage_buffers_descriptors) {
 | |
|         binding += desc.count;
 | |
|     }
 | |
|     const bool needs_function{
 | |
|         info.uses_global_increment || info.uses_global_decrement || info.uses_atomic_f32_add ||
 | |
|         info.uses_atomic_f16x2_add || info.uses_atomic_f16x2_min || info.uses_atomic_f16x2_max ||
 | |
|         info.uses_atomic_f32x2_add || info.uses_atomic_f32x2_min || info.uses_atomic_f32x2_max};
 | |
|     if (needs_function) {
 | |
|         AddCapability(spv::Capability::VariablePointersStorageBuffer);
 | |
|     }
 | |
|     if (info.uses_global_increment) {
 | |
|         increment_cas_ssbo = CasLoop(*this, Operation::Increment, storage_types.U32.array,
 | |
|                                      storage_types.U32.element, U32[1], U32[1], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_global_decrement) {
 | |
|         decrement_cas_ssbo = CasLoop(*this, Operation::Decrement, storage_types.U32.array,
 | |
|                                      storage_types.U32.element, U32[1], U32[1], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f32_add) {
 | |
|         f32_add_cas = CasLoop(*this, Operation::FPAdd, storage_types.U32.array,
 | |
|                               storage_types.U32.element, F32[1], U32[1], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f16x2_add) {
 | |
|         f16x2_add_cas = CasLoop(*this, Operation::FPAdd, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F16[2], F16[2], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f16x2_min) {
 | |
|         f16x2_min_cas = CasLoop(*this, Operation::FPMin, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F16[2], F16[2], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f16x2_max) {
 | |
|         f16x2_max_cas = CasLoop(*this, Operation::FPMax, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F16[2], F16[2], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f32x2_add) {
 | |
|         f32x2_add_cas = CasLoop(*this, Operation::FPAdd, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F32[2], F32[2], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f32x2_min) {
 | |
|         f32x2_min_cas = CasLoop(*this, Operation::FPMin, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F32[2], F32[2], spv::Scope::Device);
 | |
|     }
 | |
|     if (info.uses_atomic_f32x2_max) {
 | |
|         f32x2_max_cas = CasLoop(*this, Operation::FPMax, storage_types.U32.array,
 | |
|                                 storage_types.U32.element, F32[2], F32[2], spv::Scope::Device);
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineTextureBuffers(const Info& info, u32& binding) {
 | |
|     if (info.texture_buffer_descriptors.empty()) {
 | |
|         return;
 | |
|     }
 | |
|     const spv::ImageFormat format{spv::ImageFormat::Unknown};
 | |
|     image_buffer_type = TypeImage(F32[1], spv::Dim::Buffer, 0U, false, false, 1, format);
 | |
|     sampled_texture_buffer_type = TypeSampledImage(image_buffer_type);
 | |
| 
 | |
|     const Id type{TypePointer(spv::StorageClass::UniformConstant, sampled_texture_buffer_type)};
 | |
|     texture_buffers.reserve(info.texture_buffer_descriptors.size());
 | |
|     for (const TextureBufferDescriptor& desc : info.texture_buffer_descriptors) {
 | |
|         if (desc.count != 1) {
 | |
|             throw NotImplementedException("Array of texture buffers");
 | |
|         }
 | |
|         const Id id{AddGlobalVariable(type, spv::StorageClass::UniformConstant)};
 | |
|         Decorate(id, spv::Decoration::Binding, binding);
 | |
|         Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         Name(id, fmt::format("texbuf{}_{:02x}", desc.cbuf_index, desc.cbuf_offset));
 | |
|         texture_buffers.insert(texture_buffers.end(), desc.count, id);
 | |
|         if (profile.supported_spirv >= 0x00010400) {
 | |
|             interfaces.push_back(id);
 | |
|         }
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineImageBuffers(const Info& info, u32& binding) {
 | |
|     image_buffers.reserve(info.image_buffer_descriptors.size());
 | |
|     for (const ImageBufferDescriptor& desc : info.image_buffer_descriptors) {
 | |
|         if (desc.count != 1) {
 | |
|             throw NotImplementedException("Array of image buffers");
 | |
|         }
 | |
|         const spv::ImageFormat format{GetImageFormat(desc.format)};
 | |
|         const Id image_type{TypeImage(U32[4], spv::Dim::Buffer, false, false, false, 2, format)};
 | |
|         const Id pointer_type{TypePointer(spv::StorageClass::UniformConstant, image_type)};
 | |
|         const Id id{AddGlobalVariable(pointer_type, spv::StorageClass::UniformConstant)};
 | |
|         Decorate(id, spv::Decoration::Binding, binding);
 | |
|         Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         Name(id, fmt::format("imgbuf{}_{:02x}", desc.cbuf_index, desc.cbuf_offset));
 | |
|         const ImageBufferDefinition def{
 | |
|             .id = id,
 | |
|             .image_type = image_type,
 | |
|         };
 | |
|         image_buffers.insert(image_buffers.end(), desc.count, def);
 | |
|         if (profile.supported_spirv >= 0x00010400) {
 | |
|             interfaces.push_back(id);
 | |
|         }
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineTextures(const Info& info, u32& binding) {
 | |
|     textures.reserve(info.texture_descriptors.size());
 | |
|     for (const TextureDescriptor& desc : info.texture_descriptors) {
 | |
|         if (desc.count != 1) {
 | |
|             throw NotImplementedException("Array of textures");
 | |
|         }
 | |
|         const Id image_type{ImageType(*this, desc)};
 | |
|         const Id sampled_type{TypeSampledImage(image_type)};
 | |
|         const Id pointer_type{TypePointer(spv::StorageClass::UniformConstant, sampled_type)};
 | |
|         const Id id{AddGlobalVariable(pointer_type, spv::StorageClass::UniformConstant)};
 | |
|         Decorate(id, spv::Decoration::Binding, binding);
 | |
|         Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         Name(id, fmt::format("tex{}_{:02x}", desc.cbuf_index, desc.cbuf_offset));
 | |
|         for (u32 index = 0; index < desc.count; ++index) {
 | |
|             // TODO: Pass count info
 | |
|             textures.push_back(TextureDefinition{
 | |
|                 .id{id},
 | |
|                 .sampled_type{sampled_type},
 | |
|                 .image_type{image_type},
 | |
|             });
 | |
|         }
 | |
|         if (profile.supported_spirv >= 0x00010400) {
 | |
|             interfaces.push_back(id);
 | |
|         }
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineImages(const Info& info, u32& binding) {
 | |
|     images.reserve(info.image_descriptors.size());
 | |
|     for (const ImageDescriptor& desc : info.image_descriptors) {
 | |
|         if (desc.count != 1) {
 | |
|             throw NotImplementedException("Array of textures");
 | |
|         }
 | |
|         const Id image_type{ImageType(*this, desc)};
 | |
|         const Id pointer_type{TypePointer(spv::StorageClass::UniformConstant, image_type)};
 | |
|         const Id id{AddGlobalVariable(pointer_type, spv::StorageClass::UniformConstant)};
 | |
|         Decorate(id, spv::Decoration::Binding, binding);
 | |
|         Decorate(id, spv::Decoration::DescriptorSet, 0U);
 | |
|         Name(id, fmt::format("img{}_{:02x}", desc.cbuf_index, desc.cbuf_offset));
 | |
|         for (u32 index = 0; index < desc.count; ++index) {
 | |
|             images.push_back(ImageDefinition{
 | |
|                 .id{id},
 | |
|                 .image_type{image_type},
 | |
|             });
 | |
|         }
 | |
|         if (profile.supported_spirv >= 0x00010400) {
 | |
|             interfaces.push_back(id);
 | |
|         }
 | |
|         binding += desc.count;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineLabels(IR::Program& program) {
 | |
|     for (IR::Block* const block : program.blocks) {
 | |
|         block->SetDefinition(OpLabel());
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineInputs(const Info& info) {
 | |
|     if (info.uses_workgroup_id) {
 | |
|         workgroup_id = DefineInput(*this, U32[3], spv::BuiltIn::WorkgroupId);
 | |
|     }
 | |
|     if (info.uses_local_invocation_id) {
 | |
|         local_invocation_id = DefineInput(*this, U32[3], spv::BuiltIn::LocalInvocationId);
 | |
|     }
 | |
|     if (info.uses_is_helper_invocation) {
 | |
|         is_helper_invocation = DefineInput(*this, U1, spv::BuiltIn::HelperInvocation);
 | |
|     }
 | |
|     if (info.uses_subgroup_mask) {
 | |
|         subgroup_mask_eq = DefineInput(*this, U32[4], spv::BuiltIn::SubgroupEqMaskKHR);
 | |
|         subgroup_mask_lt = DefineInput(*this, U32[4], spv::BuiltIn::SubgroupLtMaskKHR);
 | |
|         subgroup_mask_le = DefineInput(*this, U32[4], spv::BuiltIn::SubgroupLeMaskKHR);
 | |
|         subgroup_mask_gt = DefineInput(*this, U32[4], spv::BuiltIn::SubgroupGtMaskKHR);
 | |
|         subgroup_mask_ge = DefineInput(*this, U32[4], spv::BuiltIn::SubgroupGeMaskKHR);
 | |
|     }
 | |
|     if (info.uses_subgroup_invocation_id ||
 | |
|         (profile.warp_size_potentially_larger_than_guest &&
 | |
|          (info.uses_subgroup_vote || info.uses_subgroup_mask))) {
 | |
|         subgroup_local_invocation_id =
 | |
|             DefineInput(*this, U32[1], spv::BuiltIn::SubgroupLocalInvocationId);
 | |
|     }
 | |
|     if (info.uses_fswzadd) {
 | |
|         const Id f32_one{Constant(F32[1], 1.0f)};
 | |
|         const Id f32_minus_one{Constant(F32[1], -1.0f)};
 | |
|         const Id f32_zero{Constant(F32[1], 0.0f)};
 | |
|         fswzadd_lut_a = ConstantComposite(F32[4], f32_minus_one, f32_one, f32_minus_one, f32_zero);
 | |
|         fswzadd_lut_b =
 | |
|             ConstantComposite(F32[4], f32_minus_one, f32_minus_one, f32_one, f32_minus_one);
 | |
|     }
 | |
|     if (info.loads_position) {
 | |
|         const bool is_fragment{stage != Stage::Fragment};
 | |
|         const spv::BuiltIn built_in{is_fragment ? spv::BuiltIn::Position : spv::BuiltIn::FragCoord};
 | |
|         input_position = DefineInput(*this, F32[4], built_in);
 | |
|     }
 | |
|     if (info.loads_instance_id) {
 | |
|         if (profile.support_vertex_instance_id) {
 | |
|             instance_id = DefineInput(*this, U32[1], spv::BuiltIn::InstanceId);
 | |
|         } else {
 | |
|             instance_index = DefineInput(*this, U32[1], spv::BuiltIn::InstanceIndex);
 | |
|             base_instance = DefineInput(*this, U32[1], spv::BuiltIn::BaseInstance);
 | |
|         }
 | |
|     }
 | |
|     if (info.loads_vertex_id) {
 | |
|         if (profile.support_vertex_instance_id) {
 | |
|             vertex_id = DefineInput(*this, U32[1], spv::BuiltIn::VertexId);
 | |
|         } else {
 | |
|             vertex_index = DefineInput(*this, U32[1], spv::BuiltIn::VertexIndex);
 | |
|             base_vertex = DefineInput(*this, U32[1], spv::BuiltIn::BaseVertex);
 | |
|         }
 | |
|     }
 | |
|     if (info.loads_front_face) {
 | |
|         front_face = DefineInput(*this, U1, spv::BuiltIn::FrontFacing);
 | |
|     }
 | |
|     if (info.loads_point_coord) {
 | |
|         point_coord = DefineInput(*this, F32[2], spv::BuiltIn::PointCoord);
 | |
|     }
 | |
|     for (size_t index = 0; index < info.input_generics.size(); ++index) {
 | |
|         const InputVarying generic{info.input_generics[index]};
 | |
|         if (!generic.used) {
 | |
|             continue;
 | |
|         }
 | |
|         const AttributeType input_type{profile.generic_input_types[index]};
 | |
|         if (input_type == AttributeType::Disabled) {
 | |
|             continue;
 | |
|         }
 | |
|         const Id type{GetAttributeType(*this, input_type)};
 | |
|         const Id id{DefineInput(*this, type)};
 | |
|         Decorate(id, spv::Decoration::Location, static_cast<u32>(index));
 | |
|         Name(id, fmt::format("in_attr{}", index));
 | |
|         input_generics[index] = id;
 | |
| 
 | |
|         if (stage != Stage::Fragment) {
 | |
|             continue;
 | |
|         }
 | |
|         switch (generic.interpolation) {
 | |
|         case Interpolation::Smooth:
 | |
|             // Default
 | |
|             // Decorate(id, spv::Decoration::Smooth);
 | |
|             break;
 | |
|         case Interpolation::NoPerspective:
 | |
|             Decorate(id, spv::Decoration::NoPerspective);
 | |
|             break;
 | |
|         case Interpolation::Flat:
 | |
|             Decorate(id, spv::Decoration::Flat);
 | |
|             break;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| void EmitContext::DefineOutputs(const Info& info) {
 | |
|     if (info.stores_position || stage == Stage::VertexB) {
 | |
|         output_position = DefineOutput(*this, F32[4], spv::BuiltIn::Position);
 | |
|     }
 | |
|     if (info.stores_point_size || profile.fixed_state_point_size) {
 | |
|         if (stage == Stage::Fragment) {
 | |
|             throw NotImplementedException("Storing PointSize in fragment stage");
 | |
|         }
 | |
|         output_point_size = DefineOutput(*this, F32[1], spv::BuiltIn::PointSize);
 | |
|     }
 | |
|     if (info.stores_clip_distance) {
 | |
|         if (stage == Stage::Fragment) {
 | |
|             throw NotImplementedException("Storing ClipDistance in fragment stage");
 | |
|         }
 | |
|         const Id type{TypeArray(F32[1], Constant(U32[1], 8U))};
 | |
|         clip_distances = DefineOutput(*this, type, spv::BuiltIn::ClipDistance);
 | |
|     }
 | |
|     if (info.stores_layer &&
 | |
|         (profile.support_viewport_index_layer_non_geometry || stage == Stage::Geometry)) {
 | |
|         if (stage == Stage::Fragment) {
 | |
|             throw NotImplementedException("Storing Layer in fragment stage");
 | |
|         }
 | |
|         layer = DefineOutput(*this, U32[1], spv::BuiltIn::Layer);
 | |
|     }
 | |
|     if (info.stores_viewport_index &&
 | |
|         (profile.support_viewport_index_layer_non_geometry || stage == Stage::Geometry)) {
 | |
|         if (stage == Stage::Fragment) {
 | |
|             throw NotImplementedException("Storing ViewportIndex in fragment stage");
 | |
|         }
 | |
|         viewport_index = DefineOutput(*this, U32[1], spv::BuiltIn::ViewportIndex);
 | |
|     }
 | |
|     for (size_t index = 0; index < info.stores_generics.size(); ++index) {
 | |
|         if (info.stores_generics[index]) {
 | |
|             DefineGenericOutput(*this, index);
 | |
|         }
 | |
|     }
 | |
|     if (stage == Stage::Fragment) {
 | |
|         for (u32 index = 0; index < 8; ++index) {
 | |
|             if (!info.stores_frag_color[index]) {
 | |
|                 continue;
 | |
|             }
 | |
|             frag_color[index] = DefineOutput(*this, F32[4]);
 | |
|             Decorate(frag_color[index], spv::Decoration::Location, index);
 | |
|             Name(frag_color[index], fmt::format("frag_color{}", index));
 | |
|         }
 | |
|         if (info.stores_frag_depth) {
 | |
|             frag_depth = DefineOutput(*this, F32[1]);
 | |
|             Decorate(frag_depth, spv::Decoration::BuiltIn, spv::BuiltIn::FragDepth);
 | |
|             Name(frag_depth, "frag_depth");
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| } // namespace Shader::Backend::SPIRV
 | 
