glasm: Implement TEX and TEXS instructions
Remove lod clamp from texture instructions with lod, as this is not needed (nor supported).
This commit is contained in:
		| @@ -283,6 +283,9 @@ void SetupOptions(std::string& header, Info info) { | ||||
|     if (info.uses_subgroup_shuffles) { | ||||
|         header += "OPTION NV_shader_thread_shuffle;"; | ||||
|     } | ||||
|     if (info.uses_sparse_residency) { | ||||
|         header += "OPTION EXT_sparse_texture2;"; | ||||
|     } | ||||
|     const auto non_zero_frag_colors{info.stores_frag_color | std::views::drop(1)}; | ||||
|     if (std::ranges::find(non_zero_frag_colors, true) != non_zero_frag_colors.end()) { | ||||
|         header += "OPTION ARB_draw_buffers;"; | ||||
|   | ||||
| @@ -9,6 +9,34 @@ | ||||
|  | ||||
| namespace Shader::Backend::GLASM { | ||||
| namespace { | ||||
| struct ScopedRegister { | ||||
|     ScopedRegister() = default; | ||||
|     ScopedRegister(RegAlloc& reg_alloc_) : reg_alloc{®_alloc_}, reg{reg_alloc->AllocReg()} {} | ||||
|  | ||||
|     ~ScopedRegister() { | ||||
|         if (reg_alloc) { | ||||
|             reg_alloc->FreeReg(reg); | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     ScopedRegister& operator=(ScopedRegister&& rhs) noexcept { | ||||
|         if (reg_alloc) { | ||||
|             reg_alloc->FreeReg(reg); | ||||
|         } | ||||
|         reg_alloc = std::exchange(rhs.reg_alloc, nullptr); | ||||
|         reg = rhs.reg; | ||||
|     } | ||||
|  | ||||
|     ScopedRegister(ScopedRegister&& rhs) noexcept | ||||
|         : reg_alloc{std::exchange(rhs.reg_alloc, nullptr)}, reg{rhs.reg} {} | ||||
|  | ||||
|     ScopedRegister& operator=(const ScopedRegister&) = delete; | ||||
|     ScopedRegister(const ScopedRegister&) = delete; | ||||
|  | ||||
|     RegAlloc* reg_alloc{}; | ||||
|     Register reg; | ||||
| }; | ||||
|  | ||||
| std::string Texture([[maybe_unused]] EmitContext& ctx, IR::TextureInstInfo info, | ||||
|                     [[maybe_unused]] const IR::Value& index) { | ||||
|     // FIXME | ||||
| @@ -36,6 +64,61 @@ std::string_view TextureType(IR::TextureInstInfo info) { | ||||
|     } | ||||
|     throw InvalidArgument("Invalid texture type {}", info.type.Value()); | ||||
| } | ||||
|  | ||||
| std::string_view ShadowTextureType(IR::TextureInstInfo info) { | ||||
|     switch (info.type) { | ||||
|     case TextureType::Color1D: | ||||
|         return "SHADOW1D"; | ||||
|     case TextureType::ColorArray1D: | ||||
|         return "SHADOWARRAY1D"; | ||||
|     case TextureType::Color2D: | ||||
|         return "SHADOW2D"; | ||||
|     case TextureType::ColorArray2D: | ||||
|         return "SHADOWARRAY2D"; | ||||
|     case TextureType::Color3D: | ||||
|         return "SHADOW3D"; | ||||
|     case TextureType::ColorCube: | ||||
|         return "SHADOWCUBE"; | ||||
|     case TextureType::ColorArrayCube: | ||||
|         return "SHADOWARRAYCUBE"; | ||||
|     case TextureType::Buffer: | ||||
|         return "SHADOWBUFFER"; | ||||
|     } | ||||
|     throw InvalidArgument("Invalid texture type {}", info.type.Value()); | ||||
| } | ||||
|  | ||||
| std::string Offset(EmitContext& ctx, const IR::Value& offset) { | ||||
|     if (offset.IsEmpty()) { | ||||
|         return ""; | ||||
|     } | ||||
|     return fmt::format(",offset({})", Register{ctx.reg_alloc.Consume(offset)}); | ||||
| } | ||||
|  | ||||
| std::pair<std::string, ScopedRegister> Coord(EmitContext& ctx, const IR::Value& coord) { | ||||
|     if (coord.IsImmediate()) { | ||||
|         ScopedRegister scoped_reg(ctx.reg_alloc); | ||||
|         return {fmt::to_string(scoped_reg.reg), std::move(scoped_reg)}; | ||||
|     } | ||||
|     std::string coord_vec{fmt::to_string(Register{ctx.reg_alloc.Consume(coord)})}; | ||||
|     if (coord.InstRecursive()->HasUses()) { | ||||
|         // Move non-dead coords to a separate register, although this should never happen because | ||||
|         // vectors are only assembled for immediate texture instructions | ||||
|         ctx.Add("MOV.F RC,{};", coord_vec); | ||||
|         coord_vec = "RC"; | ||||
|     } | ||||
|     return {std::move(coord_vec), ScopedRegister{}}; | ||||
| } | ||||
|  | ||||
| void StoreSparse(EmitContext& ctx, IR::Inst* sparse_inst) { | ||||
|     if (!sparse_inst) { | ||||
|         return; | ||||
|     } | ||||
|     const Register sparse_ret{ctx.reg_alloc.Define(*sparse_inst)}; | ||||
|     ctx.Add("MOV.S {},-1;" | ||||
|             "MOV.S {}(NONRESIDENT),0;", | ||||
|             sparse_ret, sparse_ret); | ||||
|     sparse_inst->Invalidate(); | ||||
| } | ||||
| } // Anonymous namespace | ||||
|  | ||||
| void EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
| @@ -46,17 +129,8 @@ void EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Valu | ||||
|     const std::string_view lod_clamp_mod{info.has_lod_clamp ? ".LODCLAMP" : ""}; | ||||
|     const std::string_view type{TextureType(info)}; | ||||
|     const std::string texture{Texture(ctx, info, index)}; | ||||
|     std::string offset_vec; | ||||
|     if (!offset.IsEmpty()) { | ||||
|         offset_vec = fmt::format(",offset({})", Register{ctx.reg_alloc.Consume(offset)}); | ||||
|     } | ||||
|     std::string coord_vec{fmt::to_string(Register{ctx.reg_alloc.Consume(coord)})}; | ||||
|     if (coord.InstRecursive()->HasUses()) { | ||||
|         // Move non-dead coords to a separate register, although this should never happen because | ||||
|         // vectors are only assembled for immediate texture instructions | ||||
|         ctx.Add("MOV.F RC,{};", coord_vec); | ||||
|         coord_vec = "RC"; | ||||
|     } | ||||
|     const std::string offset_vec{Offset(ctx, offset)}; | ||||
|     const auto [coord_vec, coord_alloc]{Coord(ctx, coord)}; | ||||
|     const Register ret{ctx.reg_alloc.Define(inst)}; | ||||
|     if (info.has_bias) { | ||||
|         if (info.type == TextureType::ColorArrayCube) { | ||||
| @@ -83,38 +157,172 @@ void EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Valu | ||||
|                     type, offset_vec); | ||||
|         } | ||||
|     } | ||||
|     if (sparse_inst) { | ||||
|         const Register sparse_ret{ctx.reg_alloc.Define(*sparse_inst)}; | ||||
|         ctx.Add("MOV.S {},-1;" | ||||
|                 "MOV.S {}(NONRESIDENT),0;", | ||||
|                 sparse_ret, sparse_ret); | ||||
|         sparse_inst->Invalidate(); | ||||
|     StoreSparse(ctx, sparse_inst); | ||||
| } | ||||
|  | ||||
| void EmitImageSampleExplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                 const IR::Value& coord, ScalarF32 lod, const IR::Value& offset) { | ||||
|     const auto info{inst.Flags<IR::TextureInstInfo>()}; | ||||
|     const auto sparse_inst{inst.GetAssociatedPseudoOperation(IR::Opcode::GetSparseFromOp)}; | ||||
|     const std::string_view sparse_mod{sparse_inst ? ".SPARSE" : ""}; | ||||
|     const std::string_view type{TextureType(info)}; | ||||
|     const std::string texture{Texture(ctx, info, index)}; | ||||
|     const std::string offset_vec{Offset(ctx, offset)}; | ||||
|     const auto [coord_vec, coord_alloc]{Coord(ctx, coord)}; | ||||
|     const Register ret{ctx.reg_alloc.Define(inst)}; | ||||
|     if (info.type == TextureType::ColorArrayCube) { | ||||
|         ctx.Add("TXL.F{} {},{},{},{},ARRAYCUBE{};", sparse_mod, ret, coord_vec, lod, texture, | ||||
|                 offset_vec); | ||||
|     } else { | ||||
|         ctx.Add("MOV.F {}.w,{};" | ||||
|                 "TXL.F{} {},{},{},{}{};", | ||||
|                 coord_vec, lod, sparse_mod, ret, coord_vec, texture, type, offset_vec); | ||||
|     } | ||||
|     StoreSparse(ctx, sparse_inst); | ||||
| } | ||||
|  | ||||
| void EmitImageSampleExplicitLod([[maybe_unused]] EmitContext& ctx, [[maybe_unused]] IR::Inst& inst, | ||||
|                                 [[maybe_unused]] const IR::Value& index, | ||||
|                                 [[maybe_unused]] Register coord, [[maybe_unused]] Register lod_lc, | ||||
|                                 [[maybe_unused]] const IR::Value& offset) { | ||||
|     throw NotImplementedException("GLASM instruction"); | ||||
| void EmitImageSampleDrefImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                     const IR::Value& coord, ScalarF32 dref, Register bias_lc, | ||||
|                                     const IR::Value& offset) { | ||||
|     const auto info{inst.Flags<IR::TextureInstInfo>()}; | ||||
|     const auto sparse_inst{inst.GetAssociatedPseudoOperation(IR::Opcode::GetSparseFromOp)}; | ||||
|     const std::string_view sparse_mod{sparse_inst ? ".SPARSE" : ""}; | ||||
|     const std::string_view type{ShadowTextureType(info)}; | ||||
|     const std::string texture{Texture(ctx, info, index)}; | ||||
|     const std::string offset_vec{Offset(ctx, offset)}; | ||||
|     const auto [coord_vec, coord_alloc]{Coord(ctx, coord)}; | ||||
|     const Register ret{ctx.reg_alloc.Define(inst)}; | ||||
|     if (info.has_bias) { | ||||
|         if (info.has_lod_clamp) { | ||||
|             switch (info.type) { | ||||
|             case TextureType::Color1D: | ||||
|             case TextureType::ColorArray1D: | ||||
|             case TextureType::Color2D: | ||||
|                 ctx.Add("MOV.F {}.z,{};" | ||||
|                         "MOV.F {}.w,{}.x;" | ||||
|                         "TXB.F.LODCLAMP{} {},{},{}.y,{},{}{};", | ||||
|                         coord_vec, dref, coord_vec, bias_lc, sparse_mod, ret, coord_vec, bias_lc, | ||||
|                         texture, type, offset_vec); | ||||
|                 break; | ||||
|             case TextureType::ColorArray2D: | ||||
|             case TextureType::ColorCube: | ||||
|                 ctx.Add("MOV.F {}.w,{};" | ||||
|                         "TXB.F.LODCLAMP{} {},{},{},{},{}{};", | ||||
|                         coord_vec, dref, sparse_mod, ret, coord_vec, bias_lc, texture, type, | ||||
|                         offset_vec); | ||||
|                 break; | ||||
|             default: | ||||
|                 throw NotImplementedException("Invalid type {} with bias and lod clamp", | ||||
|                                               info.type.Value()); | ||||
|             } | ||||
|         } else { | ||||
|             switch (info.type) { | ||||
|             case TextureType::Color1D: | ||||
|             case TextureType::ColorArray1D: | ||||
|             case TextureType::Color2D: | ||||
|                 ctx.Add("MOV.F {}.z,{};" | ||||
|                         "MOV.F {}.w,{}.x;" | ||||
|                         "TXB.F{} {},{},{},{}{};", | ||||
|                         coord_vec, dref, coord_vec, bias_lc, sparse_mod, ret, coord_vec, texture, | ||||
|                         type, offset_vec); | ||||
|                 break; | ||||
|             case TextureType::ColorArray2D: | ||||
|             case TextureType::ColorCube: | ||||
|                 ctx.Add("MOV.F {}.w,{};" | ||||
|                         "TXB.F{} {},{},{},{},{}{};", | ||||
|                         coord_vec, dref, sparse_mod, ret, coord_vec, bias_lc, texture, type, | ||||
|                         offset_vec); | ||||
|                 break; | ||||
|             case TextureType::ColorArrayCube: { | ||||
|                 const ScopedRegister pair{ctx.reg_alloc}; | ||||
|                 ctx.Add("MOV.F {}.x,{};" | ||||
|                         "MOV.F {}.y,{}.x;" | ||||
|                         "TXB.F{} {},{},{},{},{}{};", | ||||
|                         pair.reg, dref, pair.reg, bias_lc, sparse_mod, ret, coord_vec, pair.reg, | ||||
|                         texture, type, offset_vec); | ||||
|                 break; | ||||
|             } | ||||
|             default: | ||||
|                 throw NotImplementedException("Invalid type {}", info.type.Value()); | ||||
|             } | ||||
|         } | ||||
|     } else { | ||||
|         if (info.has_lod_clamp) { | ||||
|             if (info.type != TextureType::ColorArrayCube) { | ||||
|                 const bool w_swizzle{info.type == TextureType::ColorArray2D || | ||||
|                                      info.type == TextureType::ColorCube}; | ||||
|                 const char dref_swizzle{w_swizzle ? 'w' : 'z'}; | ||||
|                 ctx.Add("MOV.F {}.{},{};" | ||||
|                         "TEX.F.LODCLAMP{} {},{},{},{},{}{};", | ||||
|                         coord_vec, dref_swizzle, dref, sparse_mod, ret, coord_vec, bias_lc, texture, | ||||
|                         type, offset_vec); | ||||
|             } else { | ||||
|                 const ScopedRegister pair{ctx.reg_alloc}; | ||||
|                 ctx.Add("MOV.F {}.x,{};" | ||||
|                         "MOV.F {}.y,{};" | ||||
|                         "TEX.F.LODCLAMP{} {},{},{},{},{}{};", | ||||
|                         pair.reg, dref, pair.reg, bias_lc, sparse_mod, ret, coord_vec, pair.reg, | ||||
|                         texture, type, offset_vec); | ||||
|             } | ||||
|         } else { | ||||
|             if (info.type != TextureType::ColorArrayCube) { | ||||
|                 const bool w_swizzle{info.type == TextureType::ColorArray2D || | ||||
|                                      info.type == TextureType::ColorCube}; | ||||
|                 const char dref_swizzle{w_swizzle ? 'w' : 'z'}; | ||||
|                 ctx.Add("MOV.F {}.{},{};" | ||||
|                         "TEX.F{} {},{},{},{}{};", | ||||
|                         coord_vec, dref_swizzle, dref, sparse_mod, ret, coord_vec, texture, type, | ||||
|                         offset_vec); | ||||
|             } else { | ||||
|                 const ScopedRegister pair{ctx.reg_alloc}; | ||||
|                 ctx.Add("TEX.F{} {},{},{},{},{}{};", sparse_mod, ret, coord_vec, dref, texture, | ||||
|                         type, offset_vec); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|     StoreSparse(ctx, sparse_inst); | ||||
| } | ||||
|  | ||||
| void EmitImageSampleDrefImplicitLod([[maybe_unused]] EmitContext& ctx, | ||||
|                                     [[maybe_unused]] IR::Inst& inst, | ||||
|                                     [[maybe_unused]] const IR::Value& index, | ||||
|                                     [[maybe_unused]] Register coord, [[maybe_unused]] Register dref, | ||||
|                                     [[maybe_unused]] Register bias_lc, | ||||
|                                     [[maybe_unused]] const IR::Value& offset) { | ||||
|     throw NotImplementedException("GLASM instruction"); | ||||
| } | ||||
|  | ||||
| void EmitImageSampleDrefExplicitLod([[maybe_unused]] EmitContext& ctx, | ||||
|                                     [[maybe_unused]] IR::Inst& inst, | ||||
|                                     [[maybe_unused]] const IR::Value& index, | ||||
|                                     [[maybe_unused]] Register coord, [[maybe_unused]] Register dref, | ||||
|                                     [[maybe_unused]] Register lod_lc, | ||||
|                                     [[maybe_unused]] const IR::Value& offset) { | ||||
|     throw NotImplementedException("GLASM instruction"); | ||||
| void EmitImageSampleDrefExplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                     const IR::Value& coord, ScalarF32 dref, ScalarF32 lod, | ||||
|                                     const IR::Value& offset) { | ||||
|     const auto info{inst.Flags<IR::TextureInstInfo>()}; | ||||
|     const auto sparse_inst{inst.GetAssociatedPseudoOperation(IR::Opcode::GetSparseFromOp)}; | ||||
|     const std::string_view sparse_mod{sparse_inst ? ".SPARSE" : ""}; | ||||
|     const std::string_view type{ShadowTextureType(info)}; | ||||
|     const std::string texture{Texture(ctx, info, index)}; | ||||
|     const std::string offset_vec{Offset(ctx, offset)}; | ||||
|     const auto [coord_vec, coord_alloc]{Coord(ctx, coord)}; | ||||
|     const Register ret{ctx.reg_alloc.Define(inst)}; | ||||
|     switch (info.type) { | ||||
|     case TextureType::Color1D: | ||||
|     case TextureType::ColorArray1D: | ||||
|     case TextureType::Color2D: | ||||
|         ctx.Add("MOV.F {}.z,{};" | ||||
|                 "MOV.F {}.w,{};" | ||||
|                 "TXL.F{} {},{},{},{}{};", | ||||
|                 coord_vec, dref, coord_vec, lod, sparse_mod, ret, coord_vec, texture, type, | ||||
|                 offset_vec); | ||||
|         break; | ||||
|     case TextureType::ColorArray2D: | ||||
|     case TextureType::ColorCube: | ||||
|         ctx.Add("MOV.F {}.w,{};" | ||||
|                 "TXL.F{} {},{},{},{},{}{};", | ||||
|                 coord_vec, dref, sparse_mod, ret, coord_vec, lod, texture, type, offset_vec); | ||||
|         break; | ||||
|     case TextureType::ColorArrayCube: { | ||||
|         const ScopedRegister pair{ctx.reg_alloc}; | ||||
|         ctx.Add("MOV.F {}.x,{};" | ||||
|                 "MOV.F {}.y,{};" | ||||
|                 "TXL.F{} {},{},{},{},{}{};", | ||||
|                 pair.reg, dref, pair.reg, lod, sparse_mod, ret, coord_vec, pair.reg, texture, type, | ||||
|                 offset_vec); | ||||
|         break; | ||||
|     } | ||||
|     default: | ||||
|         throw NotImplementedException("Invalid type {}", info.type.Value()); | ||||
|     } | ||||
|     StoreSparse(ctx, sparse_inst); | ||||
| } | ||||
|  | ||||
| void EmitImageGather([[maybe_unused]] EmitContext& ctx, [[maybe_unused]] IR::Inst& inst, | ||||
|   | ||||
| @@ -527,12 +527,12 @@ void EmitBoundImageWrite(EmitContext&); | ||||
| void EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                 const IR::Value& coord, Register bias_lc, const IR::Value& offset); | ||||
| void EmitImageSampleExplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                 Register coord, Register lod_lc, const IR::Value& offset); | ||||
|                                 const IR::Value& coord, ScalarF32 lod, const IR::Value& offset); | ||||
| void EmitImageSampleDrefImplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                     Register coord, Register dref, Register bias_lc, | ||||
|                                     const IR::Value& coord, ScalarF32 dref, Register bias_lc, | ||||
|                                     const IR::Value& offset); | ||||
| void EmitImageSampleDrefExplicitLod(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, | ||||
|                                     Register coord, Register dref, Register lod_lc, | ||||
|                                     const IR::Value& coord, ScalarF32 dref, ScalarF32 lod, | ||||
|                                     const IR::Value& offset); | ||||
| void EmitImageGather(EmitContext& ctx, IR::Inst& inst, const IR::Value& index, Register coord, | ||||
|                      const IR::Value& offset, const IR::Value& offset2); | ||||
|   | ||||
| @@ -38,7 +38,7 @@ void Store(EmitContext& ctx, const IR::Value& binding, ScalarU32 offset, ValueTy | ||||
| void Load(EmitContext& ctx, IR::Inst& inst, const IR::Value& binding, ScalarU32 offset, | ||||
|           std::string_view size) { | ||||
|     const Register ret{ctx.reg_alloc.Define(inst)}; | ||||
|     StorageOp(ctx, binding, offset, fmt::format("STORE.{} {},DC.x;", size, ret), | ||||
|     StorageOp(ctx, binding, offset, fmt::format("LOAD.{} {},DC.x;", size, ret), | ||||
|               fmt::format("MOV.U {},{{0,0,0,0}};", ret)); | ||||
| } | ||||
| } // Anonymous namespace | ||||
|   | ||||
| @@ -337,9 +337,9 @@ Id EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& | ||||
| } | ||||
|  | ||||
| Id EmitImageSampleExplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||
|                               Id lod_lc, const IR::Value& offset) { | ||||
|                               Id lod, const IR::Value& offset) { | ||||
|     const auto info{inst->Flags<IR::TextureInstInfo>()}; | ||||
|     const ImageOperands operands(ctx, false, true, info.has_lod_clamp != 0, lod_lc, offset); | ||||
|     const ImageOperands operands(ctx, false, true, false, lod, offset); | ||||
|     return Emit(&EmitContext::OpImageSparseSampleExplicitLod, | ||||
|                 &EmitContext::OpImageSampleExplicitLod, ctx, inst, ctx.F32[4], | ||||
|                 Texture(ctx, info, index), coords, operands.Mask(), operands.Span()); | ||||
| @@ -356,9 +356,9 @@ Id EmitImageSampleDrefImplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Va | ||||
| } | ||||
|  | ||||
| Id EmitImageSampleDrefExplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, | ||||
|                                   Id coords, Id dref, Id lod_lc, const IR::Value& offset) { | ||||
|                                   Id coords, Id dref, Id lod, const IR::Value& offset) { | ||||
|     const auto info{inst->Flags<IR::TextureInstInfo>()}; | ||||
|     const ImageOperands operands(ctx, false, true, info.has_lod_clamp != 0, lod_lc, offset); | ||||
|     const ImageOperands operands(ctx, false, true, false, lod, offset); | ||||
|     return Emit(&EmitContext::OpImageSparseSampleDrefExplicitLod, | ||||
|                 &EmitContext::OpImageSampleDrefExplicitLod, ctx, inst, ctx.F32[1], | ||||
|                 Texture(ctx, info, index), coords, dref, operands.Mask(), operands.Span()); | ||||
|   | ||||
| @@ -491,11 +491,11 @@ Id EmitBoundImageWrite(EmitContext&); | ||||
| Id EmitImageSampleImplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||
|                               Id bias_lc, const IR::Value& offset); | ||||
| Id EmitImageSampleExplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||
|                               Id lod_lc, const IR::Value& offset); | ||||
|                               Id lod, const IR::Value& offset); | ||||
| Id EmitImageSampleDrefImplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, | ||||
|                                   Id coords, Id dref, Id bias_lc, const IR::Value& offset); | ||||
| Id EmitImageSampleDrefExplicitLod(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, | ||||
|                                   Id coords, Id dref, Id lod_lc, const IR::Value& offset); | ||||
|                                   Id coords, Id dref, Id lod, const IR::Value& offset); | ||||
| Id EmitImageGather(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||
|                    const IR::Value& offset, const IR::Value& offset2); | ||||
| Id EmitImageGatherDref(EmitContext& ctx, IR::Inst* inst, const IR::Value& index, Id coords, | ||||
|   | ||||
| @@ -1778,12 +1778,10 @@ Value IREmitter::ImageSampleImplicitLod(const Value& handle, const Value& coords | ||||
| } | ||||
|  | ||||
| Value IREmitter::ImageSampleExplicitLod(const Value& handle, const Value& coords, const F32& lod, | ||||
|                                         const Value& offset, const F32& lod_clamp, | ||||
|                                         TextureInstInfo info) { | ||||
|     const Value lod_lc{MakeLodClampPair(*this, lod, lod_clamp)}; | ||||
|                                         const Value& offset, TextureInstInfo info) { | ||||
|     const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleExplicitLod | ||||
|                                          : Opcode::BindlessImageSampleExplicitLod}; | ||||
|     return Inst(op, Flags{info}, handle, coords, lod_lc, offset); | ||||
|     return Inst(op, Flags{info}, handle, coords, lod, offset); | ||||
| } | ||||
|  | ||||
| F32 IREmitter::ImageSampleDrefImplicitLod(const Value& handle, const Value& coords, const F32& dref, | ||||
| @@ -1796,12 +1794,11 @@ F32 IREmitter::ImageSampleDrefImplicitLod(const Value& handle, const Value& coor | ||||
| } | ||||
|  | ||||
| F32 IREmitter::ImageSampleDrefExplicitLod(const Value& handle, const Value& coords, const F32& dref, | ||||
|                                           const F32& lod, const Value& offset, const F32& lod_clamp, | ||||
|                                           const F32& lod, const Value& offset, | ||||
|                                           TextureInstInfo info) { | ||||
|     const Value lod_lc{MakeLodClampPair(*this, lod, lod_clamp)}; | ||||
|     const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleDrefExplicitLod | ||||
|                                          : Opcode::BindlessImageSampleDrefExplicitLod}; | ||||
|     return Inst<F32>(op, Flags{info}, handle, coords, dref, lod_lc, offset); | ||||
|     return Inst<F32>(op, Flags{info}, handle, coords, dref, lod, offset); | ||||
| } | ||||
|  | ||||
| Value IREmitter::ImageGather(const Value& handle, const Value& coords, const Value& offset, | ||||
|   | ||||
| @@ -302,15 +302,14 @@ public: | ||||
|                                                const F32& lod_clamp, TextureInstInfo info); | ||||
|     [[nodiscard]] Value ImageSampleExplicitLod(const Value& handle, const Value& coords, | ||||
|                                                const F32& lod, const Value& offset, | ||||
|                                                const F32& lod_clamp, TextureInstInfo info); | ||||
|                                                TextureInstInfo info); | ||||
|     [[nodiscard]] F32 ImageSampleDrefImplicitLod(const Value& handle, const Value& coords, | ||||
|                                                  const F32& dref, const F32& bias, | ||||
|                                                  const Value& offset, const F32& lod_clamp, | ||||
|                                                  TextureInstInfo info); | ||||
|     [[nodiscard]] F32 ImageSampleDrefExplicitLod(const Value& handle, const Value& coords, | ||||
|                                                  const F32& dref, const F32& lod, | ||||
|                                                  const Value& offset, const F32& lod_clamp, | ||||
|                                                  TextureInstInfo info); | ||||
|                                                  const Value& offset, TextureInstInfo info); | ||||
|     [[nodiscard]] Value ImageQueryDimension(const Value& handle, const IR::U32& lod); | ||||
|  | ||||
|     [[nodiscard]] Value ImageQueryLod(const Value& handle, const Value& coords, | ||||
|   | ||||
| @@ -177,14 +177,13 @@ void Impl(TranslatorVisitor& v, u64 insn, bool aoffi, Blod blod, bool lc, | ||||
|     const IR::Value sample{[&]() -> IR::Value { | ||||
|         if (tex.dc == 0) { | ||||
|             if (HasExplicitLod(blod)) { | ||||
|                 return v.ir.ImageSampleExplicitLod(handle, coords, lod, offset, lod_clamp, info); | ||||
|                 return v.ir.ImageSampleExplicitLod(handle, coords, lod, offset, info); | ||||
|             } else { | ||||
|                 return v.ir.ImageSampleImplicitLod(handle, coords, lod, offset, lod_clamp, info); | ||||
|             } | ||||
|         } | ||||
|         if (HasExplicitLod(blod)) { | ||||
|             return v.ir.ImageSampleDrefExplicitLod(handle, coords, dref, lod, offset, lod_clamp, | ||||
|                                                    info); | ||||
|             return v.ir.ImageSampleDrefExplicitLod(handle, coords, dref, lod, offset, info); | ||||
|         } else { | ||||
|             return v.ir.ImageSampleDrefImplicitLod(handle, coords, dref, lod, offset, lod_clamp, | ||||
|                                                    info); | ||||
|   | ||||
| @@ -81,18 +81,18 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|     switch (texs.encoding) { | ||||
|     case 0: // 1D.LZ | ||||
|         info.type.Assign(TextureType::Color1D); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, v.F(reg_a), zero, {}, {}, info); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, v.F(reg_a), zero, {}, info); | ||||
|     case 1: // 2D | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
|         return v.ir.ImageSampleImplicitLod(handle, Composite(v, reg_a, reg_b), {}, {}, {}, info); | ||||
|     case 2: // 2D.LZ | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, Composite(v, reg_a, reg_b), zero, {}, {}, info); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, Composite(v, reg_a, reg_b), zero, {}, info); | ||||
|     case 3: // 2D.LL | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, Composite(v, reg_a, reg_a + 1), v.F(reg_b), {}, | ||||
|                                            {}, info); | ||||
|                                            info); | ||||
|     case 4: // 2D.DC | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
| @@ -105,13 +105,13 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
|         info.is_depth.Assign(1); | ||||
|         return v.ir.ImageSampleDrefExplicitLod(handle, Composite(v, reg_a, reg_a + 1), | ||||
|                                                v.F(reg_b + 1), v.F(reg_b), {}, {}, info); | ||||
|                                                v.F(reg_b + 1), v.F(reg_b), {}, info); | ||||
|     case 6: // 2D.LZ.DC | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::Color2D); | ||||
|         info.is_depth.Assign(1); | ||||
|         return v.ir.ImageSampleDrefExplicitLod(handle, Composite(v, reg_a, reg_a + 1), v.F(reg_b), | ||||
|                                                zero, {}, {}, info); | ||||
|                                                zero, {}, info); | ||||
|     case 7: // ARRAY_2D | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::ColorArray2D); | ||||
| @@ -123,7 +123,7 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|         info.type.Assign(TextureType::ColorArray2D); | ||||
|         return v.ir.ImageSampleExplicitLod( | ||||
|             handle, v.ir.CompositeConstruct(v.F(reg_a + 1), v.F(reg_b), ReadArray(v, v.X(reg_a))), | ||||
|             zero, {}, {}, info); | ||||
|             zero, {}, info); | ||||
|     case 9: // ARRAY_2D.LZ.DC | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         CheckAlignment(reg_b, 2); | ||||
| @@ -131,7 +131,7 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|         info.is_depth.Assign(1); | ||||
|         return v.ir.ImageSampleDrefExplicitLod( | ||||
|             handle, v.ir.CompositeConstruct(v.F(reg_a + 1), v.F(reg_b), ReadArray(v, v.X(reg_a))), | ||||
|             v.F(reg_b + 1), zero, {}, {}, info); | ||||
|             v.F(reg_b + 1), zero, {}, info); | ||||
|     case 10: // 3D | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::Color3D); | ||||
| @@ -141,7 +141,7 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::Color3D); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, Composite(v, reg_a, reg_a + 1, reg_b), zero, {}, | ||||
|                                            {}, info); | ||||
|                                            info); | ||||
|     case 12: // CUBE | ||||
|         CheckAlignment(reg_a, 2); | ||||
|         info.type.Assign(TextureType::ColorCube); | ||||
| @@ -152,7 +152,7 @@ IR::Value Sample(TranslatorVisitor& v, u64 insn) { | ||||
|         CheckAlignment(reg_b, 2); | ||||
|         info.type.Assign(TextureType::ColorCube); | ||||
|         return v.ir.ImageSampleExplicitLod(handle, Composite(v, reg_a, reg_a + 1, reg_b), | ||||
|                                            v.F(reg_b + 1), {}, {}, info); | ||||
|                                            v.F(reg_b + 1), {}, info); | ||||
|     default: | ||||
|         throw NotImplementedException("Illegal encoding {}", texs.encoding.Value()); | ||||
|     } | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 ReinUsesLisp
					ReinUsesLisp