shader: Implement CAL inlining function calls

This commit is contained in:
ReinUsesLisp 2021-03-14 03:41:05 -03:00 committed by ameerj
parent b9f7bf4472
commit 71f96fa636
24 changed files with 286 additions and 330 deletions

@ -27,8 +27,6 @@ add_library(shader_recompiler STATIC
frontend/ir/condition.h frontend/ir/condition.h
frontend/ir/flow_test.cpp frontend/ir/flow_test.cpp
frontend/ir/flow_test.h frontend/ir/flow_test.h
frontend/ir/function.cpp
frontend/ir/function.h
frontend/ir/ir_emitter.cpp frontend/ir/ir_emitter.cpp
frontend/ir/ir_emitter.h frontend/ir/ir_emitter.h
frontend/ir/microinstruction.cpp frontend/ir/microinstruction.cpp
@ -43,8 +41,6 @@ add_library(shader_recompiler STATIC
frontend/ir/program.cpp frontend/ir/program.cpp
frontend/ir/program.h frontend/ir/program.h
frontend/ir/reg.h frontend/ir/reg.h
frontend/ir/structured_control_flow.cpp
frontend/ir/structured_control_flow.h
frontend/ir/type.cpp frontend/ir/type.cpp
frontend/ir/type.h frontend/ir/type.h
frontend/ir/value.cpp frontend/ir/value.cpp
@ -60,6 +56,8 @@ add_library(shader_recompiler STATIC
frontend/maxwell/opcodes.h frontend/maxwell/opcodes.h
frontend/maxwell/program.cpp frontend/maxwell/program.cpp
frontend/maxwell/program.h frontend/maxwell/program.h
frontend/maxwell/structured_control_flow.cpp
frontend/maxwell/structured_control_flow.h
frontend/maxwell/translate/impl/bitfield_extract.cpp frontend/maxwell/translate/impl/bitfield_extract.cpp
frontend/maxwell/translate/impl/bitfield_insert.cpp frontend/maxwell/translate/impl/bitfield_insert.cpp
frontend/maxwell/translate/impl/common_encoding.h frontend/maxwell/translate/impl/common_encoding.h

@ -262,11 +262,9 @@ void EmitContext::DefineTextures(const Info& info, u32& binding) {
} }
void EmitContext::DefineLabels(IR::Program& program) { void EmitContext::DefineLabels(IR::Program& program) {
for (const IR::Function& function : program.functions) { for (IR::Block* const block : program.blocks) {
for (IR::Block* const block : function.blocks) {
block->SetDefinition(OpLabel()); block->SetDefinition(OpLabel());
} }
}
} }
} // namespace Shader::Backend::SPIRV } // namespace Shader::Backend::SPIRV

@ -10,7 +10,6 @@
#include "shader_recompiler/backend/spirv/emit_spirv.h" #include "shader_recompiler/backend/spirv/emit_spirv.h"
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/function.h"
#include "shader_recompiler/frontend/ir/microinstruction.h" #include "shader_recompiler/frontend/ir/microinstruction.h"
#include "shader_recompiler/frontend/ir/program.h" #include "shader_recompiler/frontend/ir/program.h"
@ -199,18 +198,14 @@ Id PhiArgDef(EmitContext& ctx, IR::Inst* inst, size_t index) {
std::vector<u32> EmitSPIRV(const Profile& profile, Environment& env, IR::Program& program) { std::vector<u32> EmitSPIRV(const Profile& profile, Environment& env, IR::Program& program) {
EmitContext ctx{profile, program}; EmitContext ctx{profile, program};
const Id void_function{ctx.TypeFunction(ctx.void_id)}; const Id void_function{ctx.TypeFunction(ctx.void_id)};
// FIXME: Forward declare functions (needs sirit support) const Id func{ctx.OpFunction(ctx.void_id, spv::FunctionControlMask::MaskNone, void_function)};
Id func{}; for (IR::Block* const block : program.blocks) {
for (IR::Function& function : program.functions) {
func = ctx.OpFunction(ctx.void_id, spv::FunctionControlMask::MaskNone, void_function);
for (IR::Block* const block : function.blocks) {
ctx.AddLabel(block->Definition<Id>()); ctx.AddLabel(block->Definition<Id>());
for (IR::Inst& inst : block->Instructions()) { for (IR::Inst& inst : block->Instructions()) {
EmitInst(ctx, &inst); EmitInst(ctx, &inst);
} }
} }
ctx.OpFunctionEnd(); ctx.OpFunctionEnd();
}
boost::container::small_vector<Id, 32> interfaces; boost::container::small_vector<Id, 32> interfaces;
const Info& info{program.info}; const Info& info{program.info};
if (info.uses_workgroup_id) { if (info.uses_workgroup_id) {

@ -1,5 +0,0 @@
// Copyright 2021 yuzu Emulator Project
// Licensed under GPLv2 or any later version
// Refer to the license.txt file included.
#include "shader_recompiler/frontend/ir/function.h"

@ -1,18 +0,0 @@
// Copyright 2021 yuzu Emulator Project
// Licensed under GPLv2 or any later version
// Refer to the license.txt file included.
#pragma once
#include <boost/container/small_vector.hpp>
#include "shader_recompiler/frontend/ir/basic_block.h"
namespace Shader::IR {
struct Function {
BlockList blocks;
BlockList post_order_blocks;
};
} // namespace Shader::IR

@ -9,7 +9,8 @@
#include <fmt/format.h> #include <fmt/format.h>
#include "shader_recompiler/frontend/ir/function.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/microinstruction.h"
#include "shader_recompiler/frontend/ir/program.h" #include "shader_recompiler/frontend/ir/program.h"
namespace Shader::IR { namespace Shader::IR {
@ -19,19 +20,14 @@ std::string DumpProgram(const Program& program) {
std::map<const IR::Inst*, size_t> inst_to_index; std::map<const IR::Inst*, size_t> inst_to_index;
std::map<const IR::Block*, size_t> block_to_index; std::map<const IR::Block*, size_t> block_to_index;
for (const IR::Function& function : program.functions) { for (const IR::Block* const block : program.blocks) {
for (const IR::Block* const block : function.blocks) {
block_to_index.emplace(block, index); block_to_index.emplace(block, index);
++index; ++index;
} }
}
std::string ret; std::string ret;
for (const IR::Function& function : program.functions) { for (const auto& block : program.blocks) {
ret += fmt::format("Function\n");
for (const auto& block : function.blocks) {
ret += IR::DumpBlock(*block, block_to_index, inst_to_index, index) + '\n'; ret += IR::DumpBlock(*block, block_to_index, inst_to_index, index) + '\n';
} }
}
return ret; return ret;
} }

@ -8,13 +8,14 @@
#include <boost/container/small_vector.hpp> #include <boost/container/small_vector.hpp>
#include "shader_recompiler/frontend/ir/function.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/shader_info.h" #include "shader_recompiler/shader_info.h"
namespace Shader::IR { namespace Shader::IR {
struct Program { struct Program {
boost::container::small_vector<Function, 1> functions; BlockList blocks;
BlockList post_order_blocks;
Info info; Info info;
}; };

@ -31,13 +31,12 @@ struct Compare {
return lhs.begin < rhs.begin; return lhs.begin < rhs.begin;
} }
}; };
} // Anonymous namespace
static u32 BranchOffset(Location pc, Instruction inst) { u32 BranchOffset(Location pc, Instruction inst) {
return pc.Offset() + inst.branch.Offset() + 8; return pc.Offset() + inst.branch.Offset() + 8;
} }
static void Split(Block* old_block, Block* new_block, Location pc) { void Split(Block* old_block, Block* new_block, Location pc) {
if (pc <= old_block->begin || pc >= old_block->end) { if (pc <= old_block->begin || pc >= old_block->end) {
throw InvalidArgument("Invalid address to split={}", pc); throw InvalidArgument("Invalid address to split={}", pc);
} }
@ -49,21 +48,19 @@ static void Split(Block* old_block, Block* new_block, Location pc) {
.cond{old_block->cond}, .cond{old_block->cond},
.branch_true{old_block->branch_true}, .branch_true{old_block->branch_true},
.branch_false{old_block->branch_false}, .branch_false{old_block->branch_false},
.ir{nullptr},
}; };
*old_block = Block{ *old_block = Block{
.begin{old_block->begin}, .begin{old_block->begin},
.end{pc}, .end{pc},
.end_class{EndClass::Branch}, .end_class{EndClass::Branch},
.stack{std::move(old_block->stack)}, .stack{std::move(old_block->stack)},
.cond{IR::Condition{true}}, .cond{true},
.branch_true{new_block}, .branch_true{new_block},
.branch_false{nullptr}, .branch_false{nullptr},
.ir{nullptr},
}; };
} }
static Token OpcodeToken(Opcode opcode) { Token OpcodeToken(Opcode opcode) {
switch (opcode) { switch (opcode) {
case Opcode::PBK: case Opcode::PBK:
case Opcode::BRK: case Opcode::BRK:
@ -89,7 +86,7 @@ static Token OpcodeToken(Opcode opcode) {
} }
} }
static bool IsAbsoluteJump(Opcode opcode) { bool IsAbsoluteJump(Opcode opcode) {
switch (opcode) { switch (opcode) {
case Opcode::JCAL: case Opcode::JCAL:
case Opcode::JMP: case Opcode::JMP:
@ -100,7 +97,7 @@ static bool IsAbsoluteJump(Opcode opcode) {
} }
} }
static bool HasFlowTest(Opcode opcode) { bool HasFlowTest(Opcode opcode) {
switch (opcode) { switch (opcode) {
case Opcode::BRA: case Opcode::BRA:
case Opcode::BRX: case Opcode::BRX:
@ -121,13 +118,14 @@ static bool HasFlowTest(Opcode opcode) {
} }
} }
static std::string NameOf(const Block& block) { std::string NameOf(const Block& block) {
if (block.begin.IsVirtual()) { if (block.begin.IsVirtual()) {
return fmt::format("\"Virtual {}\"", block.begin); return fmt::format("\"Virtual {}\"", block.begin);
} else { } else {
return fmt::format("\"{}\"", block.begin); return fmt::format("\"{}\"", block.begin);
} }
} }
} // Anonymous namespace
void Stack::Push(Token token, Location target) { void Stack::Push(Token token, Location target) {
entries.push_back({ entries.push_back({
@ -166,26 +164,24 @@ bool Block::Contains(Location pc) const noexcept {
return pc >= begin && pc < end; return pc >= begin && pc < end;
} }
Function::Function(Location start_address) Function::Function(ObjectPool<Block>& block_pool, Location start_address)
: entrypoint{start_address}, labels{{ : entrypoint{start_address}, labels{{
.address{start_address}, .address{start_address},
.block{nullptr}, .block{block_pool.Create(Block{
.begin{start_address},
.end{start_address},
.end_class{EndClass::Branch},
.stack{},
.cond{true},
.branch_true{nullptr},
.branch_false{nullptr},
})},
.stack{}, .stack{},
}} {} }} {}
CFG::CFG(Environment& env_, ObjectPool<Block>& block_pool_, Location start_address) CFG::CFG(Environment& env_, ObjectPool<Block>& block_pool_, Location start_address)
: env{env_}, block_pool{block_pool_} { : env{env_}, block_pool{block_pool_} {
functions.emplace_back(start_address); functions.emplace_back(block_pool, start_address);
functions.back().labels.back().block = block_pool.Create(Block{
.begin{start_address},
.end{start_address},
.end_class{EndClass::Branch},
.stack{},
.cond{IR::Condition{true}},
.branch_true{nullptr},
.branch_false{nullptr},
.ir{nullptr},
});
for (FunctionId function_id = 0; function_id < functions.size(); ++function_id) { for (FunctionId function_id = 0; function_id < functions.size(); ++function_id) {
while (!functions[function_id].labels.empty()) { while (!functions[function_id].labels.empty()) {
Function& function{functions[function_id]}; Function& function{functions[function_id]};
@ -308,11 +304,17 @@ CFG::AnalysisState CFG::AnalyzeInst(Block* block, FunctionId function_id, Locati
const Location cal_pc{is_absolute ? inst.branch.Absolute() : BranchOffset(pc, inst)}; const Location cal_pc{is_absolute ? inst.branch.Absolute() : BranchOffset(pc, inst)};
// Technically CAL pushes into PRET, but that's implicit in the function call for us // Technically CAL pushes into PRET, but that's implicit in the function call for us
// Insert the function into the list if it doesn't exist // Insert the function into the list if it doesn't exist
if (std::ranges::find(functions, cal_pc, &Function::entrypoint) == functions.end()) { const auto it{std::ranges::find(functions, cal_pc, &Function::entrypoint)};
functions.emplace_back(cal_pc); const bool exists{it != functions.end()};
const FunctionId call_id{exists ? std::distance(functions.begin(), it) : functions.size()};
if (!exists) {
functions.emplace_back(block_pool, cal_pc);
} }
// Handle CAL like a regular instruction block->end_class = EndClass::Call;
break; block->function_call = call_id;
block->return_block = AddLabel(block, block->stack, pc + 1, function_id);
block->end = pc;
return AnalysisState::Branch;
} }
default: default:
break; break;
@ -348,7 +350,6 @@ void CFG::AnalyzeCondInst(Block* block, FunctionId function_id, Location pc,
.cond{cond}, .cond{cond},
.branch_true{conditional_block}, .branch_true{conditional_block},
.branch_false{nullptr}, .branch_false{nullptr},
.ir{nullptr},
}; };
// Save the contents of the visited block in the conditional block // Save the contents of the visited block in the conditional block
*conditional_block = std::move(*block); *conditional_block = std::move(*block);
@ -401,16 +402,6 @@ void CFG::AnalyzeBRX(Block*, Location, Instruction, bool is_absolute) {
throw NotImplementedException("{}", is_absolute ? "JMX" : "BRX"); throw NotImplementedException("{}", is_absolute ? "JMX" : "BRX");
} }
void CFG::AnalyzeCAL(Location pc, Instruction inst, bool is_absolute) {
const Location cal_pc{is_absolute ? inst.branch.Absolute() : BranchOffset(pc, inst)};
// Technically CAL pushes into PRET, but that's implicit in the function call for us
// Insert the function to the function list if it doesn't exist
const auto it{std::ranges::find(functions, cal_pc, &Function::entrypoint)};
if (it == functions.end()) {
functions.emplace_back(cal_pc);
}
}
CFG::AnalysisState CFG::AnalyzeEXIT(Block* block, FunctionId function_id, Location pc, CFG::AnalysisState CFG::AnalyzeEXIT(Block* block, FunctionId function_id, Location pc,
Instruction inst) { Instruction inst) {
const IR::FlowTest flow_test{inst.branch.flow_test}; const IR::FlowTest flow_test{inst.branch.flow_test};
@ -455,10 +446,9 @@ Block* CFG::AddLabel(Block* block, Stack stack, Location pc, FunctionId function
.end{pc}, .end{pc},
.end_class{EndClass::Branch}, .end_class{EndClass::Branch},
.stack{stack}, .stack{stack},
.cond{IR::Condition{true}}, .cond{true},
.branch_true{nullptr}, .branch_true{nullptr},
.branch_false{nullptr}, .branch_false{nullptr},
.ir{nullptr},
})}; })};
function.labels.push_back(Label{ function.labels.push_back(Label{
.address{pc}, .address{pc},
@ -495,6 +485,14 @@ std::string CFG::Dot() const {
add_branch(block.branch_false, false); add_branch(block.branch_false, false);
} }
break; break;
case EndClass::Call:
dot += fmt::format("\t\t{}->N{};\n", name, node_uid);
dot += fmt::format("\t\tN{}->{};\n", node_uid, NameOf(*block.return_block));
dot += fmt::format("\t\tN{} [label=\"Call {}\"][shape=square][style=stripped];\n",
node_uid, block.function_call);
dot += '\n';
++node_uid;
break;
case EndClass::Exit: case EndClass::Exit:
dot += fmt::format("\t\t{}->N{};\n", name, node_uid); dot += fmt::format("\t\t{}->N{};\n", name, node_uid);
dot += fmt::format("\t\tN{} [label=\"Exit\"][shape=square][style=stripped];\n", dot += fmt::format("\t\tN{} [label=\"Exit\"][shape=square][style=stripped];\n",

@ -20,16 +20,13 @@
#include "shader_recompiler/frontend/maxwell/opcodes.h" #include "shader_recompiler/frontend/maxwell/opcodes.h"
#include "shader_recompiler/object_pool.h" #include "shader_recompiler/object_pool.h"
namespace Shader::IR {
class Block;
}
namespace Shader::Maxwell::Flow { namespace Shader::Maxwell::Flow {
using FunctionId = size_t; using FunctionId = size_t;
enum class EndClass { enum class EndClass {
Branch, Branch,
Call,
Exit, Exit,
Return, Return,
}; };
@ -75,9 +72,14 @@ struct Block : boost::intrusive::set_base_hook<
EndClass end_class; EndClass end_class;
Stack stack; Stack stack;
IR::Condition cond; IR::Condition cond;
union {
Block* branch_true; Block* branch_true;
FunctionId function_call;
};
union {
Block* branch_false; Block* branch_false;
IR::Block* ir; Block* return_block;
};
}; };
struct Label { struct Label {
@ -87,7 +89,7 @@ struct Label {
}; };
struct Function { struct Function {
Function(Location start_address); explicit Function(ObjectPool<Block>& block_pool, Location start_address);
Location entrypoint; Location entrypoint;
boost::container::small_vector<Label, 16> labels; boost::container::small_vector<Label, 16> labels;
@ -137,7 +139,6 @@ private:
void AnalyzeBRA(Block* block, FunctionId function_id, Location pc, Instruction inst, void AnalyzeBRA(Block* block, FunctionId function_id, Location pc, Instruction inst,
bool is_absolute); bool is_absolute);
void AnalyzeBRX(Block* block, Location pc, Instruction inst, bool is_absolute); void AnalyzeBRX(Block* block, Location pc, Instruction inst, bool is_absolute);
void AnalyzeCAL(Location pc, Instruction inst, bool is_absolute);
AnalysisState AnalyzeEXIT(Block* block, FunctionId function_id, Location pc, Instruction inst); AnalysisState AnalyzeEXIT(Block* block, FunctionId function_id, Location pc, Instruction inst);
/// Return the branch target block id /// Return the branch target block id

@ -8,67 +8,44 @@
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/post_order.h" #include "shader_recompiler/frontend/ir/post_order.h"
#include "shader_recompiler/frontend/ir/structured_control_flow.h"
#include "shader_recompiler/frontend/maxwell/program.h" #include "shader_recompiler/frontend/maxwell/program.h"
#include "shader_recompiler/frontend/maxwell/structured_control_flow.h"
#include "shader_recompiler/frontend/maxwell/translate/translate.h" #include "shader_recompiler/frontend/maxwell/translate/translate.h"
#include "shader_recompiler/ir_opt/passes.h" #include "shader_recompiler/ir_opt/passes.h"
namespace Shader::Maxwell { namespace Shader::Maxwell {
namespace {
IR::BlockList TranslateCode(ObjectPool<IR::Inst>& inst_pool, ObjectPool<IR::Block>& block_pool, static void RemoveUnreachableBlocks(IR::Program& program) {
Environment& env, Flow::Function& cfg_function) { // Some blocks might be unreachable if a function call exists unconditionally
const size_t num_blocks{cfg_function.blocks.size()}; // If this happens the number of blocks and post order blocks will mismatch
std::vector<IR::Block*> blocks(cfg_function.blocks.size()); if (program.blocks.size() == program.post_order_blocks.size()) {
std::ranges::for_each(cfg_function.blocks, [&, i = size_t{0}](auto& cfg_block) mutable { return;
const u32 begin{cfg_block.begin.Offset()};
const u32 end{cfg_block.end.Offset()};
blocks[i] = block_pool.Create(inst_pool, begin, end);
cfg_block.ir = blocks[i];
++i;
});
std::ranges::for_each(cfg_function.blocks, [&, i = size_t{0}](auto& cfg_block) mutable {
IR::Block* const block{blocks[i]};
++i;
if (cfg_block.end_class != Flow::EndClass::Branch) {
block->SetReturn();
} else if (cfg_block.cond == IR::Condition{true}) {
block->SetBranch(cfg_block.branch_true->ir);
} else if (cfg_block.cond == IR::Condition{false}) {
block->SetBranch(cfg_block.branch_false->ir);
} else {
block->SetBranches(cfg_block.cond, cfg_block.branch_true->ir,
cfg_block.branch_false->ir);
} }
const IR::BlockList& post_order{program.post_order_blocks};
std::erase_if(program.blocks, [&](IR::Block* block) {
return std::ranges::find(post_order, block) == post_order.end();
}); });
return IR::VisitAST(inst_pool, block_pool, blocks,
[&](IR::Block* block) { Translate(env, block); });
} }
} // Anonymous namespace
IR::Program TranslateProgram(ObjectPool<IR::Inst>& inst_pool, ObjectPool<IR::Block>& block_pool, IR::Program TranslateProgram(ObjectPool<IR::Inst>& inst_pool, ObjectPool<IR::Block>& block_pool,
Environment& env, Flow::CFG& cfg) { Environment& env, Flow::CFG& cfg) {
IR::Program program; IR::Program program;
auto& functions{program.functions}; program.blocks = VisitAST(inst_pool, block_pool, env, cfg);
functions.reserve(cfg.Functions().size()); program.post_order_blocks = PostOrder(program.blocks);
for (Flow::Function& cfg_function : cfg.Functions()) { RemoveUnreachableBlocks(program);
functions.push_back(IR::Function{
.blocks{TranslateCode(inst_pool, block_pool, env, cfg_function)}, // Replace instructions before the SSA rewrite
.post_order_blocks{},
});
}
Optimization::LowerFp16ToFp32(program); Optimization::LowerFp16ToFp32(program);
for (IR::Function& function : functions) {
function.post_order_blocks = PostOrder(function.blocks); Optimization::SsaRewritePass(program);
Optimization::SsaRewritePass(function.post_order_blocks);
}
Optimization::GlobalMemoryToStorageBufferPass(program); Optimization::GlobalMemoryToStorageBufferPass(program);
Optimization::TexturePass(env, program); Optimization::TexturePass(env, program);
for (IR::Function& function : functions) {
Optimization::PostOrderInvoke(Optimization::ConstantPropagationPass, function); Optimization::ConstantPropagationPass(program);
Optimization::PostOrderInvoke(Optimization::DeadCodeEliminationPass, function); Optimization::DeadCodeEliminationPass(program);
Optimization::IdentityRemovalPass(function); Optimization::IdentityRemovalPass(program);
Optimization::VerificationPass(function); Optimization::VerificationPass(program);
}
Optimization::CollectShaderInfoPass(program); Optimization::CollectShaderInfoPass(program);
return program; return program;
} }

@ -14,11 +14,14 @@
#include <boost/intrusive/list.hpp> #include <boost/intrusive/list.hpp>
#include "shader_recompiler/environment.h"
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/ir_emitter.h" #include "shader_recompiler/frontend/ir/ir_emitter.h"
#include "shader_recompiler/frontend/maxwell/structured_control_flow.h"
#include "shader_recompiler/frontend/maxwell/translate/translate.h"
#include "shader_recompiler/object_pool.h" #include "shader_recompiler/object_pool.h"
namespace Shader::IR { namespace Shader::Maxwell {
namespace { namespace {
struct Statement; struct Statement;
@ -79,7 +82,7 @@ struct Variable {};
#pragma warning(disable : 26495) // Always initialize a member variable, expected in Statement #pragma warning(disable : 26495) // Always initialize a member variable, expected in Statement
#endif #endif
struct Statement : ListBaseHook { struct Statement : ListBaseHook {
Statement(Block* code_, Statement* up_) : code{code_}, up{up_}, type{StatementType::Code} {} Statement(IR::Block* code_, Statement* up_) : code{code_}, up{up_}, type{StatementType::Code} {}
Statement(Goto, Statement* cond_, Node label_, Statement* up_) Statement(Goto, Statement* cond_, Node label_, Statement* up_)
: label{label_}, cond{cond_}, up{up_}, type{StatementType::Goto} {} : label{label_}, cond{cond_}, up{up_}, type{StatementType::Goto} {}
Statement(Label, u32 id_, Statement* up_) : id{id_}, up{up_}, type{StatementType::Label} {} Statement(Label, u32 id_, Statement* up_) : id{id_}, up{up_}, type{StatementType::Label} {}
@ -91,7 +94,7 @@ struct Statement : ListBaseHook {
: cond{cond_}, up{up_}, type{StatementType::Break} {} : cond{cond_}, up{up_}, type{StatementType::Break} {}
Statement(Return) : type{StatementType::Return} {} Statement(Return) : type{StatementType::Return} {}
Statement(FunctionTag) : children{}, type{StatementType::Function} {} Statement(FunctionTag) : children{}, type{StatementType::Function} {}
Statement(Identity, Condition cond_) : guest_cond{cond_}, type{StatementType::Identity} {} Statement(Identity, IR::Condition cond_) : guest_cond{cond_}, type{StatementType::Identity} {}
Statement(Not, Statement* op_) : op{op_}, type{StatementType::Not} {} Statement(Not, Statement* op_) : op{op_}, type{StatementType::Not} {}
Statement(Or, Statement* op_a_, Statement* op_b_) Statement(Or, Statement* op_a_, Statement* op_b_)
: op_a{op_a_}, op_b{op_b_}, type{StatementType::Or} {} : op_a{op_a_}, op_b{op_b_}, type{StatementType::Or} {}
@ -106,10 +109,10 @@ struct Statement : ListBaseHook {
} }
union { union {
Block* code; IR::Block* code;
Node label; Node label;
Tree children; Tree children;
Condition guest_cond; IR::Condition guest_cond;
Statement* op; Statement* op;
Statement* op_a; Statement* op_a;
}; };
@ -269,9 +272,10 @@ bool SearchNode(const Tree& tree, ConstNode stmt, size_t& offset) {
class GotoPass { class GotoPass {
public: public:
explicit GotoPass(std::span<Block* const> blocks, ObjectPool<Statement>& stmt_pool) explicit GotoPass(Flow::CFG& cfg, ObjectPool<IR::Inst>& inst_pool_,
: pool{stmt_pool} { ObjectPool<IR::Block>& block_pool_, ObjectPool<Statement>& stmt_pool)
std::vector gotos{BuildUnorderedTreeGetGotos(blocks)}; : inst_pool{inst_pool_}, block_pool{block_pool_}, pool{stmt_pool} {
std::vector gotos{BuildTree(cfg)};
for (const Node& goto_stmt : gotos | std::views::reverse) { for (const Node& goto_stmt : gotos | std::views::reverse) {
RemoveGoto(goto_stmt); RemoveGoto(goto_stmt);
} }
@ -316,6 +320,7 @@ private:
} }
} }
// TODO: Remove this // TODO: Remove this
{
Node it{goto_stmt}; Node it{goto_stmt};
bool sibling{false}; bool sibling{false};
do { do {
@ -329,6 +334,7 @@ private:
if (!sibling) { if (!sibling) {
throw LogicError("Not siblings"); throw LogicError("Not siblings");
} }
}
// goto_stmt and label_stmt are guaranteed to be siblings, eliminate // goto_stmt and label_stmt are guaranteed to be siblings, eliminate
if (std::next(goto_stmt) == label_stmt) { if (std::next(goto_stmt) == label_stmt) {
// Simply eliminate the goto if the label is next to it // Simply eliminate the goto if the label is next to it
@ -342,63 +348,84 @@ private:
} }
} }
std::vector<Node> BuildUnorderedTreeGetGotos(std::span<Block* const> blocks) { std::vector<Node> BuildTree(Flow::CFG& cfg) {
// Assume all blocks have two branches u32 label_id{0};
std::vector<Node> gotos; std::vector<Node> gotos;
gotos.reserve(blocks.size() * 2); Flow::Function& first_function{cfg.Functions().front()};
BuildTree(cfg, first_function, label_id, gotos, root_stmt.children.end(), std::nullopt);
const std::unordered_map labels_map{BuildLabels(blocks)};
Tree& root{root_stmt.children};
auto insert_point{root.begin()};
// Skip all goto variables zero-initialization
std::advance(insert_point, labels_map.size());
for (Block* const block : blocks) {
// Skip label
++insert_point;
// Skip set variable
++insert_point;
root.insert(insert_point, *pool.Create(block, &root_stmt));
if (block->IsTerminationBlock()) {
root.insert(insert_point, *pool.Create(Return{}));
continue;
}
const Condition cond{block->BranchCondition()};
Statement* const true_cond{pool.Create(Identity{}, Condition{true})};
if (cond == Condition{true} || cond == Condition{false}) {
const bool is_true{cond == Condition{true}};
const Block* const branch{is_true ? block->TrueBranch() : block->FalseBranch()};
const Node label{labels_map.at(branch)};
Statement* const goto_stmt{pool.Create(Goto{}, true_cond, label, &root_stmt)};
gotos.push_back(root.insert(insert_point, *goto_stmt));
} else {
Statement* const ident_cond{pool.Create(Identity{}, cond)};
const Node true_label{labels_map.at(block->TrueBranch())};
const Node false_label{labels_map.at(block->FalseBranch())};
Statement* goto_true{pool.Create(Goto{}, ident_cond, true_label, &root_stmt)};
Statement* goto_false{pool.Create(Goto{}, true_cond, false_label, &root_stmt)};
gotos.push_back(root.insert(insert_point, *goto_true));
gotos.push_back(root.insert(insert_point, *goto_false));
}
}
return gotos; return gotos;
} }
std::unordered_map<const Block*, Node> BuildLabels(std::span<Block* const> blocks) { void BuildTree(Flow::CFG& cfg, Flow::Function& function, u32& label_id,
// TODO: Consider storing labels intrusively inside the block std::vector<Node>& gotos, Node function_insert_point,
std::unordered_map<const Block*, Node> labels_map; std::optional<Node> return_label) {
Statement* const false_stmt{pool.Create(Identity{}, IR::Condition{false})};
Tree& root{root_stmt.children}; Tree& root{root_stmt.children};
u32 label_id{0}; std::unordered_map<Flow::Block*, Node> local_labels;
for (const Block* const block : blocks) { local_labels.reserve(function.blocks.size());
for (Flow::Block& block : function.blocks) {
Statement* const label{pool.Create(Label{}, label_id, &root_stmt)}; Statement* const label{pool.Create(Label{}, label_id, &root_stmt)};
labels_map.emplace(block, root.insert(root.end(), *label)); const Node label_it{root.insert(function_insert_point, *label)};
Statement* const false_stmt{pool.Create(Identity{}, Condition{false})}; local_labels.emplace(&block, label_it);
root.push_back(*pool.Create(SetVariable{}, label_id, false_stmt, &root_stmt));
root.push_front(*pool.Create(SetVariable{}, label_id, false_stmt, &root_stmt));
++label_id; ++label_id;
} }
return labels_map; for (Flow::Block& block : function.blocks) {
const Node label{local_labels.at(&block)};
// Insertion point
const Node ip{std::next(label)};
// Reset goto variables before the first block and after its respective label
const auto make_reset_variable{[&]() -> Statement& {
return *pool.Create(SetVariable{}, label->id, false_stmt, &root_stmt);
}};
root.push_front(make_reset_variable());
root.insert(ip, make_reset_variable());
const u32 begin_offset{block.begin.Offset()};
const u32 end_offset{block.end.Offset()};
IR::Block* const ir_block{block_pool.Create(inst_pool, begin_offset, end_offset)};
root.insert(ip, *pool.Create(ir_block, &root_stmt));
switch (block.end_class) {
case Flow::EndClass::Branch: {
Statement* const always_cond{pool.Create(Identity{}, IR::Condition{true})};
if (block.cond == IR::Condition{true}) {
const Node true_label{local_labels.at(block.branch_true)};
gotos.push_back(
root.insert(ip, *pool.Create(Goto{}, always_cond, true_label, &root_stmt)));
} else if (block.cond == IR::Condition{false}) {
const Node false_label{local_labels.at(block.branch_false)};
gotos.push_back(root.insert(
ip, *pool.Create(Goto{}, always_cond, false_label, &root_stmt)));
} else {
const Node true_label{local_labels.at(block.branch_true)};
const Node false_label{local_labels.at(block.branch_false)};
Statement* const true_cond{pool.Create(Identity{}, block.cond)};
gotos.push_back(
root.insert(ip, *pool.Create(Goto{}, true_cond, true_label, &root_stmt)));
gotos.push_back(root.insert(
ip, *pool.Create(Goto{}, always_cond, false_label, &root_stmt)));
}
break;
}
case Flow::EndClass::Call: {
Flow::Function& call{cfg.Functions()[block.function_call]};
const Node call_return_label{local_labels.at(block.return_block)};
BuildTree(cfg, call, label_id, gotos, ip, call_return_label);
break;
}
case Flow::EndClass::Exit:
root.insert(ip, *pool.Create(Return{}));
break;
case Flow::EndClass::Return: {
Statement* const always_cond{pool.Create(Identity{}, block.cond)};
auto goto_stmt{pool.Create(Goto{}, always_cond, return_label.value(), &root_stmt)};
gotos.push_back(root.insert(ip, *goto_stmt));
break;
}
}
}
} }
void UpdateTreeUp(Statement* tree) { void UpdateTreeUp(Statement* tree) {
@ -556,11 +583,13 @@ private:
return offset; return offset;
} }
ObjectPool<IR::Inst>& inst_pool;
ObjectPool<IR::Block>& block_pool;
ObjectPool<Statement>& pool; ObjectPool<Statement>& pool;
Statement root_stmt{FunctionTag{}}; Statement root_stmt{FunctionTag{}};
}; };
Block* TryFindForwardBlock(const Statement& stmt) { IR::Block* TryFindForwardBlock(const Statement& stmt) {
const Tree& tree{stmt.up->children}; const Tree& tree{stmt.up->children};
const ConstNode end{tree.cend()}; const ConstNode end{tree.cend()};
ConstNode forward_node{std::next(Tree::s_iterator_to(stmt))}; ConstNode forward_node{std::next(Tree::s_iterator_to(stmt))};
@ -573,12 +602,12 @@ Block* TryFindForwardBlock(const Statement& stmt) {
return nullptr; return nullptr;
} }
[[nodiscard]] U1 VisitExpr(IREmitter& ir, const Statement& stmt) { [[nodiscard]] IR::U1 VisitExpr(IR::IREmitter& ir, const Statement& stmt) {
switch (stmt.type) { switch (stmt.type) {
case StatementType::Identity: case StatementType::Identity:
return ir.Condition(stmt.guest_cond); return ir.Condition(stmt.guest_cond);
case StatementType::Not: case StatementType::Not:
return ir.LogicalNot(U1{VisitExpr(ir, *stmt.op)}); return ir.LogicalNot(IR::U1{VisitExpr(ir, *stmt.op)});
case StatementType::Or: case StatementType::Or:
return ir.LogicalOr(VisitExpr(ir, *stmt.op_a), VisitExpr(ir, *stmt.op_b)); return ir.LogicalOr(VisitExpr(ir, *stmt.op_a), VisitExpr(ir, *stmt.op_b));
case StatementType::Variable: case StatementType::Variable:
@ -590,18 +619,18 @@ Block* TryFindForwardBlock(const Statement& stmt) {
class TranslatePass { class TranslatePass {
public: public:
TranslatePass(ObjectPool<Inst>& inst_pool_, ObjectPool<Block>& block_pool_, TranslatePass(ObjectPool<IR::Inst>& inst_pool_, ObjectPool<IR::Block>& block_pool_,
ObjectPool<Statement>& stmt_pool_, Statement& root_stmt, ObjectPool<Statement>& stmt_pool_, Environment& env_, Statement& root_stmt,
const std::function<void(IR::Block*)>& func_, BlockList& block_list_) IR::BlockList& block_list_)
: stmt_pool{stmt_pool_}, inst_pool{inst_pool_}, block_pool{block_pool_}, func{func_}, : stmt_pool{stmt_pool_}, inst_pool{inst_pool_}, block_pool{block_pool_}, env{env_},
block_list{block_list_} { block_list{block_list_} {
Visit(root_stmt, nullptr, nullptr); Visit(root_stmt, nullptr, nullptr);
} }
private: private:
void Visit(Statement& parent, Block* continue_block, Block* break_block) { void Visit(Statement& parent, IR::Block* continue_block, IR::Block* break_block) {
Tree& tree{parent.children}; Tree& tree{parent.children};
Block* current_block{nullptr}; IR::Block* current_block{nullptr};
for (auto it = tree.begin(); it != tree.end(); ++it) { for (auto it = tree.begin(); it != tree.end(); ++it) {
Statement& stmt{*it}; Statement& stmt{*it};
@ -611,11 +640,10 @@ private:
break; break;
case StatementType::Code: { case StatementType::Code: {
if (current_block && current_block != stmt.code) { if (current_block && current_block != stmt.code) {
IREmitter ir{*current_block}; IR::IREmitter{*current_block}.Branch(stmt.code);
ir.Branch(stmt.code);
} }
current_block = stmt.code; current_block = stmt.code;
func(stmt.code); Translate(env, stmt.code);
block_list.push_back(stmt.code); block_list.push_back(stmt.code);
break; break;
} }
@ -623,7 +651,7 @@ private:
if (!current_block) { if (!current_block) {
current_block = MergeBlock(parent, stmt); current_block = MergeBlock(parent, stmt);
} }
IREmitter ir{*current_block}; IR::IREmitter ir{*current_block};
ir.SetGotoVariable(stmt.id, VisitExpr(ir, *stmt.op)); ir.SetGotoVariable(stmt.id, VisitExpr(ir, *stmt.op));
break; break;
} }
@ -632,16 +660,16 @@ private:
current_block = block_pool.Create(inst_pool); current_block = block_pool.Create(inst_pool);
block_list.push_back(current_block); block_list.push_back(current_block);
} }
Block* const merge_block{MergeBlock(parent, stmt)}; IR::Block* const merge_block{MergeBlock(parent, stmt)};
// Visit children // Visit children
const size_t first_block_index{block_list.size()}; const size_t first_block_index{block_list.size()};
Visit(stmt, merge_block, break_block); Visit(stmt, merge_block, break_block);
// Implement if header block // Implement if header block
Block* const first_if_block{block_list.at(first_block_index)}; IR::Block* const first_if_block{block_list.at(first_block_index)};
IREmitter ir{*current_block}; IR::IREmitter ir{*current_block};
const U1 cond{VisitExpr(ir, *stmt.cond)}; const IR::U1 cond{VisitExpr(ir, *stmt.cond)};
ir.SelectionMerge(merge_block); ir.SelectionMerge(merge_block);
ir.BranchConditional(cond, first_if_block, merge_block); ir.BranchConditional(cond, first_if_block, merge_block);
@ -649,14 +677,14 @@ private:
break; break;
} }
case StatementType::Loop: { case StatementType::Loop: {
Block* const loop_header_block{block_pool.Create(inst_pool)}; IR::Block* const loop_header_block{block_pool.Create(inst_pool)};
if (current_block) { if (current_block) {
IREmitter{*current_block}.Branch(loop_header_block); IR::IREmitter{*current_block}.Branch(loop_header_block);
} }
block_list.push_back(loop_header_block); block_list.push_back(loop_header_block);
Block* const new_continue_block{block_pool.Create(inst_pool)}; IR::Block* const new_continue_block{block_pool.Create(inst_pool)};
Block* const merge_block{MergeBlock(parent, stmt)}; IR::Block* const merge_block{MergeBlock(parent, stmt)};
// Visit children // Visit children
const size_t first_block_index{block_list.size()}; const size_t first_block_index{block_list.size()};
@ -666,14 +694,14 @@ private:
block_list.push_back(new_continue_block); block_list.push_back(new_continue_block);
// Implement loop header block // Implement loop header block
Block* const first_loop_block{block_list.at(first_block_index)}; IR::Block* const first_loop_block{block_list.at(first_block_index)};
IREmitter ir{*loop_header_block}; IR::IREmitter ir{*loop_header_block};
ir.LoopMerge(merge_block, new_continue_block); ir.LoopMerge(merge_block, new_continue_block);
ir.Branch(first_loop_block); ir.Branch(first_loop_block);
// Implement continue block // Implement continue block
IREmitter continue_ir{*new_continue_block}; IR::IREmitter continue_ir{*new_continue_block};
const U1 continue_cond{VisitExpr(continue_ir, *stmt.cond)}; const IR::U1 continue_cond{VisitExpr(continue_ir, *stmt.cond)};
continue_ir.BranchConditional(continue_cond, ir.block, merge_block); continue_ir.BranchConditional(continue_cond, ir.block, merge_block);
current_block = merge_block; current_block = merge_block;
@ -684,9 +712,9 @@ private:
current_block = block_pool.Create(inst_pool); current_block = block_pool.Create(inst_pool);
block_list.push_back(current_block); block_list.push_back(current_block);
} }
Block* const skip_block{MergeBlock(parent, stmt)}; IR::Block* const skip_block{MergeBlock(parent, stmt)};
IREmitter ir{*current_block}; IR::IREmitter ir{*current_block};
ir.BranchConditional(VisitExpr(ir, *stmt.cond), break_block, skip_block); ir.BranchConditional(VisitExpr(ir, *stmt.cond), break_block, skip_block);
current_block = skip_block; current_block = skip_block;
@ -697,7 +725,7 @@ private:
current_block = block_pool.Create(inst_pool); current_block = block_pool.Create(inst_pool);
block_list.push_back(current_block); block_list.push_back(current_block);
} }
IREmitter{*current_block}.Return(); IR::IREmitter{*current_block}.Return();
current_block = nullptr; current_block = nullptr;
break; break;
} }
@ -706,39 +734,37 @@ private:
} }
} }
if (current_block && continue_block) { if (current_block && continue_block) {
IREmitter ir{*current_block}; IR::IREmitter{*current_block}.Branch(continue_block);
ir.Branch(continue_block);
} }
} }
Block* MergeBlock(Statement& parent, Statement& stmt) { IR::Block* MergeBlock(Statement& parent, Statement& stmt) {
if (Block* const block{TryFindForwardBlock(stmt)}) { if (IR::Block* const block{TryFindForwardBlock(stmt)}) {
return block; return block;
} }
// Create a merge block we can visit later // Create a merge block we can visit later
Block* const block{block_pool.Create(inst_pool)}; IR::Block* const block{block_pool.Create(inst_pool)};
Statement* const merge_stmt{stmt_pool.Create(block, &parent)}; Statement* const merge_stmt{stmt_pool.Create(block, &parent)};
parent.children.insert(std::next(Tree::s_iterator_to(stmt)), *merge_stmt); parent.children.insert(std::next(Tree::s_iterator_to(stmt)), *merge_stmt);
return block; return block;
} }
ObjectPool<Statement>& stmt_pool; ObjectPool<Statement>& stmt_pool;
ObjectPool<Inst>& inst_pool; ObjectPool<IR::Inst>& inst_pool;
ObjectPool<Block>& block_pool; ObjectPool<IR::Block>& block_pool;
const std::function<void(IR::Block*)>& func; Environment& env;
BlockList& block_list; IR::BlockList& block_list;
}; };
} // Anonymous namespace } // Anonymous namespace
BlockList VisitAST(ObjectPool<Inst>& inst_pool, ObjectPool<Block>& block_pool, IR::BlockList VisitAST(ObjectPool<IR::Inst>& inst_pool, ObjectPool<IR::Block>& block_pool,
std::span<Block* const> unordered_blocks, Environment& env, Flow::CFG& cfg) {
const std::function<void(Block*)>& func) {
ObjectPool<Statement> stmt_pool{64}; ObjectPool<Statement> stmt_pool{64};
GotoPass goto_pass{unordered_blocks, stmt_pool}; GotoPass goto_pass{cfg, inst_pool, block_pool, stmt_pool};
BlockList block_list; Statement& root{goto_pass.RootStatement()};
TranslatePass translate_pass{inst_pool, block_pool, stmt_pool, goto_pass.RootStatement(), IR::BlockList block_list;
func, block_list}; TranslatePass{inst_pool, block_pool, stmt_pool, env, root, block_list};
return block_list; return block_list;
} }
} // namespace Shader::IR } // namespace Shader::Maxwell

@ -9,14 +9,16 @@
#include <boost/intrusive/list.hpp> #include <boost/intrusive/list.hpp>
#include "shader_recompiler/environment.h"
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/microinstruction.h" #include "shader_recompiler/frontend/ir/microinstruction.h"
#include "shader_recompiler/frontend/maxwell/control_flow.h"
#include "shader_recompiler/object_pool.h" #include "shader_recompiler/object_pool.h"
namespace Shader::IR { namespace Shader::Maxwell {
[[nodiscard]] BlockList VisitAST(ObjectPool<Inst>& inst_pool, ObjectPool<Block>& block_pool, [[nodiscard]] IR::BlockList VisitAST(ObjectPool<IR::Inst>& inst_pool,
std::span<Block* const> unordered_blocks, ObjectPool<IR::Block>& block_pool, Environment& env,
const std::function<void(Block*)>& func); Flow::CFG& cfg);
} // namespace Shader::IR } // namespace Shader::Maxwell

@ -62,7 +62,7 @@ public:
void BRA(u64 insn); void BRA(u64 insn);
void BRK(u64 insn); void BRK(u64 insn);
void BRX(u64 insn); void BRX(u64 insn);
void CAL(u64 insn); void CAL();
void CCTL(u64 insn); void CCTL(u64 insn);
void CCTLL(u64 insn); void CCTLL(u64 insn);
void CONT(u64 insn); void CONT(u64 insn);

@ -65,8 +65,8 @@ void TranslatorVisitor::BRX(u64) {
ThrowNotImplemented(Opcode::BRX); ThrowNotImplemented(Opcode::BRX);
} }
void TranslatorVisitor::CAL(u64) { void TranslatorVisitor::CAL() {
ThrowNotImplemented(Opcode::CAL); // CAL is a no-op
} }
void TranslatorVisitor::CCTL(u64) { void TranslatorVisitor::CCTL(u64) {

@ -296,13 +296,11 @@ void Visit(Info& info, IR::Inst& inst) {
void CollectShaderInfoPass(IR::Program& program) { void CollectShaderInfoPass(IR::Program& program) {
Info& info{program.info}; Info& info{program.info};
for (IR::Function& function : program.functions) { for (IR::Block* const block : program.post_order_blocks) {
for (IR::Block* const block : function.post_order_blocks) {
for (IR::Inst& inst : block->Instructions()) { for (IR::Inst& inst : block->Instructions()) {
Visit(info, inst); Visit(info, inst);
} }
} }
}
} }
} // namespace Shader::Optimization } // namespace Shader::Optimization

@ -371,9 +371,11 @@ void ConstantPropagation(IR::Block& block, IR::Inst& inst) {
} }
} // Anonymous namespace } // Anonymous namespace
void ConstantPropagationPass(IR::Block& block) { void ConstantPropagationPass(IR::Program& program) {
for (IR::Inst& inst : block) { for (IR::Block* const block : program.post_order_blocks) {
ConstantPropagation(block, inst); for (IR::Inst& inst : block->Instructions()) {
ConstantPropagation(*block, inst);
}
} }
} }

@ -10,14 +10,16 @@
namespace Shader::Optimization { namespace Shader::Optimization {
void DeadCodeEliminationPass(IR::Block& block) { void DeadCodeEliminationPass(IR::Program& program) {
// We iterate over the instructions in reverse order. // We iterate over the instructions in reverse order.
// This is because removing an instruction reduces the number of uses for earlier instructions. // This is because removing an instruction reduces the number of uses for earlier instructions.
for (IR::Inst& inst : block | std::views::reverse) { for (IR::Block* const block : program.post_order_blocks) {
for (IR::Inst& inst : block->Instructions() | std::views::reverse) {
if (!inst.HasUses() && !inst.MayHaveSideEffects()) { if (!inst.HasUses() && !inst.MayHaveSideEffects()) {
inst.Invalidate(); inst.Invalidate();
} }
} }
}
} }
} // namespace Shader::Optimization } // namespace Shader::Optimization

@ -351,8 +351,7 @@ void GlobalMemoryToStorageBufferPass(IR::Program& program) {
StorageBufferSet storage_buffers; StorageBufferSet storage_buffers;
StorageInstVector to_replace; StorageInstVector to_replace;
for (IR::Function& function : program.functions) { for (IR::Block* const block : program.post_order_blocks) {
for (IR::Block* const block : function.post_order_blocks) {
for (IR::Inst& inst : block->Instructions()) { for (IR::Inst& inst : block->Instructions()) {
if (!IsGlobalMemory(inst)) { if (!IsGlobalMemory(inst)) {
continue; continue;
@ -360,7 +359,6 @@ void GlobalMemoryToStorageBufferPass(IR::Program& program) {
CollectStorageBuffers(*block, inst, storage_buffers, to_replace); CollectStorageBuffers(*block, inst, storage_buffers, to_replace);
} }
} }
}
Info& info{program.info}; Info& info{program.info};
u32 storage_index{}; u32 storage_index{};
for (const StorageBufferAddr& storage_buffer : storage_buffers) { for (const StorageBufferAddr& storage_buffer : storage_buffers) {

@ -10,10 +10,10 @@
namespace Shader::Optimization { namespace Shader::Optimization {
void IdentityRemovalPass(IR::Function& function) { void IdentityRemovalPass(IR::Program& program) {
std::vector<IR::Inst*> to_invalidate; std::vector<IR::Inst*> to_invalidate;
for (IR::Block* const block : function.blocks) { for (IR::Block* const block : program.blocks) {
for (auto inst = block->begin(); inst != block->end();) { for (auto inst = block->begin(); inst != block->end();) {
const size_t num_args{inst->NumArgs()}; const size_t num_args{inst->NumArgs()};
for (size_t i = 0; i < num_args; ++i) { for (size_t i = 0; i < num_args; ++i) {

@ -77,13 +77,11 @@ IR::Opcode Replace(IR::Opcode op) {
} // Anonymous namespace } // Anonymous namespace
void LowerFp16ToFp32(IR::Program& program) { void LowerFp16ToFp32(IR::Program& program) {
for (IR::Function& function : program.functions) { for (IR::Block* const block : program.blocks) {
for (IR::Block* const block : function.blocks) {
for (IR::Inst& inst : block->Instructions()) { for (IR::Inst& inst : block->Instructions()) {
inst.ReplaceOpcode(Replace(inst.Opcode())); inst.ReplaceOpcode(Replace(inst.Opcode()));
} }
} }
}
} }
} // namespace Shader::Optimization } // namespace Shader::Optimization

@ -8,26 +8,18 @@
#include "shader_recompiler/environment.h" #include "shader_recompiler/environment.h"
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/function.h"
#include "shader_recompiler/frontend/ir/program.h" #include "shader_recompiler/frontend/ir/program.h"
namespace Shader::Optimization { namespace Shader::Optimization {
template <typename Func>
void PostOrderInvoke(Func&& func, IR::Function& function) {
for (const auto& block : function.post_order_blocks) {
func(*block);
}
}
void CollectShaderInfoPass(IR::Program& program); void CollectShaderInfoPass(IR::Program& program);
void ConstantPropagationPass(IR::Block& block); void ConstantPropagationPass(IR::Program& program);
void DeadCodeEliminationPass(IR::Block& block); void DeadCodeEliminationPass(IR::Program& program);
void GlobalMemoryToStorageBufferPass(IR::Program& program); void GlobalMemoryToStorageBufferPass(IR::Program& program);
void IdentityRemovalPass(IR::Function& function); void IdentityRemovalPass(IR::Program& program);
void LowerFp16ToFp32(IR::Program& program); void LowerFp16ToFp32(IR::Program& program);
void SsaRewritePass(std::span<IR::Block* const> post_order_blocks); void SsaRewritePass(IR::Program& program);
void TexturePass(Environment& env, IR::Program& program); void TexturePass(Environment& env, IR::Program& program);
void VerificationPass(const IR::Function& function); void VerificationPass(const IR::Program& program);
} // namespace Shader::Optimization } // namespace Shader::Optimization

@ -23,7 +23,6 @@
#include <boost/container/flat_set.hpp> #include <boost/container/flat_set.hpp>
#include "shader_recompiler/frontend/ir/basic_block.h" #include "shader_recompiler/frontend/ir/basic_block.h"
#include "shader_recompiler/frontend/ir/function.h"
#include "shader_recompiler/frontend/ir/microinstruction.h" #include "shader_recompiler/frontend/ir/microinstruction.h"
#include "shader_recompiler/frontend/ir/opcodes.h" #include "shader_recompiler/frontend/ir/opcodes.h"
#include "shader_recompiler/frontend/ir/pred.h" #include "shader_recompiler/frontend/ir/pred.h"
@ -262,9 +261,9 @@ void VisitBlock(Pass& pass, IR::Block* block) {
} }
} // Anonymous namespace } // Anonymous namespace
void SsaRewritePass(std::span<IR::Block* const> post_order_blocks) { void SsaRewritePass(IR::Program& program) {
Pass pass; Pass pass;
for (IR::Block* const block : post_order_blocks | std::views::reverse) { for (IR::Block* const block : program.post_order_blocks | std::views::reverse) {
VisitBlock(pass, block); VisitBlock(pass, block);
} }
} }

@ -164,8 +164,7 @@ private:
void TexturePass(Environment& env, IR::Program& program) { void TexturePass(Environment& env, IR::Program& program) {
TextureInstVector to_replace; TextureInstVector to_replace;
for (IR::Function& function : program.functions) { for (IR::Block* const block : program.post_order_blocks) {
for (IR::Block* const block : function.post_order_blocks) {
for (IR::Inst& inst : block->Instructions()) { for (IR::Inst& inst : block->Instructions()) {
if (!IsTextureInstruction(inst)) { if (!IsTextureInstruction(inst)) {
continue; continue;
@ -173,7 +172,6 @@ void TexturePass(Environment& env, IR::Program& program) {
to_replace.push_back(MakeInst(env, block, inst)); to_replace.push_back(MakeInst(env, block, inst));
} }
} }
}
// Sort instructions to visit textures by constant buffer index, then by offset // Sort instructions to visit textures by constant buffer index, then by offset
std::ranges::sort(to_replace, [](const auto& lhs, const auto& rhs) { std::ranges::sort(to_replace, [](const auto& lhs, const auto& rhs) {
return lhs.cbuf.offset < rhs.cbuf.offset; return lhs.cbuf.offset < rhs.cbuf.offset;

@ -11,8 +11,8 @@
namespace Shader::Optimization { namespace Shader::Optimization {
static void ValidateTypes(const IR::Function& function) { static void ValidateTypes(const IR::Program& program) {
for (const auto& block : function.blocks) { for (const auto& block : program.blocks) {
for (const IR::Inst& inst : *block) { for (const IR::Inst& inst : *block) {
if (inst.Opcode() == IR::Opcode::Phi) { if (inst.Opcode() == IR::Opcode::Phi) {
// Skip validation on phi nodes // Skip validation on phi nodes
@ -30,9 +30,9 @@ static void ValidateTypes(const IR::Function& function) {
} }
} }
static void ValidateUses(const IR::Function& function) { static void ValidateUses(const IR::Program& program) {
std::map<IR::Inst*, int> actual_uses; std::map<IR::Inst*, int> actual_uses;
for (const auto& block : function.blocks) { for (const auto& block : program.blocks) {
for (const IR::Inst& inst : *block) { for (const IR::Inst& inst : *block) {
const size_t num_args{inst.NumArgs()}; const size_t num_args{inst.NumArgs()};
for (size_t i = 0; i < num_args; ++i) { for (size_t i = 0; i < num_args; ++i) {
@ -45,14 +45,14 @@ static void ValidateUses(const IR::Function& function) {
} }
for (const auto [inst, uses] : actual_uses) { for (const auto [inst, uses] : actual_uses) {
if (inst->UseCount() != uses) { if (inst->UseCount() != uses) {
throw LogicError("Invalid uses in block:" /*, IR::DumpFunction(function)*/); throw LogicError("Invalid uses in block: {}", IR::DumpProgram(program));
} }
} }
} }
void VerificationPass(const IR::Function& function) { void VerificationPass(const IR::Program& program) {
ValidateTypes(function); ValidateTypes(program);
ValidateUses(function); ValidateUses(program);
} }
} // namespace Shader::Optimization } // namespace Shader::Optimization