2018-12-20 23:09:21 +01:00
|
|
|
// Copyright 2018 yuzu Emulator Project
|
|
|
|
// Licensed under GPLv2 or any later version
|
|
|
|
// Refer to the license.txt file included.
|
|
|
|
|
|
|
|
#include <cstring>
|
|
|
|
#include <set>
|
|
|
|
|
|
|
|
#include <fmt/format.h>
|
|
|
|
|
2018-12-21 07:18:54 +01:00
|
|
|
#include "common/assert.h"
|
2018-12-20 23:09:21 +01:00
|
|
|
#include "common/common_types.h"
|
|
|
|
#include "video_core/engines/shader_bytecode.h"
|
|
|
|
#include "video_core/engines/shader_header.h"
|
2019-06-25 01:46:49 +02:00
|
|
|
#include "video_core/shader/control_flow.h"
|
2019-06-05 03:44:06 +02:00
|
|
|
#include "video_core/shader/node_helper.h"
|
2018-12-20 23:09:21 +01:00
|
|
|
#include "video_core/shader/shader_ir.h"
|
|
|
|
|
|
|
|
namespace VideoCommon::Shader {
|
|
|
|
|
|
|
|
using Tegra::Shader::Instruction;
|
|
|
|
using Tegra::Shader::OpCode;
|
|
|
|
|
2018-12-21 07:39:46 +01:00
|
|
|
namespace {
|
|
|
|
|
2018-12-20 23:09:21 +01:00
|
|
|
/**
|
|
|
|
* Returns whether the instruction at the specified offset is a 'sched' instruction.
|
|
|
|
* Sched instructions always appear before a sequence of 3 instructions.
|
|
|
|
*/
|
|
|
|
constexpr bool IsSchedInstruction(u32 offset, u32 main_offset) {
|
|
|
|
constexpr u32 SchedPeriod = 4;
|
|
|
|
u32 absolute_offset = offset - main_offset;
|
|
|
|
|
|
|
|
return (absolute_offset % SchedPeriod) == 0;
|
|
|
|
}
|
|
|
|
|
2018-12-21 07:39:46 +01:00
|
|
|
} // namespace
|
|
|
|
|
2018-12-20 23:09:21 +01:00
|
|
|
void ShaderIR::Decode() {
|
|
|
|
std::memcpy(&header, program_code.data(), sizeof(Tegra::Shader::Header));
|
|
|
|
|
2019-06-25 01:46:49 +02:00
|
|
|
ShaderCharacteristics shader_info{};
|
2019-06-25 13:57:32 +02:00
|
|
|
bool can_proceed = ScanFlow(program_code, program_code.size(), main_offset, shader_info);
|
2019-06-25 01:46:49 +02:00
|
|
|
if (can_proceed) {
|
|
|
|
coverage_begin = shader_info.start;
|
|
|
|
coverage_end = shader_info.end;
|
|
|
|
if (shader_info.decompilable) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
// we can't decompile it, fallback to standard method
|
|
|
|
for (const auto& block : shader_info.blocks) {
|
|
|
|
basic_blocks.insert({block.start, DecodeRange(block.start, block.end + 1)});
|
|
|
|
}
|
2018-12-20 23:09:21 +01:00
|
|
|
return;
|
|
|
|
}
|
2019-06-25 13:57:32 +02:00
|
|
|
LOG_WARNING(HW_GPU, "Flow Analysis failed, falling back to brute force compiling");
|
2019-06-25 01:46:49 +02:00
|
|
|
|
|
|
|
// Now we need to deal with an undecompilable shader. We need to brute force
|
|
|
|
// a shader that captures every position.
|
|
|
|
coverage_begin = shader_info.start;
|
2019-06-25 13:57:32 +02:00
|
|
|
const u32 shader_end = static_cast<u32>(program_size / sizeof(u64));
|
2019-06-25 01:46:49 +02:00
|
|
|
coverage_end = shader_end;
|
|
|
|
for (u32 label = main_offset; label < shader_end; label++) {
|
|
|
|
basic_blocks.insert({label, DecodeRange(label, label + 1)});
|
2018-12-20 23:09:21 +01:00
|
|
|
}
|
2019-06-25 01:46:49 +02:00
|
|
|
return;
|
2018-12-20 23:09:21 +01:00
|
|
|
}
|
|
|
|
|
2019-01-30 06:09:40 +01:00
|
|
|
NodeBlock ShaderIR::DecodeRange(u32 begin, u32 end) {
|
|
|
|
NodeBlock basic_block;
|
2018-12-20 23:09:21 +01:00
|
|
|
for (u32 pc = begin; pc < (begin > end ? MAX_PROGRAM_LENGTH : end);) {
|
|
|
|
pc = DecodeInstr(basic_block, pc);
|
|
|
|
}
|
2019-01-28 13:43:19 +01:00
|
|
|
return basic_block;
|
2018-12-20 23:09:21 +01:00
|
|
|
}
|
|
|
|
|
2019-01-30 06:09:40 +01:00
|
|
|
u32 ShaderIR::DecodeInstr(NodeBlock& bb, u32 pc) {
|
2018-12-20 23:09:21 +01:00
|
|
|
// Ignore sched instructions when generating code.
|
|
|
|
if (IsSchedInstruction(pc, main_offset)) {
|
|
|
|
return pc + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
const Instruction instr = {program_code[pc]};
|
|
|
|
const auto opcode = OpCode::Decode(instr);
|
|
|
|
|
|
|
|
// Decoding failure
|
|
|
|
if (!opcode) {
|
|
|
|
UNIMPLEMENTED_MSG("Unhandled instruction: {0:x}", instr.value);
|
|
|
|
return pc + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
bb.push_back(
|
|
|
|
Comment(fmt::format("{}: {} (0x{:016x})", pc, opcode->get().GetName(), instr.value)));
|
|
|
|
|
|
|
|
using Tegra::Shader::Pred;
|
|
|
|
UNIMPLEMENTED_IF_MSG(instr.pred.full_pred == Pred::NeverExecute,
|
|
|
|
"NeverExecute predicate not implemented");
|
|
|
|
|
2019-01-30 06:09:40 +01:00
|
|
|
static const std::map<OpCode::Type, u32 (ShaderIR::*)(NodeBlock&, u32)> decoders = {
|
|
|
|
{OpCode::Type::Arithmetic, &ShaderIR::DecodeArithmetic},
|
|
|
|
{OpCode::Type::ArithmeticImmediate, &ShaderIR::DecodeArithmeticImmediate},
|
|
|
|
{OpCode::Type::Bfe, &ShaderIR::DecodeBfe},
|
|
|
|
{OpCode::Type::Bfi, &ShaderIR::DecodeBfi},
|
|
|
|
{OpCode::Type::Shift, &ShaderIR::DecodeShift},
|
|
|
|
{OpCode::Type::ArithmeticInteger, &ShaderIR::DecodeArithmeticInteger},
|
|
|
|
{OpCode::Type::ArithmeticIntegerImmediate, &ShaderIR::DecodeArithmeticIntegerImmediate},
|
|
|
|
{OpCode::Type::ArithmeticHalf, &ShaderIR::DecodeArithmeticHalf},
|
|
|
|
{OpCode::Type::ArithmeticHalfImmediate, &ShaderIR::DecodeArithmeticHalfImmediate},
|
|
|
|
{OpCode::Type::Ffma, &ShaderIR::DecodeFfma},
|
|
|
|
{OpCode::Type::Hfma2, &ShaderIR::DecodeHfma2},
|
|
|
|
{OpCode::Type::Conversion, &ShaderIR::DecodeConversion},
|
|
|
|
{OpCode::Type::Memory, &ShaderIR::DecodeMemory},
|
2019-02-22 06:19:45 +01:00
|
|
|
{OpCode::Type::Texture, &ShaderIR::DecodeTexture},
|
2019-04-27 07:07:18 +02:00
|
|
|
{OpCode::Type::Image, &ShaderIR::DecodeImage},
|
2019-01-30 06:09:40 +01:00
|
|
|
{OpCode::Type::FloatSetPredicate, &ShaderIR::DecodeFloatSetPredicate},
|
|
|
|
{OpCode::Type::IntegerSetPredicate, &ShaderIR::DecodeIntegerSetPredicate},
|
|
|
|
{OpCode::Type::HalfSetPredicate, &ShaderIR::DecodeHalfSetPredicate},
|
|
|
|
{OpCode::Type::PredicateSetRegister, &ShaderIR::DecodePredicateSetRegister},
|
|
|
|
{OpCode::Type::PredicateSetPredicate, &ShaderIR::DecodePredicateSetPredicate},
|
|
|
|
{OpCode::Type::RegisterSetPredicate, &ShaderIR::DecodeRegisterSetPredicate},
|
|
|
|
{OpCode::Type::FloatSet, &ShaderIR::DecodeFloatSet},
|
|
|
|
{OpCode::Type::IntegerSet, &ShaderIR::DecodeIntegerSet},
|
|
|
|
{OpCode::Type::HalfSet, &ShaderIR::DecodeHalfSet},
|
|
|
|
{OpCode::Type::Video, &ShaderIR::DecodeVideo},
|
|
|
|
{OpCode::Type::Xmad, &ShaderIR::DecodeXmad},
|
|
|
|
};
|
2018-12-29 00:00:36 +01:00
|
|
|
|
|
|
|
std::vector<Node> tmp_block;
|
2018-12-20 23:09:21 +01:00
|
|
|
if (const auto decoder = decoders.find(opcode->get().GetType()); decoder != decoders.end()) {
|
2019-01-30 05:56:33 +01:00
|
|
|
pc = (this->*decoder->second)(tmp_block, pc);
|
2018-12-20 23:09:21 +01:00
|
|
|
} else {
|
2019-01-30 05:56:33 +01:00
|
|
|
pc = DecodeOther(tmp_block, pc);
|
2018-12-20 23:09:21 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Some instructions (like SSY) don't have a predicate field, they are always unconditionally
|
|
|
|
// executed.
|
|
|
|
const bool can_be_predicated = OpCode::IsPredicatedInstruction(opcode->get().GetId());
|
|
|
|
const auto pred_index = static_cast<u32>(instr.pred.pred_index);
|
|
|
|
|
|
|
|
if (can_be_predicated && pred_index != static_cast<u32>(Pred::UnusedIndex)) {
|
2019-01-30 05:56:33 +01:00
|
|
|
const Node conditional =
|
|
|
|
Conditional(GetPredicate(pred_index, instr.negate_pred != 0), std::move(tmp_block));
|
|
|
|
global_code.push_back(conditional);
|
|
|
|
bb.push_back(conditional);
|
2018-12-20 23:09:21 +01:00
|
|
|
} else {
|
2018-12-29 00:00:36 +01:00
|
|
|
for (auto& node : tmp_block) {
|
2019-01-30 05:56:33 +01:00
|
|
|
global_code.push_back(node);
|
|
|
|
bb.push_back(node);
|
2018-12-20 23:09:21 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return pc + 1;
|
|
|
|
}
|
|
|
|
|
2019-04-03 09:33:36 +02:00
|
|
|
} // namespace VideoCommon::Shader
|