Merge pull request #246 from Subv/gpu_macro_calls
GPU: Store uploaded GPU macros and keep track of the number of method arguments.
This commit is contained in:
commit
46f9d4b4a3
8 changed files with 124 additions and 85 deletions
|
@ -24,12 +24,37 @@ namespace Tegra {
|
||||||
|
|
||||||
enum class BufferMethods {
|
enum class BufferMethods {
|
||||||
BindObject = 0,
|
BindObject = 0,
|
||||||
|
SetGraphMacroCode = 0x45,
|
||||||
|
SetGraphMacroCodeArg = 0x46,
|
||||||
|
SetGraphMacroEntry = 0x47,
|
||||||
CountBufferMethods = 0x100,
|
CountBufferMethods = 0x100,
|
||||||
};
|
};
|
||||||
|
|
||||||
void GPU::WriteReg(u32 method, u32 subchannel, u32 value) {
|
void GPU::WriteReg(u32 method, u32 subchannel, u32 value, u32 remaining_params) {
|
||||||
LOG_WARNING(HW_GPU, "Processing method %08X on subchannel %u value %08X", method, subchannel,
|
LOG_WARNING(HW_GPU, "Processing method %08X on subchannel %u value %08X remaining params %u",
|
||||||
value);
|
method, subchannel, value, remaining_params);
|
||||||
|
|
||||||
|
if (method == static_cast<u32>(BufferMethods::SetGraphMacroEntry)) {
|
||||||
|
// Prepare to upload a new macro, reset the upload counter.
|
||||||
|
LOG_DEBUG(HW_GPU, "Uploading GPU macro %08X", value);
|
||||||
|
current_macro_entry = value;
|
||||||
|
current_macro_code.clear();
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (method == static_cast<u32>(BufferMethods::SetGraphMacroCodeArg)) {
|
||||||
|
// Append a new code word to the current macro.
|
||||||
|
current_macro_code.push_back(value);
|
||||||
|
|
||||||
|
// There are no more params remaining, submit the code to the 3D engine.
|
||||||
|
if (remaining_params == 0) {
|
||||||
|
maxwell_3d->SubmitMacroCode(current_macro_entry, std::move(current_macro_code));
|
||||||
|
current_macro_entry = InvalidGraphMacroEntry;
|
||||||
|
current_macro_code.clear();
|
||||||
|
}
|
||||||
|
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
if (method == static_cast<u32>(BufferMethods::BindObject)) {
|
if (method == static_cast<u32>(BufferMethods::BindObject)) {
|
||||||
// Bind the current subchannel to the desired engine id.
|
// Bind the current subchannel to the desired engine id.
|
||||||
|
@ -54,7 +79,7 @@ void GPU::WriteReg(u32 method, u32 subchannel, u32 value) {
|
||||||
fermi_2d->WriteReg(method, value);
|
fermi_2d->WriteReg(method, value);
|
||||||
break;
|
break;
|
||||||
case EngineID::MAXWELL_B:
|
case EngineID::MAXWELL_B:
|
||||||
maxwell_3d->WriteReg(method, value);
|
maxwell_3d->WriteReg(method, value, remaining_params);
|
||||||
break;
|
break;
|
||||||
case EngineID::MAXWELL_COMPUTE_B:
|
case EngineID::MAXWELL_COMPUTE_B:
|
||||||
maxwell_compute->WriteReg(method, value);
|
maxwell_compute->WriteReg(method, value);
|
||||||
|
@ -64,35 +89,6 @@ void GPU::WriteReg(u32 method, u32 subchannel, u32 value) {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void GPU::CallMethod(u32 method, u32 subchannel, const std::vector<u32>& parameters) {
|
|
||||||
LOG_WARNING(HW_GPU, "Processing method %08X on subchannel %u num params %zu", method,
|
|
||||||
subchannel, parameters.size());
|
|
||||||
|
|
||||||
if (method < static_cast<u32>(BufferMethods::CountBufferMethods)) {
|
|
||||||
// TODO(Subv): Research and implement these methods.
|
|
||||||
LOG_ERROR(HW_GPU, "Special buffer methods other than Bind are not implemented");
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
ASSERT(bound_engines.find(subchannel) != bound_engines.end());
|
|
||||||
|
|
||||||
const EngineID engine = bound_engines[subchannel];
|
|
||||||
|
|
||||||
switch (engine) {
|
|
||||||
case EngineID::FERMI_TWOD_A:
|
|
||||||
fermi_2d->CallMethod(method, parameters);
|
|
||||||
break;
|
|
||||||
case EngineID::MAXWELL_B:
|
|
||||||
maxwell_3d->CallMethod(method, parameters);
|
|
||||||
break;
|
|
||||||
case EngineID::MAXWELL_COMPUTE_B:
|
|
||||||
maxwell_compute->CallMethod(method, parameters);
|
|
||||||
break;
|
|
||||||
default:
|
|
||||||
UNIMPLEMENTED();
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
void GPU::ProcessCommandList(GPUVAddr address, u32 size) {
|
void GPU::ProcessCommandList(GPUVAddr address, u32 size) {
|
||||||
// TODO(Subv): PhysicalToVirtualAddress is a misnomer, it converts a GPU VAddr into an
|
// TODO(Subv): PhysicalToVirtualAddress is a misnomer, it converts a GPU VAddr into an
|
||||||
// application VAddr.
|
// application VAddr.
|
||||||
|
@ -107,7 +103,8 @@ void GPU::ProcessCommandList(GPUVAddr address, u32 size) {
|
||||||
case SubmissionMode::Increasing: {
|
case SubmissionMode::Increasing: {
|
||||||
// Increase the method value with each argument.
|
// Increase the method value with each argument.
|
||||||
for (unsigned i = 0; i < header.arg_count; ++i) {
|
for (unsigned i = 0; i < header.arg_count; ++i) {
|
||||||
WriteReg(header.method + i, header.subchannel, Memory::Read32(current_addr));
|
WriteReg(header.method + i, header.subchannel, Memory::Read32(current_addr),
|
||||||
|
header.arg_count - i - 1);
|
||||||
current_addr += sizeof(u32);
|
current_addr += sizeof(u32);
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
|
@ -116,31 +113,31 @@ void GPU::ProcessCommandList(GPUVAddr address, u32 size) {
|
||||||
case SubmissionMode::NonIncreasing: {
|
case SubmissionMode::NonIncreasing: {
|
||||||
// Use the same method value for all arguments.
|
// Use the same method value for all arguments.
|
||||||
for (unsigned i = 0; i < header.arg_count; ++i) {
|
for (unsigned i = 0; i < header.arg_count; ++i) {
|
||||||
WriteReg(header.method, header.subchannel, Memory::Read32(current_addr));
|
WriteReg(header.method, header.subchannel, Memory::Read32(current_addr),
|
||||||
|
header.arg_count - i - 1);
|
||||||
current_addr += sizeof(u32);
|
current_addr += sizeof(u32);
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case SubmissionMode::IncreaseOnce: {
|
case SubmissionMode::IncreaseOnce: {
|
||||||
ASSERT(header.arg_count.Value() >= 1);
|
ASSERT(header.arg_count.Value() >= 1);
|
||||||
|
|
||||||
// Use the original method for the first argument and then the next method for all other
|
// Use the original method for the first argument and then the next method for all other
|
||||||
// arguments.
|
// arguments.
|
||||||
|
WriteReg(header.method, header.subchannel, Memory::Read32(current_addr),
|
||||||
|
header.arg_count - 1);
|
||||||
|
current_addr += sizeof(u32);
|
||||||
|
|
||||||
// Process this command as a method call instead of a register write. Gather
|
for (unsigned i = 1; i < header.arg_count; ++i) {
|
||||||
// all the parameters first and then pass them at once to the CallMethod function.
|
WriteReg(header.method + 1, header.subchannel, Memory::Read32(current_addr),
|
||||||
std::vector<u32> parameters(header.arg_count);
|
header.arg_count - i - 1);
|
||||||
|
|
||||||
for (unsigned i = 0; i < header.arg_count; ++i) {
|
|
||||||
parameters[i] = Memory::Read32(current_addr);
|
|
||||||
current_addr += sizeof(u32);
|
current_addr += sizeof(u32);
|
||||||
}
|
}
|
||||||
|
|
||||||
CallMethod(header.method, header.subchannel, parameters);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case SubmissionMode::Inline: {
|
case SubmissionMode::Inline: {
|
||||||
// The register value is stored in the bits 16-28 as an immediate
|
// The register value is stored in the bits 16-28 as an immediate
|
||||||
WriteReg(header.method, header.subchannel, header.inline_data);
|
WriteReg(header.method, header.subchannel, header.inline_data, 0);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
default:
|
default:
|
||||||
|
|
|
@ -8,7 +8,6 @@ namespace Tegra {
|
||||||
namespace Engines {
|
namespace Engines {
|
||||||
|
|
||||||
void Fermi2D::WriteReg(u32 method, u32 value) {}
|
void Fermi2D::WriteReg(u32 method, u32 value) {}
|
||||||
void Fermi2D::CallMethod(u32 method, const std::vector<u32>& parameters) {}
|
|
||||||
|
|
||||||
} // namespace Engines
|
} // namespace Engines
|
||||||
} // namespace Tegra
|
} // namespace Tegra
|
||||||
|
|
|
@ -4,7 +4,6 @@
|
||||||
|
|
||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
#include <vector>
|
|
||||||
#include "common/common_types.h"
|
#include "common/common_types.h"
|
||||||
|
|
||||||
namespace Tegra {
|
namespace Tegra {
|
||||||
|
@ -17,13 +16,6 @@ public:
|
||||||
|
|
||||||
/// Write the value to the register identified by method.
|
/// Write the value to the register identified by method.
|
||||||
void WriteReg(u32 method, u32 value);
|
void WriteReg(u32 method, u32 value);
|
||||||
|
|
||||||
/**
|
|
||||||
* Handles a method call to this engine.
|
|
||||||
* @param method Method to call
|
|
||||||
* @param parameters Arguments to the method call
|
|
||||||
*/
|
|
||||||
void CallMethod(u32 method, const std::vector<u32>& parameters);
|
|
||||||
};
|
};
|
||||||
|
|
||||||
} // namespace Engines
|
} // namespace Engines
|
||||||
|
|
|
@ -8,28 +8,68 @@
|
||||||
namespace Tegra {
|
namespace Tegra {
|
||||||
namespace Engines {
|
namespace Engines {
|
||||||
|
|
||||||
|
/// First register id that is actually a Macro call.
|
||||||
|
constexpr u32 MacroRegistersStart = 0xE00;
|
||||||
|
|
||||||
const std::unordered_map<u32, Maxwell3D::MethodInfo> Maxwell3D::method_handlers = {
|
const std::unordered_map<u32, Maxwell3D::MethodInfo> Maxwell3D::method_handlers = {
|
||||||
{0xE24, {"SetShader", 5, &Maxwell3D::SetShader}},
|
{0xE24, {"SetShader", 5, &Maxwell3D::SetShader}},
|
||||||
};
|
};
|
||||||
|
|
||||||
Maxwell3D::Maxwell3D(MemoryManager& memory_manager) : memory_manager(memory_manager) {}
|
Maxwell3D::Maxwell3D(MemoryManager& memory_manager) : memory_manager(memory_manager) {}
|
||||||
|
|
||||||
void Maxwell3D::CallMethod(u32 method, const std::vector<u32>& parameters) {
|
void Maxwell3D::SubmitMacroCode(u32 entry, std::vector<u32> code) {
|
||||||
// TODO(Subv): Write an interpreter for the macros uploaded via registers 0x45 and 0x47
|
uploaded_macros[entry * 2 + MacroRegistersStart] = std::move(code);
|
||||||
auto itr = method_handlers.find(method);
|
|
||||||
if (itr == method_handlers.end()) {
|
|
||||||
LOG_ERROR(HW_GPU, "Unhandled method call %08X", method);
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
ASSERT(itr->second.arguments == parameters.size());
|
|
||||||
(this->*itr->second.handler)(parameters);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void Maxwell3D::WriteReg(u32 method, u32 value) {
|
void Maxwell3D::CallMacroMethod(u32 method, const std::vector<u32>& parameters) {
|
||||||
|
// TODO(Subv): Write an interpreter for the macros uploaded via registers 0x45 and 0x47
|
||||||
|
|
||||||
|
// The requested macro must have been uploaded already.
|
||||||
|
ASSERT_MSG(uploaded_macros.find(method) != uploaded_macros.end(), "Macro %08X was not uploaded",
|
||||||
|
method);
|
||||||
|
|
||||||
|
auto itr = method_handlers.find(method);
|
||||||
|
ASSERT_MSG(itr != method_handlers.end(), "Unhandled method call %08X", method);
|
||||||
|
|
||||||
|
ASSERT(itr->second.arguments == parameters.size());
|
||||||
|
|
||||||
|
(this->*itr->second.handler)(parameters);
|
||||||
|
|
||||||
|
// Reset the current macro and its parameters.
|
||||||
|
executing_macro = 0;
|
||||||
|
macro_params.clear();
|
||||||
|
}
|
||||||
|
|
||||||
|
void Maxwell3D::WriteReg(u32 method, u32 value, u32 remaining_params) {
|
||||||
ASSERT_MSG(method < Regs::NUM_REGS,
|
ASSERT_MSG(method < Regs::NUM_REGS,
|
||||||
"Invalid Maxwell3D register, increase the size of the Regs structure");
|
"Invalid Maxwell3D register, increase the size of the Regs structure");
|
||||||
|
|
||||||
|
// It is an error to write to a register other than the current macro's ARG register before it
|
||||||
|
// has finished execution.
|
||||||
|
if (executing_macro != 0) {
|
||||||
|
ASSERT(method == executing_macro + 1);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Methods after 0xE00 are special, they're actually triggers for some microcode that was
|
||||||
|
// uploaded to the GPU during initialization.
|
||||||
|
if (method >= MacroRegistersStart) {
|
||||||
|
// We're trying to execute a macro
|
||||||
|
if (executing_macro == 0) {
|
||||||
|
// A macro call must begin by writing the macro method's register, not its argument.
|
||||||
|
ASSERT_MSG((method % 2) == 0,
|
||||||
|
"Can't start macro execution by writing to the ARGS register");
|
||||||
|
executing_macro = method;
|
||||||
|
}
|
||||||
|
|
||||||
|
macro_params.push_back(value);
|
||||||
|
|
||||||
|
// Call the macro when there are no more parameters in the command buffer
|
||||||
|
if (remaining_params == 0) {
|
||||||
|
CallMacroMethod(executing_macro, macro_params);
|
||||||
|
}
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
regs.reg_array[method] = value;
|
regs.reg_array[method] = value;
|
||||||
|
|
||||||
#define MAXWELL3D_REG_INDEX(field_name) (offsetof(Regs, field_name) / sizeof(u32))
|
#define MAXWELL3D_REG_INDEX(field_name) (offsetof(Regs, field_name) / sizeof(u32))
|
||||||
|
|
|
@ -21,14 +21,10 @@ public:
|
||||||
~Maxwell3D() = default;
|
~Maxwell3D() = default;
|
||||||
|
|
||||||
/// Write the value to the register identified by method.
|
/// Write the value to the register identified by method.
|
||||||
void WriteReg(u32 method, u32 value);
|
void WriteReg(u32 method, u32 value, u32 remaining_params);
|
||||||
|
|
||||||
/**
|
/// Uploads the code for a GPU macro program associated with the specified entry.
|
||||||
* Handles a method call to this engine.
|
void SubmitMacroCode(u32 entry, std::vector<u32> code);
|
||||||
* @param method Method to call
|
|
||||||
* @param parameters Arguments to the method call
|
|
||||||
*/
|
|
||||||
void CallMethod(u32 method, const std::vector<u32>& parameters);
|
|
||||||
|
|
||||||
/// Register structure of the Maxwell3D engine.
|
/// Register structure of the Maxwell3D engine.
|
||||||
/// TODO(Subv): This structure will need to be made bigger as more registers are discovered.
|
/// TODO(Subv): This structure will need to be made bigger as more registers are discovered.
|
||||||
|
@ -166,7 +162,11 @@ public:
|
||||||
INSERT_PADDING_WORDS(7);
|
INSERT_PADDING_WORDS(7);
|
||||||
} cb_bind[MaxShaderStage];
|
} cb_bind[MaxShaderStage];
|
||||||
|
|
||||||
INSERT_PADDING_WORDS(0x50A);
|
INSERT_PADDING_WORDS(0x56);
|
||||||
|
|
||||||
|
u32 tex_cb_index;
|
||||||
|
|
||||||
|
INSERT_PADDING_WORDS(0x4B3);
|
||||||
};
|
};
|
||||||
std::array<u32, NUM_REGS> reg_array;
|
std::array<u32, NUM_REGS> reg_array;
|
||||||
};
|
};
|
||||||
|
@ -201,6 +201,20 @@ public:
|
||||||
private:
|
private:
|
||||||
MemoryManager& memory_manager;
|
MemoryManager& memory_manager;
|
||||||
|
|
||||||
|
std::unordered_map<u32, std::vector<u32>> uploaded_macros;
|
||||||
|
|
||||||
|
/// Macro method that is currently being executed / being fed parameters.
|
||||||
|
u32 executing_macro = 0;
|
||||||
|
/// Parameters that have been submitted to the macro call so far.
|
||||||
|
std::vector<u32> macro_params;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Call a macro on this engine.
|
||||||
|
* @param method Method to call
|
||||||
|
* @param parameters Arguments to the method call
|
||||||
|
*/
|
||||||
|
void CallMacroMethod(u32 method, const std::vector<u32>& parameters);
|
||||||
|
|
||||||
/// Handles a write to the QUERY_GET register.
|
/// Handles a write to the QUERY_GET register.
|
||||||
void ProcessQueryGet();
|
void ProcessQueryGet();
|
||||||
|
|
||||||
|
@ -234,6 +248,7 @@ ASSERT_REG_POSITION(vertex_array_limit[0], 0x7C0);
|
||||||
ASSERT_REG_POSITION(shader_config[0], 0x800);
|
ASSERT_REG_POSITION(shader_config[0], 0x800);
|
||||||
ASSERT_REG_POSITION(const_buffer, 0x8E0);
|
ASSERT_REG_POSITION(const_buffer, 0x8E0);
|
||||||
ASSERT_REG_POSITION(cb_bind[0], 0x904);
|
ASSERT_REG_POSITION(cb_bind[0], 0x904);
|
||||||
|
ASSERT_REG_POSITION(tex_cb_index, 0x982);
|
||||||
|
|
||||||
#undef ASSERT_REG_POSITION
|
#undef ASSERT_REG_POSITION
|
||||||
|
|
||||||
|
|
|
@ -8,7 +8,6 @@ namespace Tegra {
|
||||||
namespace Engines {
|
namespace Engines {
|
||||||
|
|
||||||
void MaxwellCompute::WriteReg(u32 method, u32 value) {}
|
void MaxwellCompute::WriteReg(u32 method, u32 value) {}
|
||||||
void MaxwellCompute::CallMethod(u32 method, const std::vector<u32>& parameters) {}
|
|
||||||
|
|
||||||
} // namespace Engines
|
} // namespace Engines
|
||||||
} // namespace Tegra
|
} // namespace Tegra
|
||||||
|
|
|
@ -4,7 +4,6 @@
|
||||||
|
|
||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
#include <vector>
|
|
||||||
#include "common/common_types.h"
|
#include "common/common_types.h"
|
||||||
|
|
||||||
namespace Tegra {
|
namespace Tegra {
|
||||||
|
@ -17,13 +16,6 @@ public:
|
||||||
|
|
||||||
/// Write the value to the register identified by method.
|
/// Write the value to the register identified by method.
|
||||||
void WriteReg(u32 method, u32 value);
|
void WriteReg(u32 method, u32 value);
|
||||||
|
|
||||||
/**
|
|
||||||
* Handles a method call to this engine.
|
|
||||||
* @param method Method to call
|
|
||||||
* @param parameters Arguments to the method call
|
|
||||||
*/
|
|
||||||
void CallMethod(u32 method, const std::vector<u32>& parameters);
|
|
||||||
};
|
};
|
||||||
|
|
||||||
} // namespace Engines
|
} // namespace Engines
|
||||||
|
|
|
@ -6,6 +6,7 @@
|
||||||
|
|
||||||
#include <memory>
|
#include <memory>
|
||||||
#include <unordered_map>
|
#include <unordered_map>
|
||||||
|
#include <vector>
|
||||||
#include "common/common_types.h"
|
#include "common/common_types.h"
|
||||||
#include "video_core/engines/fermi_2d.h"
|
#include "video_core/engines/fermi_2d.h"
|
||||||
#include "video_core/engines/maxwell_3d.h"
|
#include "video_core/engines/maxwell_3d.h"
|
||||||
|
@ -38,11 +39,10 @@ public:
|
||||||
std::unique_ptr<MemoryManager> memory_manager;
|
std::unique_ptr<MemoryManager> memory_manager;
|
||||||
|
|
||||||
private:
|
private:
|
||||||
/// Writes a single register in the engine bound to the specified subchannel
|
static constexpr u32 InvalidGraphMacroEntry = 0xFFFFFFFF;
|
||||||
void WriteReg(u32 method, u32 subchannel, u32 value);
|
|
||||||
|
|
||||||
/// Calls a method in the engine bound to the specified subchannel with the input parameters.
|
/// Writes a single register in the engine bound to the specified subchannel
|
||||||
void CallMethod(u32 method, u32 subchannel, const std::vector<u32>& parameters);
|
void WriteReg(u32 method, u32 subchannel, u32 value, u32 remaining_params);
|
||||||
|
|
||||||
/// Mapping of command subchannels to their bound engine ids.
|
/// Mapping of command subchannels to their bound engine ids.
|
||||||
std::unordered_map<u32, EngineID> bound_engines;
|
std::unordered_map<u32, EngineID> bound_engines;
|
||||||
|
@ -53,6 +53,11 @@ private:
|
||||||
std::unique_ptr<Engines::Fermi2D> fermi_2d;
|
std::unique_ptr<Engines::Fermi2D> fermi_2d;
|
||||||
/// Compute engine
|
/// Compute engine
|
||||||
std::unique_ptr<Engines::MaxwellCompute> maxwell_compute;
|
std::unique_ptr<Engines::MaxwellCompute> maxwell_compute;
|
||||||
|
|
||||||
|
/// Entry of the macro that is currently being uploaded
|
||||||
|
u32 current_macro_entry = InvalidGraphMacroEntry;
|
||||||
|
/// Code being uploaded for the current macro
|
||||||
|
std::vector<u32> current_macro_code;
|
||||||
};
|
};
|
||||||
|
|
||||||
} // namespace Tegra
|
} // namespace Tegra
|
||||||
|
|
Loading…
Reference in a new issue