forked from suyu/suyu
MacroHLE: Add Index Buffer size estimation.
This commit is contained in:
parent
c541559767
commit
93ac5a6a6d
5 changed files with 74 additions and 10 deletions
|
@ -179,6 +179,13 @@ u32 Maxwell3D::GetMaxCurrentVertices() {
|
||||||
return num_vertices;
|
return num_vertices;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
size_t Maxwell3D::EstimateIndexBufferSize() {
|
||||||
|
GPUVAddr start_address = regs.index_buffer.StartAddress();
|
||||||
|
GPUVAddr end_address = regs.index_buffer.EndAddress();
|
||||||
|
return std::min<size_t>(memory_manager.GetMemoryLayoutSize(start_address),
|
||||||
|
static_cast<size_t>(end_address - start_address));
|
||||||
|
}
|
||||||
|
|
||||||
u32 Maxwell3D::ProcessShadowRam(u32 method, u32 argument) {
|
u32 Maxwell3D::ProcessShadowRam(u32 method, u32 argument) {
|
||||||
// Keep track of the register value in shadow_state when requested.
|
// Keep track of the register value in shadow_state when requested.
|
||||||
const auto control = shadow_state.shadow_ram_control;
|
const auto control = shadow_state.shadow_ram_control;
|
||||||
|
|
|
@ -3077,6 +3077,8 @@ public:
|
||||||
|
|
||||||
u32 GetMaxCurrentVertices();
|
u32 GetMaxCurrentVertices();
|
||||||
|
|
||||||
|
size_t EstimateIndexBufferSize();
|
||||||
|
|
||||||
/// Handles a write to the CLEAR_BUFFERS register.
|
/// Handles a write to the CLEAR_BUFFERS register.
|
||||||
void ProcessClearBuffers(u32 layer_count);
|
void ProcessClearBuffers(u32 layer_count);
|
||||||
|
|
||||||
|
|
|
@ -163,12 +163,16 @@ public:
|
||||||
maxwell3d.RefreshParameters();
|
maxwell3d.RefreshParameters();
|
||||||
minimum_limit = std::max(parameters[3], minimum_limit);
|
minimum_limit = std::max(parameters[3], minimum_limit);
|
||||||
}
|
}
|
||||||
|
const u32 estimate = static_cast<u32>(maxwell3d.EstimateIndexBufferSize());
|
||||||
const u32 base_vertex = parameters[8];
|
const u32 base_size = std::max(minimum_limit, estimate);
|
||||||
const u32 base_instance = parameters[9];
|
const u32 element_base = parameters[4];
|
||||||
maxwell3d.regs.vertex_id_base = base_vertex;
|
const u32 base_instance = parameters[5];
|
||||||
|
maxwell3d.regs.index_buffer.first = 0;
|
||||||
|
maxwell3d.regs.index_buffer.count = base_size; // Use a fixed size, just for mapping
|
||||||
|
maxwell3d.regs.draw.topology.Assign(topology);
|
||||||
|
maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
|
||||||
maxwell3d.CallMethod(0x8e3, 0x640, true);
|
maxwell3d.CallMethod(0x8e3, 0x640, true);
|
||||||
maxwell3d.CallMethod(0x8e4, base_vertex, true);
|
maxwell3d.CallMethod(0x8e4, element_base, true);
|
||||||
maxwell3d.CallMethod(0x8e5, base_instance, true);
|
maxwell3d.CallMethod(0x8e5, base_instance, true);
|
||||||
auto& params = maxwell3d.draw_manager->GetIndirectParams();
|
auto& params = maxwell3d.draw_manager->GetIndirectParams();
|
||||||
params.is_indexed = true;
|
params.is_indexed = true;
|
||||||
|
@ -179,7 +183,7 @@ public:
|
||||||
params.max_draw_counts = 1;
|
params.max_draw_counts = 1;
|
||||||
params.stride = 0;
|
params.stride = 0;
|
||||||
maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
|
maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
|
||||||
maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, minimum_limit);
|
maxwell3d.draw_manager->DrawIndexedIndirect(topology, 0, base_size);
|
||||||
maxwell3d.CallMethod(0x8e3, 0x640, true);
|
maxwell3d.CallMethod(0x8e3, 0x640, true);
|
||||||
maxwell3d.CallMethod(0x8e4, 0x0, true);
|
maxwell3d.CallMethod(0x8e4, 0x0, true);
|
||||||
maxwell3d.CallMethod(0x8e5, 0x0, true);
|
maxwell3d.CallMethod(0x8e5, 0x0, true);
|
||||||
|
@ -271,9 +275,11 @@ public:
|
||||||
if (check_limit) {
|
if (check_limit) {
|
||||||
minimum_limit = std::max(highest_limit, minimum_limit);
|
minimum_limit = std::max(highest_limit, minimum_limit);
|
||||||
}
|
}
|
||||||
|
const u32 estimate = static_cast<u32>(maxwell3d.EstimateIndexBufferSize());
|
||||||
|
const u32 base_size = std::max(minimum_limit, estimate);
|
||||||
|
|
||||||
maxwell3d.regs.index_buffer.first = 0;
|
maxwell3d.regs.index_buffer.first = 0;
|
||||||
maxwell3d.regs.index_buffer.count = std::max(highest_limit, minimum_limit);
|
maxwell3d.regs.index_buffer.count = std::max(highest_limit, base_size);
|
||||||
maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
|
maxwell3d.dirty.flags[VideoCommon::Dirty::IndexBuffer] = true;
|
||||||
auto& params = maxwell3d.draw_manager->GetIndirectParams();
|
auto& params = maxwell3d.draw_manager->GetIndirectParams();
|
||||||
params.is_indexed = true;
|
params.is_indexed = true;
|
||||||
|
|
|
@ -325,9 +325,15 @@ template <bool is_big_pages, typename FuncMapped, typename FuncReserved, typenam
|
||||||
inline void MemoryManager::MemoryOperation(GPUVAddr gpu_src_addr, std::size_t size,
|
inline void MemoryManager::MemoryOperation(GPUVAddr gpu_src_addr, std::size_t size,
|
||||||
FuncMapped&& func_mapped, FuncReserved&& func_reserved,
|
FuncMapped&& func_mapped, FuncReserved&& func_reserved,
|
||||||
FuncUnmapped&& func_unmapped) const {
|
FuncUnmapped&& func_unmapped) const {
|
||||||
static constexpr bool BOOL_BREAK_MAPPED = std::is_same_v<FuncMapped, bool>;
|
using FuncMappedReturn =
|
||||||
static constexpr bool BOOL_BREAK_RESERVED = std::is_same_v<FuncReserved, bool>;
|
typename std::invoke_result<FuncMapped, std::size_t, std::size_t, std::size_t>::type;
|
||||||
static constexpr bool BOOL_BREAK_UNMAPPED = std::is_same_v<FuncUnmapped, bool>;
|
using FuncReservedReturn =
|
||||||
|
typename std::invoke_result<FuncReserved, std::size_t, std::size_t, std::size_t>::type;
|
||||||
|
using FuncUnmappedReturn =
|
||||||
|
typename std::invoke_result<FuncUnmapped, std::size_t, std::size_t, std::size_t>::type;
|
||||||
|
static constexpr bool BOOL_BREAK_MAPPED = std::is_same_v<FuncMappedReturn, bool>;
|
||||||
|
static constexpr bool BOOL_BREAK_RESERVED = std::is_same_v<FuncReservedReturn, bool>;
|
||||||
|
static constexpr bool BOOL_BREAK_UNMAPPED = std::is_same_v<FuncUnmappedReturn, bool>;
|
||||||
u64 used_page_size;
|
u64 used_page_size;
|
||||||
u64 used_page_mask;
|
u64 used_page_mask;
|
||||||
u64 used_page_bits;
|
u64 used_page_bits;
|
||||||
|
@ -571,6 +577,47 @@ size_t MemoryManager::MaxContinousRange(GPUVAddr gpu_addr, size_t size) const {
|
||||||
return range_so_far;
|
return range_so_far;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
size_t MemoryManager::GetMemoryLayoutSize(GPUVAddr gpu_addr) const {
|
||||||
|
PTEKind base_kind = GetPageKind(gpu_addr);
|
||||||
|
if (base_kind == PTEKind::INVALID) {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
size_t range_so_far = 0;
|
||||||
|
bool result{false};
|
||||||
|
auto fail = [&]([[maybe_unused]] std::size_t page_index, [[maybe_unused]] std::size_t offset,
|
||||||
|
std::size_t copy_amount) {
|
||||||
|
result = true;
|
||||||
|
return true;
|
||||||
|
};
|
||||||
|
auto short_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) {
|
||||||
|
PTEKind base_kind_other = GetKind<false>((page_index << page_bits) + offset);
|
||||||
|
if (base_kind != base_kind_other) {
|
||||||
|
result = true;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
range_so_far += copy_amount;
|
||||||
|
return false;
|
||||||
|
};
|
||||||
|
auto big_check = [&](std::size_t page_index, std::size_t offset, std::size_t copy_amount) {
|
||||||
|
PTEKind base_kind_other = GetKind<true>((page_index << big_page_bits) + offset);
|
||||||
|
if (base_kind != base_kind_other) {
|
||||||
|
result = true;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
range_so_far += copy_amount;
|
||||||
|
return false;
|
||||||
|
};
|
||||||
|
auto check_short_pages = [&](std::size_t page_index, std::size_t offset,
|
||||||
|
std::size_t copy_amount) {
|
||||||
|
GPUVAddr base = (page_index << big_page_bits) + offset;
|
||||||
|
MemoryOperation<false>(base, copy_amount, short_check, fail, fail);
|
||||||
|
return result;
|
||||||
|
};
|
||||||
|
MemoryOperation<true>(gpu_addr, address_space_size - gpu_addr, big_check, fail,
|
||||||
|
check_short_pages);
|
||||||
|
return range_so_far;
|
||||||
|
}
|
||||||
|
|
||||||
void MemoryManager::InvalidateRegion(GPUVAddr gpu_addr, size_t size) const {
|
void MemoryManager::InvalidateRegion(GPUVAddr gpu_addr, size_t size) const {
|
||||||
auto do_nothing = [&]([[maybe_unused]] std::size_t page_index,
|
auto do_nothing = [&]([[maybe_unused]] std::size_t page_index,
|
||||||
[[maybe_unused]] std::size_t offset,
|
[[maybe_unused]] std::size_t offset,
|
||||||
|
|
|
@ -118,6 +118,8 @@ public:
|
||||||
|
|
||||||
PTEKind GetPageKind(GPUVAddr gpu_addr) const;
|
PTEKind GetPageKind(GPUVAddr gpu_addr) const;
|
||||||
|
|
||||||
|
size_t GetMemoryLayoutSize(GPUVAddr gpu_addr) const;
|
||||||
|
|
||||||
private:
|
private:
|
||||||
template <bool is_big_pages, typename FuncMapped, typename FuncReserved, typename FuncUnmapped>
|
template <bool is_big_pages, typename FuncMapped, typename FuncReserved, typename FuncUnmapped>
|
||||||
inline void MemoryOperation(GPUVAddr gpu_src_addr, std::size_t size, FuncMapped&& func_mapped,
|
inline void MemoryOperation(GPUVAddr gpu_src_addr, std::size_t size, FuncMapped&& func_mapped,
|
||||||
|
|
Loading…
Reference in a new issue