Merge pull request #2783 from FernandoS27/new-buffer-cache
Implement a New LLE Buffer Cache
This commit is contained in:
commit
e424615839
9 changed files with 684 additions and 330 deletions
|
@ -1,5 +1,7 @@
|
||||||
add_library(video_core STATIC
|
add_library(video_core STATIC
|
||||||
buffer_cache.h
|
buffer_cache/buffer_block.h
|
||||||
|
buffer_cache/buffer_cache.h
|
||||||
|
buffer_cache/map_interval.h
|
||||||
dma_pusher.cpp
|
dma_pusher.cpp
|
||||||
dma_pusher.h
|
dma_pusher.h
|
||||||
debug_utils/debug_utils.cpp
|
debug_utils/debug_utils.cpp
|
||||||
|
|
|
@ -1,299 +0,0 @@
|
||||||
// Copyright 2019 yuzu Emulator Project
|
|
||||||
// Licensed under GPLv2 or any later version
|
|
||||||
// Refer to the license.txt file included.
|
|
||||||
|
|
||||||
#pragma once
|
|
||||||
|
|
||||||
#include <array>
|
|
||||||
#include <memory>
|
|
||||||
#include <mutex>
|
|
||||||
#include <unordered_map>
|
|
||||||
#include <unordered_set>
|
|
||||||
#include <utility>
|
|
||||||
#include <vector>
|
|
||||||
|
|
||||||
#include "common/alignment.h"
|
|
||||||
#include "common/common_types.h"
|
|
||||||
#include "core/core.h"
|
|
||||||
#include "video_core/memory_manager.h"
|
|
||||||
#include "video_core/rasterizer_cache.h"
|
|
||||||
|
|
||||||
namespace VideoCore {
|
|
||||||
class RasterizerInterface;
|
|
||||||
}
|
|
||||||
|
|
||||||
namespace VideoCommon {
|
|
||||||
|
|
||||||
template <typename BufferStorageType>
|
|
||||||
class CachedBuffer final : public RasterizerCacheObject {
|
|
||||||
public:
|
|
||||||
explicit CachedBuffer(VAddr cpu_addr, u8* host_ptr)
|
|
||||||
: RasterizerCacheObject{host_ptr}, host_ptr{host_ptr}, cpu_addr{cpu_addr} {}
|
|
||||||
~CachedBuffer() override = default;
|
|
||||||
|
|
||||||
VAddr GetCpuAddr() const override {
|
|
||||||
return cpu_addr;
|
|
||||||
}
|
|
||||||
|
|
||||||
std::size_t GetSizeInBytes() const override {
|
|
||||||
return size;
|
|
||||||
}
|
|
||||||
|
|
||||||
u8* GetWritableHostPtr() const {
|
|
||||||
return host_ptr;
|
|
||||||
}
|
|
||||||
|
|
||||||
std::size_t GetSize() const {
|
|
||||||
return size;
|
|
||||||
}
|
|
||||||
|
|
||||||
std::size_t GetCapacity() const {
|
|
||||||
return capacity;
|
|
||||||
}
|
|
||||||
|
|
||||||
bool IsInternalized() const {
|
|
||||||
return is_internal;
|
|
||||||
}
|
|
||||||
|
|
||||||
const BufferStorageType& GetBuffer() const {
|
|
||||||
return buffer;
|
|
||||||
}
|
|
||||||
|
|
||||||
void SetSize(std::size_t new_size) {
|
|
||||||
size = new_size;
|
|
||||||
}
|
|
||||||
|
|
||||||
void SetInternalState(bool is_internal_) {
|
|
||||||
is_internal = is_internal_;
|
|
||||||
}
|
|
||||||
|
|
||||||
BufferStorageType ExchangeBuffer(BufferStorageType buffer_, std::size_t new_capacity) {
|
|
||||||
capacity = new_capacity;
|
|
||||||
std::swap(buffer, buffer_);
|
|
||||||
return buffer_;
|
|
||||||
}
|
|
||||||
|
|
||||||
private:
|
|
||||||
u8* host_ptr{};
|
|
||||||
VAddr cpu_addr{};
|
|
||||||
std::size_t size{};
|
|
||||||
std::size_t capacity{};
|
|
||||||
bool is_internal{};
|
|
||||||
BufferStorageType buffer;
|
|
||||||
};
|
|
||||||
|
|
||||||
template <typename BufferStorageType, typename BufferType, typename StreamBuffer>
|
|
||||||
class BufferCache : public RasterizerCache<std::shared_ptr<CachedBuffer<BufferStorageType>>> {
|
|
||||||
public:
|
|
||||||
using Buffer = std::shared_ptr<CachedBuffer<BufferStorageType>>;
|
|
||||||
using BufferInfo = std::pair<const BufferType*, u64>;
|
|
||||||
|
|
||||||
explicit BufferCache(VideoCore::RasterizerInterface& rasterizer, Core::System& system,
|
|
||||||
std::unique_ptr<StreamBuffer> stream_buffer)
|
|
||||||
: RasterizerCache<Buffer>{rasterizer}, system{system},
|
|
||||||
stream_buffer{std::move(stream_buffer)}, stream_buffer_handle{
|
|
||||||
this->stream_buffer->GetHandle()} {}
|
|
||||||
~BufferCache() = default;
|
|
||||||
|
|
||||||
void Unregister(const Buffer& entry) override {
|
|
||||||
std::lock_guard lock{RasterizerCache<Buffer>::mutex};
|
|
||||||
if (entry->IsInternalized()) {
|
|
||||||
internalized_entries.erase(entry->GetCacheAddr());
|
|
||||||
}
|
|
||||||
ReserveBuffer(entry);
|
|
||||||
RasterizerCache<Buffer>::Unregister(entry);
|
|
||||||
}
|
|
||||||
|
|
||||||
void TickFrame() {
|
|
||||||
marked_for_destruction_index =
|
|
||||||
(marked_for_destruction_index + 1) % marked_for_destruction_ring_buffer.size();
|
|
||||||
MarkedForDestruction().clear();
|
|
||||||
}
|
|
||||||
|
|
||||||
BufferInfo UploadMemory(GPUVAddr gpu_addr, std::size_t size, std::size_t alignment = 4,
|
|
||||||
bool internalize = false, bool is_written = false) {
|
|
||||||
std::lock_guard lock{RasterizerCache<Buffer>::mutex};
|
|
||||||
|
|
||||||
auto& memory_manager = system.GPU().MemoryManager();
|
|
||||||
const auto host_ptr = memory_manager.GetPointer(gpu_addr);
|
|
||||||
if (!host_ptr) {
|
|
||||||
return {GetEmptyBuffer(size), 0};
|
|
||||||
}
|
|
||||||
const auto cache_addr = ToCacheAddr(host_ptr);
|
|
||||||
|
|
||||||
// Cache management is a big overhead, so only cache entries with a given size.
|
|
||||||
// TODO: Figure out which size is the best for given games.
|
|
||||||
constexpr std::size_t max_stream_size = 0x800;
|
|
||||||
if (!internalize && size < max_stream_size &&
|
|
||||||
internalized_entries.find(cache_addr) == internalized_entries.end()) {
|
|
||||||
return StreamBufferUpload(host_ptr, size, alignment);
|
|
||||||
}
|
|
||||||
|
|
||||||
auto entry = RasterizerCache<Buffer>::TryGet(cache_addr);
|
|
||||||
if (!entry) {
|
|
||||||
return FixedBufferUpload(gpu_addr, host_ptr, size, internalize, is_written);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (entry->GetSize() < size) {
|
|
||||||
IncreaseBufferSize(entry, size);
|
|
||||||
}
|
|
||||||
if (is_written) {
|
|
||||||
entry->MarkAsModified(true, *this);
|
|
||||||
}
|
|
||||||
return {ToHandle(entry->GetBuffer()), 0};
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Uploads from a host memory. Returns the OpenGL buffer where it's located and its offset.
|
|
||||||
BufferInfo UploadHostMemory(const void* raw_pointer, std::size_t size,
|
|
||||||
std::size_t alignment = 4) {
|
|
||||||
std::lock_guard lock{RasterizerCache<Buffer>::mutex};
|
|
||||||
return StreamBufferUpload(raw_pointer, size, alignment);
|
|
||||||
}
|
|
||||||
|
|
||||||
void Map(std::size_t max_size) {
|
|
||||||
std::tie(buffer_ptr, buffer_offset_base, invalidated) = stream_buffer->Map(max_size, 4);
|
|
||||||
buffer_offset = buffer_offset_base;
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Finishes the upload stream, returns true on bindings invalidation.
|
|
||||||
bool Unmap() {
|
|
||||||
stream_buffer->Unmap(buffer_offset - buffer_offset_base);
|
|
||||||
return std::exchange(invalidated, false);
|
|
||||||
}
|
|
||||||
|
|
||||||
virtual const BufferType* GetEmptyBuffer(std::size_t size) = 0;
|
|
||||||
|
|
||||||
protected:
|
|
||||||
void FlushObjectInner(const Buffer& entry) override {
|
|
||||||
DownloadBufferData(entry->GetBuffer(), 0, entry->GetSize(), entry->GetWritableHostPtr());
|
|
||||||
}
|
|
||||||
|
|
||||||
virtual BufferStorageType CreateBuffer(std::size_t size) = 0;
|
|
||||||
|
|
||||||
virtual const BufferType* ToHandle(const BufferStorageType& storage) = 0;
|
|
||||||
|
|
||||||
virtual void UploadBufferData(const BufferStorageType& buffer, std::size_t offset,
|
|
||||||
std::size_t size, const u8* data) = 0;
|
|
||||||
|
|
||||||
virtual void DownloadBufferData(const BufferStorageType& buffer, std::size_t offset,
|
|
||||||
std::size_t size, u8* data) = 0;
|
|
||||||
|
|
||||||
virtual void CopyBufferData(const BufferStorageType& src, const BufferStorageType& dst,
|
|
||||||
std::size_t src_offset, std::size_t dst_offset,
|
|
||||||
std::size_t size) = 0;
|
|
||||||
|
|
||||||
private:
|
|
||||||
BufferInfo StreamBufferUpload(const void* raw_pointer, std::size_t size,
|
|
||||||
std::size_t alignment) {
|
|
||||||
AlignBuffer(alignment);
|
|
||||||
const std::size_t uploaded_offset = buffer_offset;
|
|
||||||
std::memcpy(buffer_ptr, raw_pointer, size);
|
|
||||||
|
|
||||||
buffer_ptr += size;
|
|
||||||
buffer_offset += size;
|
|
||||||
return {&stream_buffer_handle, uploaded_offset};
|
|
||||||
}
|
|
||||||
|
|
||||||
BufferInfo FixedBufferUpload(GPUVAddr gpu_addr, u8* host_ptr, std::size_t size,
|
|
||||||
bool internalize, bool is_written) {
|
|
||||||
auto& memory_manager = Core::System::GetInstance().GPU().MemoryManager();
|
|
||||||
const auto cpu_addr = memory_manager.GpuToCpuAddress(gpu_addr);
|
|
||||||
ASSERT(cpu_addr);
|
|
||||||
|
|
||||||
auto entry = GetUncachedBuffer(*cpu_addr, host_ptr);
|
|
||||||
entry->SetSize(size);
|
|
||||||
entry->SetInternalState(internalize);
|
|
||||||
RasterizerCache<Buffer>::Register(entry);
|
|
||||||
|
|
||||||
if (internalize) {
|
|
||||||
internalized_entries.emplace(ToCacheAddr(host_ptr));
|
|
||||||
}
|
|
||||||
if (is_written) {
|
|
||||||
entry->MarkAsModified(true, *this);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (entry->GetCapacity() < size) {
|
|
||||||
MarkedForDestruction().push_back(entry->ExchangeBuffer(CreateBuffer(size), size));
|
|
||||||
}
|
|
||||||
|
|
||||||
UploadBufferData(entry->GetBuffer(), 0, size, host_ptr);
|
|
||||||
return {ToHandle(entry->GetBuffer()), 0};
|
|
||||||
}
|
|
||||||
|
|
||||||
void IncreaseBufferSize(Buffer& entry, std::size_t new_size) {
|
|
||||||
const std::size_t old_size = entry->GetSize();
|
|
||||||
if (entry->GetCapacity() < new_size) {
|
|
||||||
const auto& old_buffer = entry->GetBuffer();
|
|
||||||
auto new_buffer = CreateBuffer(new_size);
|
|
||||||
|
|
||||||
// Copy bits from the old buffer to the new buffer.
|
|
||||||
CopyBufferData(old_buffer, new_buffer, 0, 0, old_size);
|
|
||||||
MarkedForDestruction().push_back(
|
|
||||||
entry->ExchangeBuffer(std::move(new_buffer), new_size));
|
|
||||||
|
|
||||||
// This buffer could have been used
|
|
||||||
invalidated = true;
|
|
||||||
}
|
|
||||||
// Upload the new bits.
|
|
||||||
const std::size_t size_diff = new_size - old_size;
|
|
||||||
UploadBufferData(entry->GetBuffer(), old_size, size_diff, entry->GetHostPtr() + old_size);
|
|
||||||
|
|
||||||
// Update entry's size in the object and in the cache.
|
|
||||||
Unregister(entry);
|
|
||||||
|
|
||||||
entry->SetSize(new_size);
|
|
||||||
RasterizerCache<Buffer>::Register(entry);
|
|
||||||
}
|
|
||||||
|
|
||||||
Buffer GetUncachedBuffer(VAddr cpu_addr, u8* host_ptr) {
|
|
||||||
if (auto entry = TryGetReservedBuffer(host_ptr)) {
|
|
||||||
return entry;
|
|
||||||
}
|
|
||||||
return std::make_shared<CachedBuffer<BufferStorageType>>(cpu_addr, host_ptr);
|
|
||||||
}
|
|
||||||
|
|
||||||
Buffer TryGetReservedBuffer(u8* host_ptr) {
|
|
||||||
const auto it = buffer_reserve.find(ToCacheAddr(host_ptr));
|
|
||||||
if (it == buffer_reserve.end()) {
|
|
||||||
return {};
|
|
||||||
}
|
|
||||||
auto& reserve = it->second;
|
|
||||||
auto entry = reserve.back();
|
|
||||||
reserve.pop_back();
|
|
||||||
return entry;
|
|
||||||
}
|
|
||||||
|
|
||||||
void ReserveBuffer(Buffer entry) {
|
|
||||||
buffer_reserve[entry->GetCacheAddr()].push_back(std::move(entry));
|
|
||||||
}
|
|
||||||
|
|
||||||
void AlignBuffer(std::size_t alignment) {
|
|
||||||
// Align the offset, not the mapped pointer
|
|
||||||
const std::size_t offset_aligned = Common::AlignUp(buffer_offset, alignment);
|
|
||||||
buffer_ptr += offset_aligned - buffer_offset;
|
|
||||||
buffer_offset = offset_aligned;
|
|
||||||
}
|
|
||||||
|
|
||||||
std::vector<BufferStorageType>& MarkedForDestruction() {
|
|
||||||
return marked_for_destruction_ring_buffer[marked_for_destruction_index];
|
|
||||||
}
|
|
||||||
|
|
||||||
Core::System& system;
|
|
||||||
|
|
||||||
std::unique_ptr<StreamBuffer> stream_buffer;
|
|
||||||
BufferType stream_buffer_handle{};
|
|
||||||
|
|
||||||
bool invalidated = false;
|
|
||||||
|
|
||||||
u8* buffer_ptr = nullptr;
|
|
||||||
u64 buffer_offset = 0;
|
|
||||||
u64 buffer_offset_base = 0;
|
|
||||||
|
|
||||||
std::size_t marked_for_destruction_index = 0;
|
|
||||||
std::array<std::vector<BufferStorageType>, 4> marked_for_destruction_ring_buffer;
|
|
||||||
|
|
||||||
std::unordered_set<CacheAddr> internalized_entries;
|
|
||||||
std::unordered_map<CacheAddr, std::vector<Buffer>> buffer_reserve;
|
|
||||||
};
|
|
||||||
|
|
||||||
} // namespace VideoCommon
|
|
77
src/video_core/buffer_cache/buffer_block.h
Normal file
77
src/video_core/buffer_cache/buffer_block.h
Normal file
|
@ -0,0 +1,77 @@
|
||||||
|
// Copyright 2019 yuzu Emulator Project
|
||||||
|
// Licensed under GPLv2 or any later version
|
||||||
|
// Refer to the license.txt file included.
|
||||||
|
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include <unordered_set>
|
||||||
|
#include <utility>
|
||||||
|
|
||||||
|
#include "common/alignment.h"
|
||||||
|
#include "common/common_types.h"
|
||||||
|
#include "video_core/gpu.h"
|
||||||
|
|
||||||
|
namespace VideoCommon {
|
||||||
|
|
||||||
|
class BufferBlock {
|
||||||
|
public:
|
||||||
|
bool Overlaps(const CacheAddr start, const CacheAddr end) const {
|
||||||
|
return (cache_addr < end) && (cache_addr_end > start);
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsInside(const CacheAddr other_start, const CacheAddr other_end) const {
|
||||||
|
return cache_addr <= other_start && other_end <= cache_addr_end;
|
||||||
|
}
|
||||||
|
|
||||||
|
u8* GetWritableHostPtr() const {
|
||||||
|
return FromCacheAddr(cache_addr);
|
||||||
|
}
|
||||||
|
|
||||||
|
u8* GetWritableHostPtr(std::size_t offset) const {
|
||||||
|
return FromCacheAddr(cache_addr + offset);
|
||||||
|
}
|
||||||
|
|
||||||
|
std::size_t GetOffset(const CacheAddr in_addr) {
|
||||||
|
return static_cast<std::size_t>(in_addr - cache_addr);
|
||||||
|
}
|
||||||
|
|
||||||
|
CacheAddr GetCacheAddr() const {
|
||||||
|
return cache_addr;
|
||||||
|
}
|
||||||
|
|
||||||
|
CacheAddr GetCacheAddrEnd() const {
|
||||||
|
return cache_addr_end;
|
||||||
|
}
|
||||||
|
|
||||||
|
void SetCacheAddr(const CacheAddr new_addr) {
|
||||||
|
cache_addr = new_addr;
|
||||||
|
cache_addr_end = new_addr + size;
|
||||||
|
}
|
||||||
|
|
||||||
|
std::size_t GetSize() const {
|
||||||
|
return size;
|
||||||
|
}
|
||||||
|
|
||||||
|
void SetEpoch(u64 new_epoch) {
|
||||||
|
epoch = new_epoch;
|
||||||
|
}
|
||||||
|
|
||||||
|
u64 GetEpoch() {
|
||||||
|
return epoch;
|
||||||
|
}
|
||||||
|
|
||||||
|
protected:
|
||||||
|
explicit BufferBlock(CacheAddr cache_addr, const std::size_t size) : size{size} {
|
||||||
|
SetCacheAddr(cache_addr);
|
||||||
|
}
|
||||||
|
~BufferBlock() = default;
|
||||||
|
|
||||||
|
private:
|
||||||
|
CacheAddr cache_addr{};
|
||||||
|
CacheAddr cache_addr_end{};
|
||||||
|
u64 pages{};
|
||||||
|
std::size_t size{};
|
||||||
|
u64 epoch{};
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace VideoCommon
|
449
src/video_core/buffer_cache/buffer_cache.h
Normal file
449
src/video_core/buffer_cache/buffer_cache.h
Normal file
|
@ -0,0 +1,449 @@
|
||||||
|
// Copyright 2019 yuzu Emulator Project
|
||||||
|
// Licensed under GPLv2 or any later version
|
||||||
|
// Refer to the license.txt file included.
|
||||||
|
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include <array>
|
||||||
|
#include <memory>
|
||||||
|
#include <mutex>
|
||||||
|
#include <unordered_map>
|
||||||
|
#include <unordered_set>
|
||||||
|
#include <utility>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "common/alignment.h"
|
||||||
|
#include "common/common_types.h"
|
||||||
|
#include "core/core.h"
|
||||||
|
#include "video_core/buffer_cache/buffer_block.h"
|
||||||
|
#include "video_core/buffer_cache/map_interval.h"
|
||||||
|
#include "video_core/memory_manager.h"
|
||||||
|
|
||||||
|
namespace VideoCore {
|
||||||
|
class RasterizerInterface;
|
||||||
|
}
|
||||||
|
|
||||||
|
namespace VideoCommon {
|
||||||
|
|
||||||
|
using MapInterval = std::shared_ptr<MapIntervalBase>;
|
||||||
|
|
||||||
|
template <typename TBuffer, typename TBufferType, typename StreamBuffer>
|
||||||
|
class BufferCache {
|
||||||
|
public:
|
||||||
|
using BufferInfo = std::pair<const TBufferType*, u64>;
|
||||||
|
|
||||||
|
BufferInfo UploadMemory(GPUVAddr gpu_addr, std::size_t size, std::size_t alignment = 4,
|
||||||
|
bool is_written = false) {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
|
||||||
|
auto& memory_manager = system.GPU().MemoryManager();
|
||||||
|
const auto host_ptr = memory_manager.GetPointer(gpu_addr);
|
||||||
|
if (!host_ptr) {
|
||||||
|
return {GetEmptyBuffer(size), 0};
|
||||||
|
}
|
||||||
|
const auto cache_addr = ToCacheAddr(host_ptr);
|
||||||
|
|
||||||
|
// Cache management is a big overhead, so only cache entries with a given size.
|
||||||
|
// TODO: Figure out which size is the best for given games.
|
||||||
|
constexpr std::size_t max_stream_size = 0x800;
|
||||||
|
if (size < max_stream_size) {
|
||||||
|
if (!is_written && !IsRegionWritten(cache_addr, cache_addr + size - 1)) {
|
||||||
|
return StreamBufferUpload(host_ptr, size, alignment);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
auto block = GetBlock(cache_addr, size);
|
||||||
|
auto map = MapAddress(block, gpu_addr, cache_addr, size);
|
||||||
|
if (is_written) {
|
||||||
|
map->MarkAsModified(true, GetModifiedTicks());
|
||||||
|
if (!map->IsWritten()) {
|
||||||
|
map->MarkAsWritten(true);
|
||||||
|
MarkRegionAsWritten(map->GetStart(), map->GetEnd() - 1);
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
if (map->IsWritten()) {
|
||||||
|
WriteBarrier();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
const u64 offset = static_cast<u64>(block->GetOffset(cache_addr));
|
||||||
|
|
||||||
|
return {ToHandle(block), offset};
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Uploads from a host memory. Returns the OpenGL buffer where it's located and its offset.
|
||||||
|
BufferInfo UploadHostMemory(const void* raw_pointer, std::size_t size,
|
||||||
|
std::size_t alignment = 4) {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
return StreamBufferUpload(raw_pointer, size, alignment);
|
||||||
|
}
|
||||||
|
|
||||||
|
void Map(std::size_t max_size) {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
|
||||||
|
std::tie(buffer_ptr, buffer_offset_base, invalidated) = stream_buffer->Map(max_size, 4);
|
||||||
|
buffer_offset = buffer_offset_base;
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Finishes the upload stream, returns true on bindings invalidation.
|
||||||
|
bool Unmap() {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
|
||||||
|
stream_buffer->Unmap(buffer_offset - buffer_offset_base);
|
||||||
|
return std::exchange(invalidated, false);
|
||||||
|
}
|
||||||
|
|
||||||
|
void TickFrame() {
|
||||||
|
++epoch;
|
||||||
|
while (!pending_destruction.empty()) {
|
||||||
|
if (pending_destruction.front()->GetEpoch() + 1 > epoch) {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
pending_destruction.pop_front();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Write any cached resources overlapping the specified region back to memory
|
||||||
|
void FlushRegion(CacheAddr addr, std::size_t size) {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
|
||||||
|
std::vector<MapInterval> objects = GetMapsInRange(addr, size);
|
||||||
|
std::sort(objects.begin(), objects.end(), [](const MapInterval& a, const MapInterval& b) {
|
||||||
|
return a->GetModificationTick() < b->GetModificationTick();
|
||||||
|
});
|
||||||
|
for (auto& object : objects) {
|
||||||
|
if (object->IsModified() && object->IsRegistered()) {
|
||||||
|
FlushMap(object);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Mark the specified region as being invalidated
|
||||||
|
void InvalidateRegion(CacheAddr addr, u64 size) {
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
|
||||||
|
std::vector<MapInterval> objects = GetMapsInRange(addr, size);
|
||||||
|
for (auto& object : objects) {
|
||||||
|
if (object->IsRegistered()) {
|
||||||
|
Unregister(object);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
virtual const TBufferType* GetEmptyBuffer(std::size_t size) = 0;
|
||||||
|
|
||||||
|
protected:
|
||||||
|
explicit BufferCache(VideoCore::RasterizerInterface& rasterizer, Core::System& system,
|
||||||
|
std::unique_ptr<StreamBuffer> stream_buffer)
|
||||||
|
: rasterizer{rasterizer}, system{system}, stream_buffer{std::move(stream_buffer)},
|
||||||
|
stream_buffer_handle{this->stream_buffer->GetHandle()} {}
|
||||||
|
|
||||||
|
~BufferCache() = default;
|
||||||
|
|
||||||
|
virtual const TBufferType* ToHandle(const TBuffer& storage) = 0;
|
||||||
|
|
||||||
|
virtual void WriteBarrier() = 0;
|
||||||
|
|
||||||
|
virtual TBuffer CreateBlock(CacheAddr cache_addr, std::size_t size) = 0;
|
||||||
|
|
||||||
|
virtual void UploadBlockData(const TBuffer& buffer, std::size_t offset, std::size_t size,
|
||||||
|
const u8* data) = 0;
|
||||||
|
|
||||||
|
virtual void DownloadBlockData(const TBuffer& buffer, std::size_t offset, std::size_t size,
|
||||||
|
u8* data) = 0;
|
||||||
|
|
||||||
|
virtual void CopyBlock(const TBuffer& src, const TBuffer& dst, std::size_t src_offset,
|
||||||
|
std::size_t dst_offset, std::size_t size) = 0;
|
||||||
|
|
||||||
|
/// Register an object into the cache
|
||||||
|
void Register(const MapInterval& new_map, bool inherit_written = false) {
|
||||||
|
const CacheAddr cache_ptr = new_map->GetStart();
|
||||||
|
const std::optional<VAddr> cpu_addr =
|
||||||
|
system.GPU().MemoryManager().GpuToCpuAddress(new_map->GetGpuAddress());
|
||||||
|
if (!cache_ptr || !cpu_addr) {
|
||||||
|
LOG_CRITICAL(HW_GPU, "Failed to register buffer with unmapped gpu_address 0x{:016x}",
|
||||||
|
new_map->GetGpuAddress());
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
const std::size_t size = new_map->GetEnd() - new_map->GetStart();
|
||||||
|
new_map->SetCpuAddress(*cpu_addr);
|
||||||
|
new_map->MarkAsRegistered(true);
|
||||||
|
const IntervalType interval{new_map->GetStart(), new_map->GetEnd()};
|
||||||
|
mapped_addresses.insert({interval, new_map});
|
||||||
|
rasterizer.UpdatePagesCachedCount(*cpu_addr, size, 1);
|
||||||
|
if (inherit_written) {
|
||||||
|
MarkRegionAsWritten(new_map->GetStart(), new_map->GetEnd() - 1);
|
||||||
|
new_map->MarkAsWritten(true);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Unregisters an object from the cache
|
||||||
|
void Unregister(MapInterval& map) {
|
||||||
|
const std::size_t size = map->GetEnd() - map->GetStart();
|
||||||
|
rasterizer.UpdatePagesCachedCount(map->GetCpuAddress(), size, -1);
|
||||||
|
map->MarkAsRegistered(false);
|
||||||
|
if (map->IsWritten()) {
|
||||||
|
UnmarkRegionAsWritten(map->GetStart(), map->GetEnd() - 1);
|
||||||
|
}
|
||||||
|
const IntervalType delete_interval{map->GetStart(), map->GetEnd()};
|
||||||
|
mapped_addresses.erase(delete_interval);
|
||||||
|
}
|
||||||
|
|
||||||
|
private:
|
||||||
|
MapInterval CreateMap(const CacheAddr start, const CacheAddr end, const GPUVAddr gpu_addr) {
|
||||||
|
return std::make_shared<MapIntervalBase>(start, end, gpu_addr);
|
||||||
|
}
|
||||||
|
|
||||||
|
MapInterval MapAddress(const TBuffer& block, const GPUVAddr gpu_addr,
|
||||||
|
const CacheAddr cache_addr, const std::size_t size) {
|
||||||
|
|
||||||
|
std::vector<MapInterval> overlaps = GetMapsInRange(cache_addr, size);
|
||||||
|
if (overlaps.empty()) {
|
||||||
|
const CacheAddr cache_addr_end = cache_addr + size;
|
||||||
|
MapInterval new_map = CreateMap(cache_addr, cache_addr_end, gpu_addr);
|
||||||
|
u8* host_ptr = FromCacheAddr(cache_addr);
|
||||||
|
UploadBlockData(block, block->GetOffset(cache_addr), size, host_ptr);
|
||||||
|
Register(new_map);
|
||||||
|
return new_map;
|
||||||
|
}
|
||||||
|
|
||||||
|
const CacheAddr cache_addr_end = cache_addr + size;
|
||||||
|
if (overlaps.size() == 1) {
|
||||||
|
MapInterval& current_map = overlaps[0];
|
||||||
|
if (current_map->IsInside(cache_addr, cache_addr_end)) {
|
||||||
|
return current_map;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
CacheAddr new_start = cache_addr;
|
||||||
|
CacheAddr new_end = cache_addr_end;
|
||||||
|
bool write_inheritance = false;
|
||||||
|
bool modified_inheritance = false;
|
||||||
|
// Calculate new buffer parameters
|
||||||
|
for (auto& overlap : overlaps) {
|
||||||
|
new_start = std::min(overlap->GetStart(), new_start);
|
||||||
|
new_end = std::max(overlap->GetEnd(), new_end);
|
||||||
|
write_inheritance |= overlap->IsWritten();
|
||||||
|
modified_inheritance |= overlap->IsModified();
|
||||||
|
}
|
||||||
|
GPUVAddr new_gpu_addr = gpu_addr + new_start - cache_addr;
|
||||||
|
for (auto& overlap : overlaps) {
|
||||||
|
Unregister(overlap);
|
||||||
|
}
|
||||||
|
UpdateBlock(block, new_start, new_end, overlaps);
|
||||||
|
MapInterval new_map = CreateMap(new_start, new_end, new_gpu_addr);
|
||||||
|
if (modified_inheritance) {
|
||||||
|
new_map->MarkAsModified(true, GetModifiedTicks());
|
||||||
|
}
|
||||||
|
Register(new_map, write_inheritance);
|
||||||
|
return new_map;
|
||||||
|
}
|
||||||
|
|
||||||
|
void UpdateBlock(const TBuffer& block, CacheAddr start, CacheAddr end,
|
||||||
|
std::vector<MapInterval>& overlaps) {
|
||||||
|
const IntervalType base_interval{start, end};
|
||||||
|
IntervalSet interval_set{};
|
||||||
|
interval_set.add(base_interval);
|
||||||
|
for (auto& overlap : overlaps) {
|
||||||
|
const IntervalType subtract{overlap->GetStart(), overlap->GetEnd()};
|
||||||
|
interval_set.subtract(subtract);
|
||||||
|
}
|
||||||
|
for (auto& interval : interval_set) {
|
||||||
|
std::size_t size = interval.upper() - interval.lower();
|
||||||
|
if (size > 0) {
|
||||||
|
u8* host_ptr = FromCacheAddr(interval.lower());
|
||||||
|
UploadBlockData(block, block->GetOffset(interval.lower()), size, host_ptr);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
std::vector<MapInterval> GetMapsInRange(CacheAddr addr, std::size_t size) {
|
||||||
|
if (size == 0) {
|
||||||
|
return {};
|
||||||
|
}
|
||||||
|
|
||||||
|
std::vector<MapInterval> objects{};
|
||||||
|
const IntervalType interval{addr, addr + size};
|
||||||
|
for (auto& pair : boost::make_iterator_range(mapped_addresses.equal_range(interval))) {
|
||||||
|
objects.push_back(pair.second);
|
||||||
|
}
|
||||||
|
|
||||||
|
return objects;
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Returns a ticks counter used for tracking when cached objects were last modified
|
||||||
|
u64 GetModifiedTicks() {
|
||||||
|
return ++modified_ticks;
|
||||||
|
}
|
||||||
|
|
||||||
|
void FlushMap(MapInterval map) {
|
||||||
|
std::size_t size = map->GetEnd() - map->GetStart();
|
||||||
|
TBuffer block = blocks[map->GetStart() >> block_page_bits];
|
||||||
|
u8* host_ptr = FromCacheAddr(map->GetStart());
|
||||||
|
DownloadBlockData(block, block->GetOffset(map->GetStart()), size, host_ptr);
|
||||||
|
map->MarkAsModified(false, 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
BufferInfo StreamBufferUpload(const void* raw_pointer, std::size_t size,
|
||||||
|
std::size_t alignment) {
|
||||||
|
AlignBuffer(alignment);
|
||||||
|
const std::size_t uploaded_offset = buffer_offset;
|
||||||
|
std::memcpy(buffer_ptr, raw_pointer, size);
|
||||||
|
|
||||||
|
buffer_ptr += size;
|
||||||
|
buffer_offset += size;
|
||||||
|
return {&stream_buffer_handle, uploaded_offset};
|
||||||
|
}
|
||||||
|
|
||||||
|
void AlignBuffer(std::size_t alignment) {
|
||||||
|
// Align the offset, not the mapped pointer
|
||||||
|
const std::size_t offset_aligned = Common::AlignUp(buffer_offset, alignment);
|
||||||
|
buffer_ptr += offset_aligned - buffer_offset;
|
||||||
|
buffer_offset = offset_aligned;
|
||||||
|
}
|
||||||
|
|
||||||
|
TBuffer EnlargeBlock(TBuffer buffer) {
|
||||||
|
const std::size_t old_size = buffer->GetSize();
|
||||||
|
const std::size_t new_size = old_size + block_page_size;
|
||||||
|
const CacheAddr cache_addr = buffer->GetCacheAddr();
|
||||||
|
TBuffer new_buffer = CreateBlock(cache_addr, new_size);
|
||||||
|
CopyBlock(buffer, new_buffer, 0, 0, old_size);
|
||||||
|
buffer->SetEpoch(epoch);
|
||||||
|
pending_destruction.push_back(buffer);
|
||||||
|
const CacheAddr cache_addr_end = cache_addr + new_size - 1;
|
||||||
|
u64 page_start = cache_addr >> block_page_bits;
|
||||||
|
const u64 page_end = cache_addr_end >> block_page_bits;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
blocks[page_start] = new_buffer;
|
||||||
|
++page_start;
|
||||||
|
}
|
||||||
|
return new_buffer;
|
||||||
|
}
|
||||||
|
|
||||||
|
TBuffer MergeBlocks(TBuffer first, TBuffer second) {
|
||||||
|
const std::size_t size_1 = first->GetSize();
|
||||||
|
const std::size_t size_2 = second->GetSize();
|
||||||
|
const CacheAddr first_addr = first->GetCacheAddr();
|
||||||
|
const CacheAddr second_addr = second->GetCacheAddr();
|
||||||
|
const CacheAddr new_addr = std::min(first_addr, second_addr);
|
||||||
|
const std::size_t new_size = size_1 + size_2;
|
||||||
|
TBuffer new_buffer = CreateBlock(new_addr, new_size);
|
||||||
|
CopyBlock(first, new_buffer, 0, new_buffer->GetOffset(first_addr), size_1);
|
||||||
|
CopyBlock(second, new_buffer, 0, new_buffer->GetOffset(second_addr), size_2);
|
||||||
|
first->SetEpoch(epoch);
|
||||||
|
second->SetEpoch(epoch);
|
||||||
|
pending_destruction.push_back(first);
|
||||||
|
pending_destruction.push_back(second);
|
||||||
|
const CacheAddr cache_addr_end = new_addr + new_size - 1;
|
||||||
|
u64 page_start = new_addr >> block_page_bits;
|
||||||
|
const u64 page_end = cache_addr_end >> block_page_bits;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
blocks[page_start] = new_buffer;
|
||||||
|
++page_start;
|
||||||
|
}
|
||||||
|
return new_buffer;
|
||||||
|
}
|
||||||
|
|
||||||
|
TBuffer GetBlock(const CacheAddr cache_addr, const std::size_t size) {
|
||||||
|
TBuffer found{};
|
||||||
|
const CacheAddr cache_addr_end = cache_addr + size - 1;
|
||||||
|
u64 page_start = cache_addr >> block_page_bits;
|
||||||
|
const u64 page_end = cache_addr_end >> block_page_bits;
|
||||||
|
const u64 num_pages = page_end - page_start + 1;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
auto it = blocks.find(page_start);
|
||||||
|
if (it == blocks.end()) {
|
||||||
|
if (found) {
|
||||||
|
found = EnlargeBlock(found);
|
||||||
|
} else {
|
||||||
|
const CacheAddr start_addr = (page_start << block_page_bits);
|
||||||
|
found = CreateBlock(start_addr, block_page_size);
|
||||||
|
blocks[page_start] = found;
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
if (found) {
|
||||||
|
if (found == it->second) {
|
||||||
|
++page_start;
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
found = MergeBlocks(found, it->second);
|
||||||
|
} else {
|
||||||
|
found = it->second;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
++page_start;
|
||||||
|
}
|
||||||
|
return found;
|
||||||
|
}
|
||||||
|
|
||||||
|
void MarkRegionAsWritten(const CacheAddr start, const CacheAddr end) {
|
||||||
|
u64 page_start = start >> write_page_bit;
|
||||||
|
const u64 page_end = end >> write_page_bit;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
auto it = written_pages.find(page_start);
|
||||||
|
if (it != written_pages.end()) {
|
||||||
|
it->second = it->second + 1;
|
||||||
|
} else {
|
||||||
|
written_pages[page_start] = 1;
|
||||||
|
}
|
||||||
|
page_start++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void UnmarkRegionAsWritten(const CacheAddr start, const CacheAddr end) {
|
||||||
|
u64 page_start = start >> write_page_bit;
|
||||||
|
const u64 page_end = end >> write_page_bit;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
auto it = written_pages.find(page_start);
|
||||||
|
if (it != written_pages.end()) {
|
||||||
|
if (it->second > 1) {
|
||||||
|
it->second = it->second - 1;
|
||||||
|
} else {
|
||||||
|
written_pages.erase(it);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
page_start++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsRegionWritten(const CacheAddr start, const CacheAddr end) const {
|
||||||
|
u64 page_start = start >> write_page_bit;
|
||||||
|
const u64 page_end = end >> write_page_bit;
|
||||||
|
while (page_start <= page_end) {
|
||||||
|
if (written_pages.count(page_start) > 0) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
page_start++;
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
std::unique_ptr<StreamBuffer> stream_buffer;
|
||||||
|
TBufferType stream_buffer_handle{};
|
||||||
|
|
||||||
|
bool invalidated = false;
|
||||||
|
|
||||||
|
u8* buffer_ptr = nullptr;
|
||||||
|
u64 buffer_offset = 0;
|
||||||
|
u64 buffer_offset_base = 0;
|
||||||
|
|
||||||
|
using IntervalSet = boost::icl::interval_set<CacheAddr>;
|
||||||
|
using IntervalCache = boost::icl::interval_map<CacheAddr, MapInterval>;
|
||||||
|
using IntervalType = typename IntervalCache::interval_type;
|
||||||
|
IntervalCache mapped_addresses{};
|
||||||
|
|
||||||
|
static constexpr u64 write_page_bit{11};
|
||||||
|
std::unordered_map<u64, u32> written_pages{};
|
||||||
|
|
||||||
|
static constexpr u64 block_page_bits{21};
|
||||||
|
static constexpr u64 block_page_size{1 << block_page_bits};
|
||||||
|
std::unordered_map<u64, TBuffer> blocks{};
|
||||||
|
|
||||||
|
std::list<TBuffer> pending_destruction{};
|
||||||
|
u64 epoch{};
|
||||||
|
u64 modified_ticks{};
|
||||||
|
VideoCore::RasterizerInterface& rasterizer;
|
||||||
|
Core::System& system;
|
||||||
|
std::recursive_mutex mutex;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace VideoCommon
|
89
src/video_core/buffer_cache/map_interval.h
Normal file
89
src/video_core/buffer_cache/map_interval.h
Normal file
|
@ -0,0 +1,89 @@
|
||||||
|
// Copyright 2019 yuzu Emulator Project
|
||||||
|
// Licensed under GPLv2 or any later version
|
||||||
|
// Refer to the license.txt file included.
|
||||||
|
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include "common/common_types.h"
|
||||||
|
#include "video_core/gpu.h"
|
||||||
|
|
||||||
|
namespace VideoCommon {
|
||||||
|
|
||||||
|
class MapIntervalBase {
|
||||||
|
public:
|
||||||
|
MapIntervalBase(const CacheAddr start, const CacheAddr end, const GPUVAddr gpu_addr)
|
||||||
|
: start{start}, end{end}, gpu_addr{gpu_addr} {}
|
||||||
|
|
||||||
|
void SetCpuAddress(VAddr new_cpu_addr) {
|
||||||
|
cpu_addr = new_cpu_addr;
|
||||||
|
}
|
||||||
|
|
||||||
|
VAddr GetCpuAddress() const {
|
||||||
|
return cpu_addr;
|
||||||
|
}
|
||||||
|
|
||||||
|
GPUVAddr GetGpuAddress() const {
|
||||||
|
return gpu_addr;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsInside(const CacheAddr other_start, const CacheAddr other_end) const {
|
||||||
|
return (start <= other_start && other_end <= end);
|
||||||
|
}
|
||||||
|
|
||||||
|
bool operator==(const MapIntervalBase& rhs) const {
|
||||||
|
return std::tie(start, end) == std::tie(rhs.start, rhs.end);
|
||||||
|
}
|
||||||
|
|
||||||
|
bool operator!=(const MapIntervalBase& rhs) const {
|
||||||
|
return !operator==(rhs);
|
||||||
|
}
|
||||||
|
|
||||||
|
void MarkAsRegistered(const bool registered) {
|
||||||
|
is_registered = registered;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsRegistered() const {
|
||||||
|
return is_registered;
|
||||||
|
}
|
||||||
|
|
||||||
|
CacheAddr GetStart() const {
|
||||||
|
return start;
|
||||||
|
}
|
||||||
|
|
||||||
|
CacheAddr GetEnd() const {
|
||||||
|
return end;
|
||||||
|
}
|
||||||
|
|
||||||
|
void MarkAsModified(const bool is_modified_, const u64 tick) {
|
||||||
|
is_modified = is_modified_;
|
||||||
|
ticks = tick;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsModified() const {
|
||||||
|
return is_modified;
|
||||||
|
}
|
||||||
|
|
||||||
|
u64 GetModificationTick() const {
|
||||||
|
return ticks;
|
||||||
|
}
|
||||||
|
|
||||||
|
void MarkAsWritten(const bool is_written_) {
|
||||||
|
is_written = is_written_;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool IsWritten() const {
|
||||||
|
return is_written;
|
||||||
|
}
|
||||||
|
|
||||||
|
private:
|
||||||
|
CacheAddr start;
|
||||||
|
CacheAddr end;
|
||||||
|
GPUVAddr gpu_addr;
|
||||||
|
VAddr cpu_addr{};
|
||||||
|
bool is_written{};
|
||||||
|
bool is_modified{};
|
||||||
|
bool is_registered{};
|
||||||
|
u64 ticks{};
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace VideoCommon
|
|
@ -19,6 +19,10 @@ inline CacheAddr ToCacheAddr(const void* host_ptr) {
|
||||||
return reinterpret_cast<CacheAddr>(host_ptr);
|
return reinterpret_cast<CacheAddr>(host_ptr);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
inline u8* FromCacheAddr(CacheAddr cache_addr) {
|
||||||
|
return reinterpret_cast<u8*>(cache_addr);
|
||||||
|
}
|
||||||
|
|
||||||
namespace Core {
|
namespace Core {
|
||||||
class System;
|
class System;
|
||||||
}
|
}
|
||||||
|
|
|
@ -7,28 +7,40 @@
|
||||||
#include <glad/glad.h>
|
#include <glad/glad.h>
|
||||||
|
|
||||||
#include "common/assert.h"
|
#include "common/assert.h"
|
||||||
|
#include "common/microprofile.h"
|
||||||
#include "video_core/renderer_opengl/gl_buffer_cache.h"
|
#include "video_core/renderer_opengl/gl_buffer_cache.h"
|
||||||
#include "video_core/renderer_opengl/gl_rasterizer.h"
|
#include "video_core/renderer_opengl/gl_rasterizer.h"
|
||||||
#include "video_core/renderer_opengl/gl_resource_manager.h"
|
#include "video_core/renderer_opengl/gl_resource_manager.h"
|
||||||
|
|
||||||
namespace OpenGL {
|
namespace OpenGL {
|
||||||
|
|
||||||
|
MICROPROFILE_DEFINE(OpenGL_Buffer_Download, "OpenGL", "Buffer Download", MP_RGB(192, 192, 128));
|
||||||
|
|
||||||
|
CachedBufferBlock::CachedBufferBlock(CacheAddr cache_addr, const std::size_t size)
|
||||||
|
: VideoCommon::BufferBlock{cache_addr, size} {
|
||||||
|
gl_buffer.Create();
|
||||||
|
glNamedBufferData(gl_buffer.handle, static_cast<GLsizeiptr>(size), nullptr, GL_DYNAMIC_DRAW);
|
||||||
|
}
|
||||||
|
|
||||||
|
CachedBufferBlock::~CachedBufferBlock() = default;
|
||||||
|
|
||||||
OGLBufferCache::OGLBufferCache(RasterizerOpenGL& rasterizer, Core::System& system,
|
OGLBufferCache::OGLBufferCache(RasterizerOpenGL& rasterizer, Core::System& system,
|
||||||
std::size_t stream_size)
|
std::size_t stream_size)
|
||||||
: VideoCommon::BufferCache<OGLBuffer, GLuint, OGLStreamBuffer>{
|
: VideoCommon::BufferCache<Buffer, GLuint, OGLStreamBuffer>{
|
||||||
rasterizer, system, std::make_unique<OGLStreamBuffer>(stream_size, true)} {}
|
rasterizer, system, std::make_unique<OGLStreamBuffer>(stream_size, true)} {}
|
||||||
|
|
||||||
OGLBufferCache::~OGLBufferCache() = default;
|
OGLBufferCache::~OGLBufferCache() = default;
|
||||||
|
|
||||||
OGLBuffer OGLBufferCache::CreateBuffer(std::size_t size) {
|
Buffer OGLBufferCache::CreateBlock(CacheAddr cache_addr, std::size_t size) {
|
||||||
OGLBuffer buffer;
|
return std::make_shared<CachedBufferBlock>(cache_addr, size);
|
||||||
buffer.Create();
|
|
||||||
glNamedBufferData(buffer.handle, static_cast<GLsizeiptr>(size), nullptr, GL_DYNAMIC_DRAW);
|
|
||||||
return buffer;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
const GLuint* OGLBufferCache::ToHandle(const OGLBuffer& buffer) {
|
void OGLBufferCache::WriteBarrier() {
|
||||||
return &buffer.handle;
|
glMemoryBarrier(GL_ALL_BARRIER_BITS);
|
||||||
|
}
|
||||||
|
|
||||||
|
const GLuint* OGLBufferCache::ToHandle(const Buffer& buffer) {
|
||||||
|
return buffer->GetHandle();
|
||||||
}
|
}
|
||||||
|
|
||||||
const GLuint* OGLBufferCache::GetEmptyBuffer(std::size_t) {
|
const GLuint* OGLBufferCache::GetEmptyBuffer(std::size_t) {
|
||||||
|
@ -36,23 +48,24 @@ const GLuint* OGLBufferCache::GetEmptyBuffer(std::size_t) {
|
||||||
return &null_buffer;
|
return &null_buffer;
|
||||||
}
|
}
|
||||||
|
|
||||||
void OGLBufferCache::UploadBufferData(const OGLBuffer& buffer, std::size_t offset, std::size_t size,
|
void OGLBufferCache::UploadBlockData(const Buffer& buffer, std::size_t offset, std::size_t size,
|
||||||
const u8* data) {
|
const u8* data) {
|
||||||
glNamedBufferSubData(buffer.handle, static_cast<GLintptr>(offset),
|
glNamedBufferSubData(*buffer->GetHandle(), static_cast<GLintptr>(offset),
|
||||||
static_cast<GLsizeiptr>(size), data);
|
static_cast<GLsizeiptr>(size), data);
|
||||||
}
|
}
|
||||||
|
|
||||||
void OGLBufferCache::DownloadBufferData(const OGLBuffer& buffer, std::size_t offset,
|
void OGLBufferCache::DownloadBlockData(const Buffer& buffer, std::size_t offset, std::size_t size,
|
||||||
std::size_t size, u8* data) {
|
u8* data) {
|
||||||
glGetNamedBufferSubData(buffer.handle, static_cast<GLintptr>(offset),
|
MICROPROFILE_SCOPE(OpenGL_Buffer_Download);
|
||||||
|
glGetNamedBufferSubData(*buffer->GetHandle(), static_cast<GLintptr>(offset),
|
||||||
static_cast<GLsizeiptr>(size), data);
|
static_cast<GLsizeiptr>(size), data);
|
||||||
}
|
}
|
||||||
|
|
||||||
void OGLBufferCache::CopyBufferData(const OGLBuffer& src, const OGLBuffer& dst,
|
void OGLBufferCache::CopyBlock(const Buffer& src, const Buffer& dst, std::size_t src_offset,
|
||||||
std::size_t src_offset, std::size_t dst_offset,
|
std::size_t dst_offset, std::size_t size) {
|
||||||
std::size_t size) {
|
glCopyNamedBufferSubData(*src->GetHandle(), *dst->GetHandle(),
|
||||||
glCopyNamedBufferSubData(src.handle, dst.handle, static_cast<GLintptr>(src_offset),
|
static_cast<GLintptr>(src_offset), static_cast<GLintptr>(dst_offset),
|
||||||
static_cast<GLintptr>(dst_offset), static_cast<GLsizeiptr>(size));
|
static_cast<GLsizeiptr>(size));
|
||||||
}
|
}
|
||||||
|
|
||||||
} // namespace OpenGL
|
} // namespace OpenGL
|
||||||
|
|
|
@ -7,7 +7,7 @@
|
||||||
#include <memory>
|
#include <memory>
|
||||||
|
|
||||||
#include "common/common_types.h"
|
#include "common/common_types.h"
|
||||||
#include "video_core/buffer_cache.h"
|
#include "video_core/buffer_cache/buffer_cache.h"
|
||||||
#include "video_core/rasterizer_cache.h"
|
#include "video_core/rasterizer_cache.h"
|
||||||
#include "video_core/renderer_opengl/gl_resource_manager.h"
|
#include "video_core/renderer_opengl/gl_resource_manager.h"
|
||||||
#include "video_core/renderer_opengl/gl_stream_buffer.h"
|
#include "video_core/renderer_opengl/gl_stream_buffer.h"
|
||||||
|
@ -21,7 +21,24 @@ namespace OpenGL {
|
||||||
class OGLStreamBuffer;
|
class OGLStreamBuffer;
|
||||||
class RasterizerOpenGL;
|
class RasterizerOpenGL;
|
||||||
|
|
||||||
class OGLBufferCache final : public VideoCommon::BufferCache<OGLBuffer, GLuint, OGLStreamBuffer> {
|
class CachedBufferBlock;
|
||||||
|
|
||||||
|
using Buffer = std::shared_ptr<CachedBufferBlock>;
|
||||||
|
|
||||||
|
class CachedBufferBlock : public VideoCommon::BufferBlock {
|
||||||
|
public:
|
||||||
|
explicit CachedBufferBlock(CacheAddr cache_addr, const std::size_t size);
|
||||||
|
~CachedBufferBlock();
|
||||||
|
|
||||||
|
const GLuint* GetHandle() const {
|
||||||
|
return &gl_buffer.handle;
|
||||||
|
}
|
||||||
|
|
||||||
|
private:
|
||||||
|
OGLBuffer gl_buffer{};
|
||||||
|
};
|
||||||
|
|
||||||
|
class OGLBufferCache final : public VideoCommon::BufferCache<Buffer, GLuint, OGLStreamBuffer> {
|
||||||
public:
|
public:
|
||||||
explicit OGLBufferCache(RasterizerOpenGL& rasterizer, Core::System& system,
|
explicit OGLBufferCache(RasterizerOpenGL& rasterizer, Core::System& system,
|
||||||
std::size_t stream_size);
|
std::size_t stream_size);
|
||||||
|
@ -30,17 +47,19 @@ public:
|
||||||
const GLuint* GetEmptyBuffer(std::size_t) override;
|
const GLuint* GetEmptyBuffer(std::size_t) override;
|
||||||
|
|
||||||
protected:
|
protected:
|
||||||
OGLBuffer CreateBuffer(std::size_t size) override;
|
Buffer CreateBlock(CacheAddr cache_addr, std::size_t size) override;
|
||||||
|
|
||||||
const GLuint* ToHandle(const OGLBuffer& buffer) override;
|
void WriteBarrier() override;
|
||||||
|
|
||||||
void UploadBufferData(const OGLBuffer& buffer, std::size_t offset, std::size_t size,
|
const GLuint* ToHandle(const Buffer& buffer) override;
|
||||||
|
|
||||||
|
void UploadBlockData(const Buffer& buffer, std::size_t offset, std::size_t size,
|
||||||
const u8* data) override;
|
const u8* data) override;
|
||||||
|
|
||||||
void DownloadBufferData(const OGLBuffer& buffer, std::size_t offset, std::size_t size,
|
void DownloadBlockData(const Buffer& buffer, std::size_t offset, std::size_t size,
|
||||||
u8* data) override;
|
u8* data) override;
|
||||||
|
|
||||||
void CopyBufferData(const OGLBuffer& src, const OGLBuffer& dst, std::size_t src_offset,
|
void CopyBlock(const Buffer& src, const Buffer& dst, std::size_t src_offset,
|
||||||
std::size_t dst_offset, std::size_t size) override;
|
std::size_t dst_offset, std::size_t size) override;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
|
@ -980,7 +980,7 @@ void RasterizerOpenGL::SetupGlobalMemory(const GLShader::GlobalMemoryEntry& entr
|
||||||
GPUVAddr gpu_addr, std::size_t size) {
|
GPUVAddr gpu_addr, std::size_t size) {
|
||||||
const auto alignment{device.GetShaderStorageBufferAlignment()};
|
const auto alignment{device.GetShaderStorageBufferAlignment()};
|
||||||
const auto [ssbo, buffer_offset] =
|
const auto [ssbo, buffer_offset] =
|
||||||
buffer_cache.UploadMemory(gpu_addr, size, alignment, true, entry.IsWritten());
|
buffer_cache.UploadMemory(gpu_addr, size, alignment, entry.IsWritten());
|
||||||
bind_ssbo_pushbuffer.Push(ssbo, buffer_offset, static_cast<GLsizeiptr>(size));
|
bind_ssbo_pushbuffer.Push(ssbo, buffer_offset, static_cast<GLsizeiptr>(size));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue