mirror of
https://git.eden-emu.dev/eden-emu/eden
synced 2026-04-09 22:58:54 +02:00
Small experiment
This commit is contained in:
parent
8200a7564c
commit
53060c9a91
2 changed files with 60 additions and 4 deletions
|
|
@ -113,6 +113,54 @@ TextureCache<P>::TextureCache(Runtime& runtime_, Tegra::MaxwellDeviceMemoryManag
|
|||
}
|
||||
}
|
||||
|
||||
template <class P>
|
||||
void TextureCache<P>::RunAllocationGarbageCollector(size_t requested_bytes) {
|
||||
if (requested_bytes == 0) {
|
||||
return;
|
||||
}
|
||||
|
||||
if (allocation_gc_frame != frame_tick) {
|
||||
allocation_gc_frame = frame_tick;
|
||||
allocation_gc_passes = 0;
|
||||
}
|
||||
if (allocation_gc_passes >= MAX_ALLOCATION_GC_PASSES_PER_FRAME) {
|
||||
return;
|
||||
}
|
||||
|
||||
if (runtime.CanReportMemoryUsage()) {
|
||||
total_used_memory = runtime.GetDeviceMemoryUsage();
|
||||
}
|
||||
|
||||
const u64 request = static_cast<u64>(requested_bytes);
|
||||
const u64 max_u64 = (std::numeric_limits<u64>::max)();
|
||||
const u64 projected_usage = request > (max_u64 - total_used_memory)
|
||||
? max_u64
|
||||
: total_used_memory + request;
|
||||
if (projected_usage < expected_memory) {
|
||||
return;
|
||||
}
|
||||
|
||||
RunGarbageCollector();
|
||||
++allocation_gc_passes;
|
||||
|
||||
if (runtime.CanReportMemoryUsage()) {
|
||||
total_used_memory = runtime.GetDeviceMemoryUsage();
|
||||
}
|
||||
|
||||
const u64 projected_after_gc = request > (max_u64 - total_used_memory)
|
||||
? max_u64
|
||||
: total_used_memory + request;
|
||||
if (projected_after_gc >= critical_memory &&
|
||||
allocation_gc_passes < MAX_ALLOCATION_GC_PASSES_PER_FRAME) {
|
||||
RunGarbageCollector();
|
||||
++allocation_gc_passes;
|
||||
|
||||
if (runtime.CanReportMemoryUsage()) {
|
||||
total_used_memory = runtime.GetDeviceMemoryUsage();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
template <class P>
|
||||
void TextureCache<P>::RunGarbageCollector() {
|
||||
bool high_priority_mode = total_used_memory >= expected_memory;
|
||||
|
|
@ -1606,18 +1654,20 @@ bool TextureCache<P>::ScaleDown(Image& image) {
|
|||
template <class P>
|
||||
ImageId TextureCache<P>::InsertImage(const ImageInfo& info, GPUVAddr gpu_addr,
|
||||
RelaxedOptions options) {
|
||||
const size_t requested_size = CalculateGuestSizeInBytes(info);
|
||||
std::optional<DAddr> cpu_addr = gpu_memory->GpuToCpuAddress(gpu_addr);
|
||||
if (!cpu_addr) {
|
||||
const auto size = CalculateGuestSizeInBytes(info);
|
||||
cpu_addr = gpu_memory->GpuToCpuAddress(gpu_addr, size);
|
||||
cpu_addr = gpu_memory->GpuToCpuAddress(gpu_addr, requested_size);
|
||||
if (!cpu_addr) {
|
||||
const DAddr fake_addr = ~(1ULL << 40ULL) + virtual_invalid_space;
|
||||
virtual_invalid_space += Common::AlignUp(size, 32);
|
||||
virtual_invalid_space += Common::AlignUp(requested_size, 32);
|
||||
cpu_addr = std::optional<DAddr>(fake_addr);
|
||||
}
|
||||
}
|
||||
ASSERT_MSG(cpu_addr, "Tried to insert an image to an invalid gpu_addr=0x{:x}", gpu_addr);
|
||||
|
||||
RunAllocationGarbageCollector(requested_size);
|
||||
|
||||
const ImageId image_id = JoinImages(info, gpu_addr, *cpu_addr);
|
||||
const Image& image = slot_images[image_id];
|
||||
// Using "image.gpu_addr" instead of "gpu_addr" is important because it might be different
|
||||
|
|
@ -1634,6 +1684,8 @@ ImageId TextureCache<P>::JoinImages(const ImageInfo& info, GPUVAddr gpu_addr, DA
|
|||
ImageInfo new_info = info;
|
||||
const size_t size_bytes = CalculateGuestSizeInBytes(new_info);
|
||||
|
||||
RunAllocationGarbageCollector(size_bytes);
|
||||
|
||||
const bool broken_views = runtime.HasBrokenTextureViewFormats();
|
||||
const bool native_bgr = runtime.HasNativeBgr();
|
||||
join_overlap_ids.clear();
|
||||
|
|
|
|||
|
|
@ -120,7 +120,7 @@ class TextureCache : public VideoCommon::ChannelSetupCaches<TextureCacheChannelI
|
|||
|
||||
static constexpr s64 DEFAULT_EXPECTED_MEMORY = 1_GiB + 125_MiB;
|
||||
static constexpr s64 DEFAULT_CRITICAL_MEMORY = 1_GiB + 625_MiB;
|
||||
static constexpr size_t GC_EMERGENCY_COUNTS = 2;
|
||||
/// Maximum number of garbage collector passes RunAllocationGarbageCollector may trigger
/// for a single value of frame_tick.
static constexpr u32 MAX_ALLOCATION_GC_PASSES_PER_FRAME = 2;
|
||||
|
||||
using Runtime = typename P::Runtime;
|
||||
using Image = typename P::Image;
|
||||
|
|
@ -310,6 +310,8 @@ private:
|
|||
/// Runs the Garbage Collector.
|
||||
void RunGarbageCollector();
|
||||
|
||||
/// Runs the Garbage Collector ahead of an allocation of requested_bytes when the projected
/// memory usage (current usage plus the request) reaches expected_memory, limited to
/// MAX_ALLOCATION_GC_PASSES_PER_FRAME passes per frame. Does nothing for a zero-byte request.
void RunAllocationGarbageCollector(size_t requested_bytes);
|
||||
|
||||
/// Fills image_view_ids in the image views in indices
|
||||
template <bool has_blacklists>
|
||||
void FillImageViews(DescriptorTable<TICEntry>& table,
|
||||
|
|
@ -527,6 +529,8 @@ private:
|
|||
|
||||
u64 modification_tick = 0;
|
||||
u64 frame_tick = 0;
|
||||
/// Value of frame_tick for which allocation_gc_passes is being counted.
/// NOTE(review): initialized to the u64 maximum, presumably so the first call to
/// RunAllocationGarbageCollector always resets the pass counter - confirm.
u64 allocation_gc_frame = (std::numeric_limits<u64>::max)();
|
||||
/// Number of garbage collector passes RunAllocationGarbageCollector has triggered while
/// frame_tick equals allocation_gc_frame; reset to zero when frame_tick changes.
u32 allocation_gc_passes = 0;
|
||||
u64 last_sampler_gc_frame = (std::numeric_limits<u64>::max)();
|
||||
|
||||
Common::ThreadWorker texture_decode_worker{1, "TextureDecoder"};
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue