Skip to content

Commit 1d6f31a

Browse files
committed
buffer_cache: Handle obtaining buffer views partially within buffers.
1 parent 8e7ec9e commit 1d6f31a

File tree

3 files changed

+16
-5
lines changed

3 files changed

+16
-5
lines changed

src/video_core/buffer_cache/buffer_cache.cpp

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -360,7 +360,8 @@ std::pair<Buffer*, u32> BufferCache::ObtainBuffer(VAddr device_addr, u32 size, b
360360
return {&buffer, buffer.Offset(device_addr)};
361361
}
362362

363-
std::pair<Buffer*, u32> BufferCache::ObtainViewBuffer(VAddr gpu_addr, u32 size) {
363+
std::pair<Buffer*, u32> BufferCache::ObtainViewBuffer(VAddr gpu_addr, u32 size, bool prefer_gpu) {
364+
// Check if any buffer contains the full requested range.
364365
const u64 page = gpu_addr >> CACHING_PAGEBITS;
365366
const BufferId buffer_id = page_table[page];
366367
if (buffer_id) {
@@ -370,6 +371,13 @@ std::pair<Buffer*, u32> BufferCache::ObtainViewBuffer(VAddr gpu_addr, u32 size)
370371
return {&buffer, buffer.Offset(gpu_addr)};
371372
}
372373
}
374+
// If no buffer contains the full requested range but some buffer within was GPU-modified,
375+
// fall back to ObtainBuffer to create a full buffer and avoid losing GPU modifications.
376+
// This is only done if the request prefers to use GPU memory, otherwise we can skip it.
377+
if (prefer_gpu && memory_tracker.IsRegionGpuModified(gpu_addr, size)) {
378+
return ObtainBuffer(gpu_addr, size, false, false);
379+
}
380+
// In all other cases, just do a CPU copy to the staging buffer.
373381
const u32 offset = staging_buffer.Copy(gpu_addr, size, 16);
374382
return {&staging_buffer, offset};
375383
}

src/video_core/buffer_cache/buffer_cache.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -96,7 +96,8 @@ class BufferCache {
9696
BufferId buffer_id = {});
9797

9898
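/// Attempts to obtain a buffer without modifying the cache contents; if prefer_gpu is set and the range was GPU-modified, falls back to ObtainBuffer to create a full buffer.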
99-
[[nodiscard]] std::pair<Buffer*, u32> ObtainViewBuffer(VAddr gpu_addr, u32 size);
99+
[[nodiscard]] std::pair<Buffer*, u32> ObtainViewBuffer(VAddr gpu_addr, u32 size,
100+
bool prefer_gpu);
100101

101102
/// Returns true when a region is registered in the cache
102103
[[nodiscard]] bool IsRegionRegistered(VAddr addr, size_t size);

src/video_core/texture_cache/texture_cache.cpp

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -466,6 +466,9 @@ void TextureCache::RefreshImage(Image& image, Vulkan::Scheduler* custom_schedule
466466
const auto& num_mips = image.info.resources.levels;
467467
ASSERT(num_mips == image.info.mips_layout.size());
468468

469+
const bool is_gpu_modified = True(image.flags & ImageFlagBits::GpuModified);
470+
const bool is_gpu_dirty = True(image.flags & ImageFlagBits::GpuDirty);
471+
469472
boost::container::small_vector<vk::BufferImageCopy, 14> image_copy{};
470473
for (u32 m = 0; m < num_mips; m++) {
471474
const u32 width = std::max(image.info.size.width >> m, 1u);
@@ -475,8 +478,6 @@ void TextureCache::RefreshImage(Image& image, Vulkan::Scheduler* custom_schedule
475478
const auto& mip = image.info.mips_layout[m];
476479

477480
// Protect GPU modified resources from accidental CPU reuploads.
478-
const bool is_gpu_modified = True(image.flags & ImageFlagBits::GpuModified);
479-
const bool is_gpu_dirty = True(image.flags & ImageFlagBits::GpuDirty);
480481
if (is_gpu_modified && !is_gpu_dirty) {
481482
const u8* addr = std::bit_cast<u8*>(image.info.guest_address);
482483
const u64 hash = XXH3_64bits(addr + mip.offset, mip.size);
@@ -515,7 +516,8 @@ void TextureCache::RefreshImage(Image& image, Vulkan::Scheduler* custom_schedule
515516

516517
const VAddr image_addr = image.info.guest_address;
517518
const size_t image_size = image.info.guest_size_bytes;
518-
const auto [vk_buffer, buf_offset] = buffer_cache.ObtainViewBuffer(image_addr, image_size);
519+
const auto [vk_buffer, buf_offset] =
520+
buffer_cache.ObtainViewBuffer(image_addr, image_size, is_gpu_dirty);
519521
// The obtained buffer may be written by a shader so we need to emit a barrier to prevent RAW
520522
// hazard
521523
if (auto barrier = vk_buffer->GetBarrier(vk::AccessFlagBits2::eTransferRead,

0 commit comments

Comments
 (0)