mirror of
				https://git.suyu.dev/suyu/suyu.git
				synced 2025-10-22 10:26:52 +08:00 
			
		
		
		
	Buffer Cache: Tune to the levels of the new GC.
This commit is contained in:
		
							parent
							
								
									ecb3342145
								
							
						
					
					
						commit
						5e982a7812
					
				| @ -76,8 +76,9 @@ class BufferCache { | |||||||
| 
 | 
 | ||||||
|     static constexpr BufferId NULL_BUFFER_ID{0}; |     static constexpr BufferId NULL_BUFFER_ID{0}; | ||||||
| 
 | 
 | ||||||
|     static constexpr u64 EXPECTED_MEMORY = 512_MiB; |     static constexpr s64 DEFAULT_EXPECTED_MEMORY = 512_MiB; | ||||||
|     static constexpr u64 CRITICAL_MEMORY = 1_GiB; |     static constexpr s64 DEFAULT_CRITICAL_MEMORY = 1_GiB; | ||||||
|  |     static constexpr s64 TARGET_THRESHOLD = 4_GiB; | ||||||
| 
 | 
 | ||||||
|     using Maxwell = Tegra::Engines::Maxwell3D::Regs; |     using Maxwell = Tegra::Engines::Maxwell3D::Regs; | ||||||
| 
 | 
 | ||||||
| @ -436,6 +437,8 @@ private: | |||||||
|     Common::LeastRecentlyUsedCache<LRUItemParams> lru_cache; |     Common::LeastRecentlyUsedCache<LRUItemParams> lru_cache; | ||||||
|     u64 frame_tick = 0; |     u64 frame_tick = 0; | ||||||
|     u64 total_used_memory = 0; |     u64 total_used_memory = 0; | ||||||
|  |     u64 minimum_memory = 0; | ||||||
|  |     u64 critical_memory = 0; | ||||||
| 
 | 
 | ||||||
|     std::array<BufferId, ((1ULL << 39) >> PAGE_BITS)> page_table; |     std::array<BufferId, ((1ULL << 39) >> PAGE_BITS)> page_table; | ||||||
| }; | }; | ||||||
| @ -451,11 +454,30 @@ BufferCache<P>::BufferCache(VideoCore::RasterizerInterface& rasterizer_, | |||||||
|     // Ensure the first slot is used for the null buffer
 |     // Ensure the first slot is used for the null buffer
 | ||||||
|     void(slot_buffers.insert(runtime, NullBufferParams{})); |     void(slot_buffers.insert(runtime, NullBufferParams{})); | ||||||
|     common_ranges.clear(); |     common_ranges.clear(); | ||||||
|  | 
 | ||||||
|  |     if (!runtime.CanReportMemoryUsage()) { | ||||||
|  |         minimum_memory = DEFAULT_EXPECTED_MEMORY; | ||||||
|  |         critical_memory = DEFAULT_CRITICAL_MEMORY; | ||||||
|  |         return; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|  |     const s64 device_memory = static_cast<s64>(runtime.GetDeviceLocalMemory()); | ||||||
|  |     const s64 min_spacing_expected = device_memory - 1_GiB - 512_MiB; | ||||||
|  |     const s64 min_spacing_critical = device_memory - 1_GiB; | ||||||
|  |     const s64 mem_tresshold = std::min(device_memory, TARGET_THRESHOLD); | ||||||
|  |     const s64 min_vacancy_expected = (6 * mem_tresshold) / 10; | ||||||
|  |     const s64 min_vacancy_critical = (3 * mem_tresshold) / 10; | ||||||
|  |     minimum_memory = static_cast<u64>( | ||||||
|  |         std::max(std::min(device_memory - min_vacancy_expected, min_spacing_expected), | ||||||
|  |                  DEFAULT_EXPECTED_MEMORY)); | ||||||
|  |     critical_memory = static_cast<u64>( | ||||||
|  |         std::max(std::min(device_memory - min_vacancy_critical, min_spacing_critical), | ||||||
|  |                  DEFAULT_CRITICAL_MEMORY)); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| template <class P> | template <class P> | ||||||
| void BufferCache<P>::RunGarbageCollector() { | void BufferCache<P>::RunGarbageCollector() { | ||||||
|     const bool aggressive_gc = total_used_memory >= CRITICAL_MEMORY; |     const bool aggressive_gc = total_used_memory >= critical_memory; | ||||||
|     const u64 ticks_to_destroy = aggressive_gc ? 60 : 120; |     const u64 ticks_to_destroy = aggressive_gc ? 60 : 120; | ||||||
|     int num_iterations = aggressive_gc ? 64 : 32; |     int num_iterations = aggressive_gc ? 64 : 32; | ||||||
|     const auto clean_up = [this, &num_iterations](BufferId buffer_id) { |     const auto clean_up = [this, &num_iterations](BufferId buffer_id) { | ||||||
| @ -486,7 +508,11 @@ void BufferCache<P>::TickFrame() { | |||||||
|     const bool skip_preferred = hits * 256 < shots * 251; |     const bool skip_preferred = hits * 256 < shots * 251; | ||||||
|     uniform_buffer_skip_cache_size = skip_preferred ? DEFAULT_SKIP_CACHE_SIZE : 0; |     uniform_buffer_skip_cache_size = skip_preferred ? DEFAULT_SKIP_CACHE_SIZE : 0; | ||||||
| 
 | 
 | ||||||
|     if (total_used_memory >= EXPECTED_MEMORY) { |     // If we can obtain the memory info, use it instead of the estimate.
 | ||||||
|  |     if (runtime.CanReportMemoryUsage()) { | ||||||
|  |         total_used_memory = runtime.GetDeviceMemoryUsage(); | ||||||
|  |     } | ||||||
|  |     if (total_used_memory >= minimum_memory) { | ||||||
|         RunGarbageCollector(); |         RunGarbageCollector(); | ||||||
|     } |     } | ||||||
|     ++frame_tick; |     ++frame_tick; | ||||||
|  | |||||||
| @ -135,6 +135,24 @@ BufferCacheRuntime::BufferCacheRuntime(const Device& device_) | |||||||
|         buffer.Create(); |         buffer.Create(); | ||||||
|         glNamedBufferData(buffer.handle, 0x10'000, nullptr, GL_STREAM_COPY); |         glNamedBufferData(buffer.handle, 0x10'000, nullptr, GL_STREAM_COPY); | ||||||
|     } |     } | ||||||
|  | 
 | ||||||
|  |     device_access_memory = []() -> u64 { | ||||||
|  |         if (GLAD_GL_NVX_gpu_memory_info) { | ||||||
|  |             GLint cur_avail_mem_kb = 0; | ||||||
|  |             glGetIntegerv(GL_GPU_MEMORY_INFO_TOTAL_AVAILABLE_MEMORY_NVX, &cur_avail_mem_kb); | ||||||
|  |             return static_cast<u64>(cur_avail_mem_kb) * 1_KiB; | ||||||
|  |         } | ||||||
|  |         return 2_GiB; // Return minimum requirements
 | ||||||
|  |     }(); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | u64 BufferCacheRuntime::GetDeviceMemoryUsage() const { | ||||||
|  |     if (GLAD_GL_NVX_gpu_memory_info) { | ||||||
|  |         GLint cur_avail_mem_kb = 0; | ||||||
|  |         glGetIntegerv(GL_GPU_MEMORY_INFO_CURRENT_AVAILABLE_VIDMEM_NVX, &cur_avail_mem_kb); | ||||||
|  |         return static_cast<u64>(cur_avail_mem_kb) * 1_KiB; | ||||||
|  |     } | ||||||
|  |     return 2_GiB; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void BufferCacheRuntime::CopyBuffer(Buffer& dst_buffer, Buffer& src_buffer, | void BufferCacheRuntime::CopyBuffer(Buffer& dst_buffer, Buffer& src_buffer, | ||||||
|  | |||||||
| @ -151,6 +151,16 @@ public: | |||||||
|         use_storage_buffers = use_storage_buffers_; |         use_storage_buffers = use_storage_buffers_; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     u64 GetDeviceLocalMemory() const { | ||||||
|  |         return device_access_memory; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|  |     u64 GetDeviceMemoryUsage() const; | ||||||
|  | 
 | ||||||
|  |     bool CanReportMemoryUsage() const { | ||||||
|  |         return GLAD_GL_NVX_gpu_memory_info; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
| private: | private: | ||||||
|     static constexpr std::array PABO_LUT{ |     static constexpr std::array PABO_LUT{ | ||||||
|         GL_VERTEX_PROGRAM_PARAMETER_BUFFER_NV,          GL_TESS_CONTROL_PROGRAM_PARAMETER_BUFFER_NV, |         GL_VERTEX_PROGRAM_PARAMETER_BUFFER_NV,          GL_TESS_CONTROL_PROGRAM_PARAMETER_BUFFER_NV, | ||||||
| @ -184,6 +194,8 @@ private: | |||||||
|     std::array<OGLBuffer, VideoCommon::NUM_COMPUTE_UNIFORM_BUFFERS> copy_compute_uniforms; |     std::array<OGLBuffer, VideoCommon::NUM_COMPUTE_UNIFORM_BUFFERS> copy_compute_uniforms; | ||||||
| 
 | 
 | ||||||
|     u32 index_buffer_offset = 0; |     u32 index_buffer_offset = 0; | ||||||
|  | 
 | ||||||
|  |     u64 device_access_memory; | ||||||
| }; | }; | ||||||
| 
 | 
 | ||||||
| struct BufferCacheParams { | struct BufferCacheParams { | ||||||
|  | |||||||
| @ -141,6 +141,18 @@ StagingBufferRef BufferCacheRuntime::DownloadStagingBuffer(size_t size) { | |||||||
|     return staging_pool.Request(size, MemoryUsage::Download); |     return staging_pool.Request(size, MemoryUsage::Download); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | u64 BufferCacheRuntime::GetDeviceLocalMemory() const { | ||||||
|  |     return device.GetDeviceLocalMemory(); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | u64 BufferCacheRuntime::GetDeviceMemoryUsage() const { | ||||||
|  |     return device.GetDeviceMemoryUsage(); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | bool BufferCacheRuntime::CanReportMemoryUsage() const { | ||||||
|  |     return device.CanReportMemoryUsage(); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| void BufferCacheRuntime::Finish() { | void BufferCacheRuntime::Finish() { | ||||||
|     scheduler.Finish(); |     scheduler.Finish(); | ||||||
| } | } | ||||||
|  | |||||||
| @ -65,6 +65,12 @@ public: | |||||||
| 
 | 
 | ||||||
|     void Finish(); |     void Finish(); | ||||||
| 
 | 
 | ||||||
|  |     u64 GetDeviceLocalMemory() const; | ||||||
|  | 
 | ||||||
|  |     u64 GetDeviceMemoryUsage() const; | ||||||
|  | 
 | ||||||
|  |     bool CanReportMemoryUsage() const; | ||||||
|  | 
 | ||||||
|     [[nodiscard]] StagingBufferRef UploadStagingBuffer(size_t size); |     [[nodiscard]] StagingBufferRef UploadStagingBuffer(size_t size); | ||||||
| 
 | 
 | ||||||
|     [[nodiscard]] StagingBufferRef DownloadStagingBuffer(size_t size); |     [[nodiscard]] StagingBufferRef DownloadStagingBuffer(size_t size); | ||||||
|  | |||||||
| @ -60,8 +60,6 @@ class TextureCache { | |||||||
|     static constexpr bool HAS_DEVICE_MEMORY_INFO = P::HAS_DEVICE_MEMORY_INFO; |     static constexpr bool HAS_DEVICE_MEMORY_INFO = P::HAS_DEVICE_MEMORY_INFO; | ||||||
| 
 | 
 | ||||||
|     static constexpr s64 TARGET_THRESHOLD = 4_GiB; |     static constexpr s64 TARGET_THRESHOLD = 4_GiB; | ||||||
|     static constexpr s64 MIN_VACANCY_EXPECTED = (6 * TARGET_THRESHOLD) / 10; |  | ||||||
|     static constexpr s64 MIN_VACANCY_CRITICAL = (3 * TARGET_THRESHOLD) / 10; |  | ||||||
|     static constexpr s64 DEFAULT_EXPECTED_MEMORY = 1_GiB + 125_MiB; |     static constexpr s64 DEFAULT_EXPECTED_MEMORY = 1_GiB + 125_MiB; | ||||||
|     static constexpr s64 DEFAULT_CRITICAL_MEMORY = 1_GiB + 625_MiB; |     static constexpr s64 DEFAULT_CRITICAL_MEMORY = 1_GiB + 625_MiB; | ||||||
|     static constexpr size_t GC_EMERGENCY_COUNTS = 2; |     static constexpr size_t GC_EMERGENCY_COUNTS = 2; | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user