Fix CUDA allocator active-memory accounting to add buf->size instead of the requested size (#2717)

2025-12-16 01:49:05 +08:00 · 2025-10-30 14:27:15 -07:00
parent 793a31eeb6
commit 68c5fa1c95
2 changed files with 15 additions and 2 deletions
--- a/mlx/backend/cuda/allocator.cpp
+++ b/mlx/backend/cuda/allocator.cpp
@@ -97,7 +97,6 @@ CudaAllocator::CudaAllocator()

 Buffer CudaAllocator::malloc(size_t size) {
  // Find available buffer from cache.
-  auto orig_size = size;
  std::unique_lock lock(mutex_);
  if (size <= small_block_size) {
    size = 8;
@@ -131,7 +130,7 @@ Buffer CudaAllocator::malloc(size_t size) {
    }
    lock.lock();
  }
-  active_memory_ += size;
+  active_memory_ += buf->size;
  peak_memory_ = std::max(active_memory_, peak_memory_);

  // Maintain the cache below the requested limit.