mac: fix stale VRAM data (#12972)

The scheduler updates free VRAM based on the currently loaded models. This was mutating the persisted list of GPUs, and when coupled with the non-refreshing logic for Metal, that led to stale low VRAM reporting after unload. The fix is to make sure GPU discovery always returns a copy, so the scheduler's GPU list is in fact ephemeral and doesn't leak any temporary adjustments back into the persistent list.
2025-12-21 14:26:30 +00:00 · 2025-11-05 11:55:17 -08:00
parent f89fc1cadd
commit 6aa7283076
1 changed file with 2 additions and 2 deletions
--- a/discover/runner.go
+++ b/discover/runner.go
@@ -237,7 +237,7 @@ func GPUDevices(ctx context.Context, runners []ml.FilteredRunnerDiscovery) []ml.
 	} else {
 		if runtime.GOOS == "darwin" && runtime.GOARCH == "arm64" {
 			// metal never updates free VRAM
-			return devices
+			return append([]ml.DeviceInfo{}, devices...)
 		}
 		slog.Debug("refreshing free memory")
@@ -336,7 +336,7 @@ func GPUDevices(ctx context.Context, runners []ml.FilteredRunnerDiscovery) []ml.
 		}
 	}
-	return devices
+	return append([]ml.DeviceInfo{}, devices...)
 }
 func filterOverlapByLibrary(supported map[string]map[string]map[string]int, needsDelete []bool) {