Bump VRAM buffer back up
Under heavy concurrency stress we're seeing OOMs, so raising the minimum VRAM buffer back up should help stabilize allocations.
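For context, a minimal sketch of how a per-GPU minimum-memory buffer like cudaMinimumMemory can be held back when deciding how much free VRAM to offer a model load. This is not the actual ollama scheduler code; the local MebiByte constant and the usableVRAM helper are made up for illustration.

package main

import "fmt"

// MebiByte mirrors the unit used by ollama's format package (1 MiB).
const MebiByte = 1024 * 1024

// cudaMinimumMemory is the per-GPU buffer reserved from scheduling,
// using the new value from this commit.
const cudaMinimumMemory = 457 * MebiByte

// usableVRAM is a hypothetical helper: it returns how much of a GPU's
// reported free memory may be handed to a model load, after reserving
// the minimum buffer to absorb allocation spikes under concurrent requests.
func usableVRAM(freeMemory uint64) uint64 {
	if freeMemory <= cudaMinimumMemory {
		return 0 // not enough headroom; skip this GPU
	}
	return freeMemory - cudaMinimumMemory
}

func main() {
	free := uint64(8 * 1024 * MebiByte) // e.g. 8 GiB reported free
	fmt.Printf("schedulable VRAM: %d MiB\n", usableVRAM(free)/MebiByte)
}

A larger buffer trades a little schedulable VRAM for fewer out-of-memory failures when several requests allocate at once.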
@@ -31,8 +31,8 @@ type handles struct {
 }
 
 const (
-	cudaMinimumMemory = 256 * format.MebiByte
-	rocmMinimumMemory = 256 * format.MebiByte
+	cudaMinimumMemory = 457 * format.MebiByte
+	rocmMinimumMemory = 457 * format.MebiByte
 )
 
 var gpuMutex sync.Mutex
@@ -15,7 +15,7 @@ import (
 )
 
 const (
-	metalMinimumMemory = 384 * format.MebiByte
+	metalMinimumMemory = 512 * format.MebiByte
 )
 
 func GetGPUInfo() GpuInfoList {