mirror of
https://github.com/ollama/ollama.git
synced 2025-09-30 05:26:32 +02:00
update overhead to 15%
This commit is contained in:
@@ -131,9 +131,9 @@ func getCPUMem() (memInfo, error) {
|
|||||||
func CheckVRAM() (int64, error) {
|
func CheckVRAM() (int64, error) {
|
||||||
gpuInfo := GetGPUInfo()
|
gpuInfo := GetGPUInfo()
|
||||||
if gpuInfo.FreeMemory > 0 && (gpuInfo.Library == "cuda" || gpuInfo.Library == "rocm") {
|
if gpuInfo.FreeMemory > 0 && (gpuInfo.Library == "cuda" || gpuInfo.Library == "rocm") {
|
||||||
// leave 10% or 400MiB of VRAM free for overhead
|
// leave 15% or 400MiB of VRAM free for overhead
|
||||||
overhead := gpuInfo.FreeMemory / 10
|
overhead := gpuInfo.FreeMemory * 3 / 20
|
||||||
minOverhead := 400 * 1024 * 1024
|
minOverhead := int64(400 * 1024 * 1024)
|
||||||
if overhead < minOverhead {
|
if overhead < minOverhead {
|
||||||
overhead = minOverhead
|
overhead = minOverhead
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user