From 17df6520c8545a535f48de7e6316b5a60b93968d Mon Sep 17 00:00:00 2001
From: Daniel Hiltgen
Date: Thu, 13 Jun 2024 09:59:36 -0700
Subject: [PATCH] Remove mmap related output calc logic

---
 llm/memory.go | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/llm/memory.go b/llm/memory.go
index 223a18992..5afb1c2e9 100644
--- a/llm/memory.go
+++ b/llm/memory.go
@@ -197,8 +197,7 @@ func EstimateGPULayers(gpus []gpu.GpuInfo, ggml *GGML, projectors []string, opts
 	}
 
 	// Determine if we need to consider output then find where it fits
-	if ((gpus[0].Library == "metal" && opts.UseMMap) || (gpus[0].Library != "metal" || !opts.UseMMap)) &&
-		memoryLayerOutput > 0 && (opts.NumGPU < 0 || layerCount < opts.NumGPU) {
+	if memoryLayerOutput > 0 && (opts.NumGPU < 0 || layerCount < opts.NumGPU) {
 		for j := len(gpusWithSpace); j > 0; j-- {
 			g := gpusWithSpace[layerCount%j]
 			used := gpuAllocations[g.i] + max(graphPartialOffload, graphFullOffload)