mirror of
https://github.com/ollama/ollama.git
synced 2025-03-28 02:33:14 +01:00
add command-r graph estimate
This commit is contained in:
parent
483b81a863
commit
01f77ae25d
@@ -327,7 +327,7 @@ func (llm GGML) GraphSize(context, batch int) (int64, bool) {
|
||||
}
|
||||
|
||||
switch llm.KV().Architecture() {
|
||||
-case "gemma":
|
||||
+case "gemma", "command-r":
|
||||
return 4 * int64(batch) * int64(embeddingLength+uint64(vocabLength)), true
|
||||
case "phi2":
|
||||
return max(
|
||||
|
Loading…
x
Reference in New Issue
Block a user