mirror of
https://github.com/ollama/ollama.git
synced 2025-04-08 03:48:21 +02:00
runner.go: Use correct index when retrieving embedding results
This doesn't have any impact currently because NUM_PARALLEL is forced to 1 for embeddings, so both indices will always be 0.
This commit is contained in:
parent
ecf41eed05
commit
5f68fcab12
@@ -454,7 +454,7 @@ func (s *Server) processBatch(tokenBatch *llama.Batch, embedBatch *llama.Batch)
|
||||
|
||||
// if done processing the prompt, generate an embedding and return
|
||||
if seq.embeddingOnly {
|
||||
- embed := s.lc.GetEmbeddingsSeq(i)
|
||||
+ embed := s.lc.GetEmbeddingsSeq(seq.cache.Id)
|
||||
if embed == nil {
|
||||
embed = s.lc.GetEmbeddingsIth(seq.iBatch)
|
||||
}
|
||||
|
Loading…
x
Reference in New Issue
Block a user