mirror of
https://github.com/ollama/ollama.git
synced 2025-09-29 08:53:27 +02:00
runner.go: Use correct index when retrieving embedding results
This doesn't have any impact currently because NUM_PARALLEL is forced to 1 for embeddings, so both indices will always be 0.
This commit is contained in:
@@ -454,7 +454,7 @@ func (s *Server) processBatch(tokenBatch *llama.Batch, embedBatch *llama.Batch)
|
|||||||
|
|
||||||
// if done processing the prompt, generate an embedding and return
|
// if done processing the prompt, generate an embedding and return
|
||||||
if seq.embeddingOnly {
|
if seq.embeddingOnly {
|
||||||
embed := s.lc.GetEmbeddingsSeq(i)
|
embed := s.lc.GetEmbeddingsSeq(seq.cache.Id)
|
||||||
if embed == nil {
|
if embed == nil {
|
||||||
embed = s.lc.GetEmbeddingsIth(seq.iBatch)
|
embed = s.lc.GetEmbeddingsIth(seq.iBatch)
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user