Integration test improvements (#9654)

Add some new test coverage for various model architectures,
and switch from orca-mini to the small llama model.
This commit is contained in:
Daniel Hiltgen
2025-04-16 14:25:55 -07:00
committed by GitHub
parent 56dc316a57
commit ed4e139314
9 changed files with 709 additions and 67 deletions

View File

@@ -30,7 +30,7 @@ func TestMaxQueue(t *testing.T) {
t.Setenv("OLLAMA_MAX_QUEUE", strconv.Itoa(threadCount))
req := api.GenerateRequest{
-Model: "orca-mini",
+Model: smol,
Prompt: "write a long historical fiction story about christopher columbus. use at least 10 facts from his actual journey",
Options: map[string]any{
"seed": 42,
@@ -61,7 +61,7 @@ func TestMaxQueue(t *testing.T) {
}()
// Give the generate a chance to get started before we start hammering on embed requests
-time.Sleep(5 * time.Millisecond)
+time.Sleep(10 * time.Millisecond)
threadCount += 10 // Add a few extra to ensure we push the queue past its limit
busyCount := 0