Integration test improvements (#9654)

Add new test coverage for various model architectures, and switch the integration tests from orca-mini to the small llama model.
2025-11-11 02:57:45 +01:00 · 2025-04-16 14:25:55 -07:00
parent 56dc316a57
commit ed4e139314
9 changed files with 709 additions and 67 deletions
--- a/integration/max_queue_test.go
+++ b/integration/max_queue_test.go
@@ -30,7 +30,7 @@ func TestMaxQueue(t *testing.T) {
 	t.Setenv("OLLAMA_MAX_QUEUE", strconv.Itoa(threadCount))

 	req := api.GenerateRequest{
-		Model:  "orca-mini",
+		Model:  smol,
 		Prompt: "write a long historical fiction story about christopher columbus.  use at least 10 facts from his actual journey",
 		Options: map[string]any{
 			"seed":        42,
@@ -61,7 +61,7 @@ func TestMaxQueue(t *testing.T) {
 	}()

 	// Give the generate a chance to get started before we start hammering on embed requests
-	time.Sleep(5 * time.Millisecond)
+	time.Sleep(10 * time.Millisecond)

 	threadCount += 10 // Add a few extra to ensure we push the queue past its limit
 	busyCount := 0