mirror of https://github.com/ollama/ollama.git
use benchmark loop
@@ -83,8 +83,7 @@ func BenchmarkColdStart(b *testing.B) {
 			// Set number of tokens as our throughput metric
 			b.SetBytes(int64(tt.maxTokens))
 
-			b.ResetTimer()
-			for range b.N {
+			for b.Loop() {
 				b.StopTimer()
 				// Ensure model is unloaded before each iteration
 				unload(client, m, b)
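
Both hunks adopt the testing.B.Loop iteration style added in Go 1.24. A minimal sketch of the before/after pattern, assuming Go 1.24+; BenchmarkExample and work are illustrative names, not from the Ollama code:

package bench

import "testing"

func BenchmarkExample(b *testing.B) {
	data := make([]byte, 1024) // expensive setup, kept out of the timed region

	// Old pattern, replaced by this commit:
	//
	//	b.ResetTimer()
	//	for range b.N {
	//		work(data)
	//	}
	//
	// New pattern: b.Loop() resets the timer on its first call and
	// decides itself when to stop, so the explicit b.ResetTimer()
	// becomes redundant and is dropped in the diff.
	for b.Loop() {
		work(data)
	}
}

func work(buf []byte) {
	for i := range buf {
		buf[i]++
	}
}

A further benefit of b.Loop over the b.N form is that the benchmark function runs exactly once, so setup code before the loop executes once rather than once per calibration pass.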
@@ -122,12 +121,11 @@ func BenchmarkWarmStart(b *testing.B) {
 			// Set number of tokens as our throughput metric
 			b.SetBytes(int64(tt.maxTokens))
 
-			b.ResetTimer()
-			for range b.N {
+			for b.Loop() {
 				req := &api.GenerateRequest{
 					Model:   m,
 					Prompt:  tt.prompt,
-					Options: map[string]interface{}{"num_predict": tt.maxTokens, "temperature": 0.1},
+					Options: map[string]any{"num_predict": tt.maxTokens, "temperature": 0.1},
 				}
 
 				runGenerateBenchmark(b, ctx, client, req)
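
The second change in this hunk is cosmetic: any has been a predeclared alias for interface{} since Go 1.18, so the Options map keeps exactly the same type. A small standalone sketch (not from the Ollama code) demonstrating the equivalence:

package main

import "fmt"

func main() {
	// any is an alias, not a distinct type, so the two
	// literals are fully interchangeable.
	oldStyle := map[string]interface{}{"num_predict": 100, "temperature": 0.1}
	newStyle := map[string]any{"num_predict": 100, "temperature": 0.1}

	oldStyle = newStyle // legal: the types are identical
	fmt.Printf("%T\n%T\n", oldStyle, newStyle)
	// Both lines print: map[string]interface {}
}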