diff --git a/examples/server/bench/docker-compose.yml b/examples/server/bench/docker-compose.yml index 8a4b3b02d3fd6..493daed62cd90 100644 --- a/examples/server/bench/docker-compose.yml +++ b/examples/server/bench/docker-compose.yml @@ -17,6 +17,6 @@ services: export SERVER_BENCH_DATASET=/dataset.json export SERVER_BENCH_N_PROMPTS=50 export SERVER_BENCH_MAX_TOKENS=50 - ./k6 run /src/script.js --duration 5m --iterations 250 + ./k6 run /src/script.js --duration 5m --iterations 100 volumes: - ./:/src:Z diff --git a/examples/server/bench/script.js b/examples/server/bench/script.js index 6c2e6e0d3657f..69854efe9c4af 100644 --- a/examples/server/bench/script.js +++ b/examples/server/bench/script.js @@ -5,7 +5,7 @@ import {Counter, Rate, Trend} from 'k6/metrics' import exec from 'k6/execution'; // Number of virtual users -const n_uvs = 50; +const n_uvs = 16; // Server chat completions prefix const server_url = __ENV.SERVER_BENCH_URL ? __ENV.SERVER_BENCH_URL : 'http://localhost:8080/v1' @@ -130,9 +130,6 @@ export default function () { completions_tokens = chunk.usage.completion_tokens metric_completion_tokens.add(completions_tokens) metric_completion_tokens_total_counter.add(completions_tokens) - } else { - metric_completion_tokens.add(1) - metric_completion_tokens_total_counter.add(1) } })