Skip to content

Commit 71a88ea

Browse files
committed
fix bench script
Signed-off-by: jthomson04 <[email protected]>
1 parent e41b80d commit 71a88ea

File tree

1 file changed

+0
-20
lines changed
  • components/backends/trtllm/performance_sweeps/scripts

1 file changed

+0
-20
lines changed

components/backends/trtllm/performance_sweeps/scripts/bench.sh

Lines changed: 0 additions & 20 deletions
Original file line number | Diff line number | Diff line change
@@ -232,26 +232,6 @@ for concurrency in ${concurrency_list}; do
232 232
-H 'Authorization: Bearer NOT USED' \
233 233
-H 'Accept: text/event-stream'
234 234
fi
235-
python3 ${SCRIPTS_DIR}/scripts/bench/benchmark_serving.py \
236-
--served-model-name ${model} \
237-
--model ${model_path} \
238-
--dataset-name random \
239-
--num-prompts "$num_prompts" \
240-
--random-input-len ${isl} \
241-
--random-output-len ${osl} \
242-
--random-range-ratio 0.8 \
243-
--use-chat-template \
244-
--ignore-eos \
245-
--use-chat-template \
246-
--backend "dynamo" \
247-
--endpoint "/v1/completions" \
248-
--percentile-metrics ttft,tpot,itl,e2el \
249-
--max-concurrency "$concurrency" \
250-
--host ${hostname} \
251-
--port ${port} \
252-
--save-result \
253-
--result-dir "${log_path}/results" \
254-
--result-filename "results_concurrency_${original_concurrency}_gpus_${total_gpus}_ctx_${prefill_gpus}_gen_${decode_gpus}.json"
255 235

256 236
echo "Benchmark with concurrency ${concurrency} done"
257 237
done

0 commit comments

Comments
 (0)