File tree Expand file tree Collapse file tree 1 file changed +0
-20
lines changed
components/backends/trtllm/performance_sweeps/scripts Expand file tree Collapse file tree 1 file changed +0
-20
lines changed Original file line number Diff line number Diff line change @@ -232,26 +232,6 @@ for concurrency in ${concurrency_list}; do
232232 -H ' Authorization: Bearer NOT USED' \
233233 -H ' Accept: text/event-stream'
234234 fi
235- python3 ${SCRIPTS_DIR} /scripts/bench/benchmark_serving.py \
236- --served-model-name ${model} \
237- --model ${model_path} \
238- --dataset-name random \
239- --num-prompts " $num_prompts " \
240- --random-input-len ${isl} \
241- --random-output-len ${osl} \
242- --random-range-ratio 0.8 \
243- --use-chat-template \
244- --ignore-eos \
245- --use-chat-template \
246- --backend " dynamo" \
247- --endpoint " /v1/completions" \
248- --percentile-metrics ttft,tpot,itl,e2el \
249- --max-concurrency " $concurrency " \
250- --host ${hostname} \
251- --port ${port} \
252- --save-result \
253- --result-dir " ${log_path} /results" \
254- --result-filename " results_concurrency_${original_concurrency} _gpus_${total_gpus} _ctx_${prefill_gpus} _gen_${decode_gpus} .json"
255235
256236 echo " Benchmark with concurrency ${concurrency} done"
257237done
You can’t perform that action at this time.
0 commit comments