Skip to content

Commit

Permalink
add test script
Browse files Browse the repository at this point in the history
Signed-off-by: Chendi Xue <[email protected]>
  • Loading branch information
xuechendi committed Nov 27, 2024
1 parent 37f94dd commit 17af66c
Showing 1 changed file with 37 additions and 0 deletions.
37 changes: 37 additions & 0 deletions scripts/run_multi_models.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# VLLM_SKIP_WARMUP=true python3 -m \
# vllm.entrypoints.openai.mm_api_server \
# --model mistralai/Mistral-7B-Instruct-v0.3 meta-llama/Llama-3.1-8B-Instruct \
# --port 8080 --device hpu --dtype bfloat16 \
# --gpu-memory-utilization=0.3 --use-v2-block-manager --max-model-len 4096 2>&1 > multi_models.log &


bs=128
in_len=1024
out_len=1024


python benchmarks/benchmark_serving.py \
--backend vllm \
--model mistralai/Mistral-7B-Instruct-v0.3 \
--dataset-name sonnet \
--dataset-path benchmarks/sonnet.txt \
--request-rate 512 \
--num-prompts ${bs} \
--port 8080 \
--sonnet-input-len ${in_len} \
--sonnet-output-len ${out_len} \
--sonnet-prefix-len 100 \
--save-result 2>&1 > mistral-sonnet.log &

python benchmarks/benchmark_serving.py \
--backend vllm \
--model meta-llama/Llama-3.1-8B-Instruct \
--dataset-name sonnet \
--dataset-path benchmarks/sonnet.txt \
--request-rate 512 \
--num-prompts ${bs} \
--port 8080 \
--sonnet-input-len ${in_len} \
--sonnet-output-len ${out_len} \
--sonnet-prefix-len 100 \
--save-result 2>&1 > llama-sonnet.log &

0 comments on commit 17af66c

Please sign in to comment.