# Testbench configuration and run header.
#
# log_sum      - summary log that each run appends its results to.
# model_ids    - model identifiers to sweep over.
# num_devices  - device counts to sweep over.
log_sum="log/service_model_device.txt"

model_ids=("TinyLlama/TinyLlama-1.1B-Chat-v1.0") # "facebook/opt-1.3b" "huggyllama/llama-7b")
num_devices=(2) # previously swept: (1 2 4)

# The summary log and the per-run logs are written under this directory;
# create it up front so the redirections below cannot fail on a fresh checkout.
mkdir -p -- "${log_sum%/*}"

# Stamp the start of this run on the console and in the summary log.
# The date format must begin with '+' (no leading space) or date rejects it.
current_datetime=$(date "+%Y-%m-%d %H:%M:%S")
printf '%s\n' "$current_datetime"
printf '%s\n' "$current_datetime" >> "${log_sum}"
1010
11- " " "
1211for model_id in " ${model_ids[@]} " ; do
1312 for num_device in " ${num_devices[@]} " ; do
1413 # IFS='\' read -ra parts <<< "$model_id"
@@ -19,12 +18,11 @@ for model_id in "${model_ids[@]}"; do
1918 echo " *********************************"
2019 python lpu_inference_arg.py -m ${model_id} -n ${num_device} > log/inference_${model_name} _${num_device} .txt
2120 echo " *********************************" >> ${log_sum}
22- echo " The Result of log/inference_${model_name} _${num_device} .txt" >> ${log_sum}
21+ echo " [Testbench] The Result of log/inference_${model_name} _${num_device} .txt" >> ${log_sum}
2322 tail -n 1 " log/inference_${model_name} _${num_device} .txt" >> ${log_sum}
2423 echo " " >> ${log_sum}
2524 done
2625done
27- " " "
2826
2927for model_id in " ${model_ids[@]} " ; do
3028 for num_device in " ${num_devices[@]} " ; do
@@ -36,10 +34,10 @@ for model_id in "${model_ids[@]}"; do
3634
3735 # Waiting for server
3836 while ! nc -z localhost " 8000" ; do
39- echo " Waiting for server..."
37+ echo " [Testbench] Waiting for server..."
4038 sleep 3
4139 done
42- echo " The server is ready!"
40+ echo " [Testbench] The server is ready!"
4341
4442 python lpu_client.py > log/vllm_serve_${model_name} _${num_device} .txt
4543
@@ -49,10 +47,10 @@ for model_id in "${model_ids[@]}"; do
4947 kill -SIGINT " $PID "
5048 while true ; do
5149 if ps -p " $PID " > /dev/null; then
52- echo " Kill the process..."
50+ echo " [Testbench] Kill the process..."
5351 sleep 3
5452 else
55- echo " Process (PID: $PID ) is killed."
53+ echo " [Testbench] Process (PID: $PID ) is killed."
5654 break
5755 fi
5856 done
0 commit comments