# Offline inference smoke test.
#
# Runs examples/offline_inference.py inside the vllm/vllm-openai:v0.9.2 image
# on a self-hosted GPU runner, after installing this repository in editable
# mode and applying the vLLM 0.9.2 adapter patch to the installed vllm package.
#
# Triggers:
#   - workflow_dispatch: manual run against the ref it was dispatched on.
#   - schedule: daily at 19:00 (GitHub evaluates cron expressions in UTC);
#     scheduled runs always test the `develop` branch.
name: offline_inference_test

on:
  workflow_dispatch:

  schedule:
    - cron: '0 19 * * *'

jobs:
  offline-inference:
    runs-on: [self-hosted, gpu]

    steps:
      # Scheduled events check out `develop`; any other event checks out the
      # ref that triggered the run.
      - name: Checkout code
        uses: actions/checkout@v4
        with:
          ref: ${{ github.event_name == 'schedule' && 'develop' || github.ref_name }}

      # `git branch --show-current` succeeds with empty output on a detached
      # HEAD, so the fallback must be keyed on empty output rather than on the
      # exit status; otherwise the tag / short-SHA fallbacks never run.
      - name: Show actual branch & commit
        run: |
          echo "== Working branch =="
          echo "Latest commit: $(git log --oneline -1)"
          current_ref="$(git branch --show-current 2>/dev/null || true)"
          if [ -z "$current_ref" ]; then
            current_ref="$(git describe --tags --exact-match 2>/dev/null || git rev-parse --short HEAD)"
          fi
          echo "On branch : $current_ref"

      # Fails the job early if the runner's GPU driver is not usable.
      - run: nvidia-smi

      # The whole script is passed to `bash -c` as one double-quoted string, so
      # every `$` that must be expanded inside the container is written `\$`.
      #
      # NOTE(review): `http.sslVerify false` turns off TLS certificate
      # verification for git inside the container. Presumably needed because
      # of the proxy at 172.80.0.1:7890 - confirm, and prefer trusting the
      # proxy's CA certificate instead.
      # NOTE(review): git documents `http.proxy` (used for https URLs as well);
      # the `https.proxy` key looks like a no-op - confirm before relying on it.
      - name: Run offline_inference in container
        run: |
          docker run --rm \
            --gpus all \
            --network=host \
            -v ${{ github.workspace }}:/workspace/unified-cache-management \
            -v /home/models/Qwen2.5-1.5B-Instruct:/home/models/Qwen2.5-1.5B-Instruct \
            -w /workspace/unified-cache-management \
            --entrypoint /bin/bash \
            vllm/vllm-openai:v0.9.2 \
            -c "
              set -euxo pipefail
              export PLATFORM=cuda
              export MODEL_PATH=/home/models/Qwen2.5-1.5B-Instruct
              export http_proxy=http://172.80.0.1:7890
              pip config set global.index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
              git config --global http.version HTTP/1.1
              git config --global http.sslVerify false
              git config --global http.proxy \$http_proxy
              git config --global https.proxy \$http_proxy
              pip install -v -e . --no-build-isolation
              cd \$(pip show vllm | grep Location | awk '{print \$2}')
              git apply /workspace/unified-cache-management/ucm/integration/vllm/patch/0.9.2/vllm-adapt.patch
              cd /workspace/unified-cache-management
              python3 examples/offline_inference.py
            "