Skip to content

Commit fb5a89e

Browse files
author
Le Yao
committed
Using CPU_ISA as the accelerator env value
Signed-off-by: Le Yao <le.yao@intel.com>
1 parent c142110 commit fb5a89e

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

container/cnagc-fastchat-k8s/entrypoint.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -36,14 +36,14 @@ case "$DEPLOY_TYPE" in
36 36
else
37 37
../models/get_models.sh "$MODEL_NAME"
38 38
fi
39-
log "Check ISA from environment: ATEN_CPU_CAPABILITY=${ATEN_CPU_CAPABILITY}"
39+
log "Check ISA from environment: ATEN_CPU_CAPABILITY=${CPU_ISA}"
40 40
log "Check ISA from pytorch:"
41 41
/opt/conda/bin/python -c 'import intel_extension_for_pytorch._C as core;print(core._get_current_isa_level())'
42 42

43 43
export LD_PRELOAD="/opt/conda/lib/libiomp5.so:/usr/lib/x86_64-linux-gnu/libtcmalloc.so"
44 44
MODEL_PATH="$MODEL_NAME" # Adjust this path based on where the get_model script downloads the models
45 45
log "Starting model worker on port ${MODEL_WORKER_PORT}..."
46-
/opt/conda/bin/python -m fastchat.serve.model_worker --model-path "${MODEL_PATH}" --model-names "${MODEL_NAME}-${ATEN_CPU_CAPABILITY}" --worker-address http://"${MODEL_WORKER_SVC}":"${MODEL_WORKER_PORT}" --controller-address http://"${CONTROLLER_SVC}":"${CONTROLLER_PORT}" --host 0.0.0.0 --port "${MODEL_WORKER_PORT}" --device cpu
46+
/opt/conda/bin/python -m fastchat.serve.model_worker --model-path "${MODEL_PATH}" --model-names "${MODEL_NAME}-${CPU_ISA}" --worker-address http://"${MODEL_WORKER_SVC}":"${MODEL_WORKER_PORT}" --controller-address http://"${CONTROLLER_SVC}":"${CONTROLLER_PORT}" --host 0.0.0.0 --port "${MODEL_WORKER_PORT}" --device cpu
47 47
;;
48 48
"openaiapi")
49 49
log "Starting OpenAI API server on port ${OPENAI_API_PORT}..."

0 commit comments

Comments
 (0)