File size: 427 Bytes
264681b
 
946e50b
 
 
 
 
d487566
264681b
aa7ea36
 
 
 
 
 
 
 
6b752ad
946e50b
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#!/bin/bash
#
# Downloads a Hugging Face model into ./data and serves it with vLLM.
#
# Requires on PATH: huggingface-cli, vllm (and, while the temporary
# diagnostics below remain, nvm/node/npm).

# Strict mode is set here rather than in the shebang so it still applies when
# the script is invoked as `bash <script>`:
#   -e          abort on the first failing command
#   -u          treat use of an unset variable as an error
#   -x          trace each command before executing it
#   -o pipefail a pipeline fails if any stage fails
set -euxo pipefail

# TODO: remove these toolchain version diagnostics once no longer needed.
# NOTE(review): nvm is usually a shell function loaded from nvm.sh; confirm it
# is defined in this non-interactive shell, otherwise `set -e` aborts here.
nvm --version
node --version
npm --version

# Directory that holds the downloaded model files.
DATA_DIR=./data
mkdir -p "${DATA_DIR}"

# Hugging Face repo id, its last path component, and the local download target.
HF_MODEL_PATH=Qwen/Qwen2.5-1.5B-Instruct
HF_MODEL_NAME=$(basename -- "${HF_MODEL_PATH}")
LOCAL_MODEL_PATH="${DATA_DIR}/${HF_MODEL_NAME}"

# Download the model; HF_HUB_ENABLE_HF_TRANSFER=1 is set only for this command.
HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download "${HF_MODEL_PATH}" \
  --local-dir "${LOCAL_MODEL_PATH}"

# Start the vLLM server from the local copy, exposing it under the short
# model name instead of the local filesystem path.
vllm serve "${LOCAL_MODEL_PATH}" --served-model-name "${HF_MODEL_NAME}"