sicer
/

gbc-backup

Model card Files Files and versions Community

gbc-backup / content /open-o1 /vllm_server.sh

sicer's picture

Initial commit from existing repo

e9fa53a 5 months ago

history blame contribute delete

487 Bytes

	# Launch `vllm serve` for one model on a contiguous range of GPU indices.
	#
	# Usage:
	#   vllm_server.sh MODEL_PATH MODEL_NAME API_KEY PORT TP FIRST_GPU LAST_GPU
	#
	# Arguments:
	#   $1  MODEL_PATH  model path/identifier handed to `vllm serve`
	#   $2  MODEL_NAME  value for --served-model-name
	#   $3  API_KEY     value for --api-key
	#   $4  PORT        value for --port
	#   $5  TP          value for --tensor-parallel-size
	#   $6  FIRST_GPU   first GPU index (non-negative integer)
	#   $7  LAST_GPU    last GPU index, inclusive (>= FIRST_GPU)
	#
	# Outputs: a one-line startup banner on stdout (API key redacted);
	#          usage/validation errors on stderr.
	# Returns: 2 on bad arguments, otherwise the exit status of `vllm`.
	launch_vllm_server() {
		if (( $# < 7 )); then
			printf 'Usage: %s MODEL_PATH MODEL_NAME API_KEY PORT TP FIRST_GPU LAST_GPU\n' \
				"${0##*/}" >&2
			return 2
		fi

		local model_path=$1
		local model_name=$2
		local api_key=$3
		local port=$4
		local tp=$5
		local first_gpu=$6
		local last_gpu=$7

		# Reject non-numeric bounds up front instead of letting seq fail later.
		if ! [[ "$first_gpu" =~ ^[0-9]+$ && "$last_gpu" =~ ^[0-9]+$ ]]; then
			printf 'error: FIRST_GPU and LAST_GPU must be non-negative integers (got "%s" "%s")\n' \
				"$first_gpu" "$last_gpu" >&2
			return 2
		fi

		# Build the comma-separated device list, e.g. FIRST_GPU=0 LAST_GPU=3 -> 0,1,2,3.
		local visible_devices
		visible_devices=$(seq -s, "$first_gpu" "$last_gpu") || return
		# seq prints nothing for a reversed range; an empty CUDA_VISIBLE_DEVICES
		# would be exported as-is, so treat that as an argument error.
		if [[ -z "$visible_devices" ]]; then
			printf 'error: empty GPU range %s..%s (FIRST_GPU must be <= LAST_GPU)\n' \
				"$first_gpu" "$last_gpu" >&2
			return 2
		fi

		# The API key is deliberately not printed so it does not end up in logs.
		printf '%s\n' "MODEL-PATH ${model_path} API_key *** PORT ${port} TP ${tp} cuda visiable devices : ${visible_devices}"

		# An array keeps every argument a single word even if it contains spaces.
		# NOTE(review): the key is still passed on vllm's command line and may be
		# visible to other local users via the process list; vLLM also documents a
		# VLLM_API_KEY environment variable — confirm for the deployed version.
		local -a serve_args=(
			serve "$model_path"
			--port "$port"
			--tensor-parallel-size "$tp"
			--served-model-name "$model_name"
			--enable-chunked-prefill
			--enforce-eager
			--api-key "$api_key"
			--disable-log-requests
			--max-model-len 8192
		)

		# The assignment prefix scopes CUDA_VISIBLE_DEVICES to this one command.
		CUDA_VISIBLE_DEVICES="$visible_devices" vllm "${serve_args[@]}"
	}

	launch_vllm_server "$@"