File size: 324 Bytes
96ef4b5
 
 
 
 
 
 
 
 
 
8e33f66
96ef4b5
8e33f66
1
2
3
4
5
6
7
8
9
10
11
12
13
14
#!/bin/bash
#
# Launch the SGLang server (python3 -m sglang.launch_server), bound to
# 0.0.0.0 on port 80.
#
# Required environment variables (all must be set and non-empty):
#   MODEL_ID        value passed to --model-path
#   KV_CACHE_DTYPE  value passed to --kv-cache-dtype
#   TP_SIZE         value passed to both --tensor-parallel-size and
#                   --expert-parallel-size
#   QUANT_METHOD    value passed to --quantization

set -euo pipefail

# Fail fast with a clear message. Without this, a missing value would make
# the next flag be consumed as the previous option's argument and the server
# would die with a confusing argument-parsing error.
: "${MODEL_ID:?MODEL_ID must be set}"
: "${KV_CACHE_DTYPE:?KV_CACHE_DTYPE must be set}"
: "${TP_SIZE:?TP_SIZE must be set}"
: "${QUANT_METHOD:?QUANT_METHOD must be set}"

# exec replaces this shell with the server process, so signals sent to the
# script's PID (e.g. SIGTERM on shutdown) reach the server directly and the
# server's exit status becomes the script's exit status.
# NOTE(review): --expert-parallel-size reuses TP_SIZE; presumably intentional
# (EP size == TP size) -- confirm against the deployment's requirements.
exec python3 -m sglang.launch_server \
  --model-path "$MODEL_ID" \
  --kv-cache-dtype "$KV_CACHE_DTYPE" \
  --tensor-parallel-size "$TP_SIZE" \
  --expert-parallel-size "$TP_SIZE" \
  --quantization "$QUANT_METHOD" \
  --enable-torch-compile \
  --enable-ep-moe \
  --tool-call-parser qwen25 \
  --host 0.0.0.0 \
  --port 80