File size: 292 Bytes
ee78b3d
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
#!/usr/bin/env bash
#
# Launch api_server.py for the model named by MODEL_NAME.
#
# Every path below is relative, so the script has to be started from the
# directory that holds api_server.py and the tmp/ tree.
#
# Strict mode: stop at the first failing command (-e), treat an unset variable
# as an error (-u), fail a pipeline if any stage fails (pipefail), and echo
# each command before running it (-x).
set -euxo pipefail

# Exported, so the value is also present in the environment of the python
# process started below.
export MODEL_NAME="Dolphin"

# The expansions are quoted so that each path reaches python as exactly one
# argument, even if MODEL_NAME is later changed to a value containing spaces
# or glob characters.
python api_server.py \
    --hf_model_dir "tmp/hf_models/${MODEL_NAME}" \
    --visual_engine_dir "tmp/trt_engines/${MODEL_NAME}/vision_encoder" \
    --llm_engine_dir "tmp/trt_engines/${MODEL_NAME}/1-gpu/bfloat16" \
    --max_batch_size 16