# Author: mfuntowicz (HF Staff)
# Commit: feat(quant): allow using native precision (#3)
# Revision: 43e8c6f (verified)
# Container image that wraps the upstream SGLang image with a custom
# entrypoint script.

# Base-image tag. The default keeps the previous behaviour (`latest`), but a
# floating tag makes builds non-reproducible; pin it at build time, e.g.
#   docker build --build-arg SGLANG_TAG=<version> .
ARG SGLANG_TAG=latest
FROM lmsysorg/sglang:${SGLANG_TAG}

# Runtime defaults; each can be overridden with `docker run -e NAME=value`.
# NOTE(review): these are presumably read by entrypoint.sh (not visible
# here) -- confirm the exact semantics against that script.
#   MODEL_ID       - path (or identifier) of the model to load
#   KV_CACHE_DTYPE - KV-cache data type; "auto" is the default
#   TP_SIZE        - presumably the tensor-parallel size
#   QUANT_METHOD   - quantization method; empty by default (presumably
#                    meaning "no quantization / native precision")
ENV MODEL_ID="/repository" \
    KV_CACHE_DTYPE="auto" \
    TP_SIZE="1" \
    QUANT_METHOD=""

# Documentation only: EXPOSE does not publish the port by itself.
EXPOSE 80

# Install the entrypoint already marked executable. Using --chmod on COPY
# (BuildKit) avoids a separate `RUN chmod` layer that would duplicate the file.
COPY --chmod=0755 entrypoint.sh /usr/local/endpoint/

# Exec form so the script runs as PID 1 and receives signals directly.
ENTRYPOINT ["/usr/local/endpoint/entrypoint.sh"]