# Provenance (from the hosting page's file header):
#   Morgan Funtowicz - feat(text-generation): default to transformers backend as much as we can
#   commit 0727aa0, 304 Bytes
# Image definition: the upstream SGLang image plus a custom entrypoint script.

# Tag of the base image. Defaults to "latest", which is what this file has
# always built against; pass `--build-arg SGLANG_TAG=<tag>` to pin a specific
# upstream release and get a reproducible build.
ARG SGLANG_TAG=latest
FROM lmsysorg/sglang:${SGLANG_TAG}

# Default runtime configuration baked into the image environment. Every value
# can be overridden when the container is started (e.g. `docker run -e ...`).
# NOTE(review): presumably these are read by entrypoint.sh, which is not part
# of this file - confirm the exact meaning of each variable against it.
ENV MODEL_ID="/repository" \
    MODEL_IMPL="transformers" \
    KV_CACHE_DTYPE="auto" \
    TP_SIZE="1" \
    QUANT_METHOD="w8a8_int8"

# EXPOSE is documentation only; it does not publish the port by itself.
EXPOSE 80

# Copy the entrypoint and make it executable in the same layer. A separate
# `RUN chmod +x` would add another layer holding a second copy of the script.
# (`COPY --chmod` requires BuildKit, the default builder in current Docker.)
COPY --chmod=0755 entrypoint.sh /usr/local/endpoint/

# Exec (JSON-array) form: the script is started directly, without a wrapping shell.
ENTRYPOINT ["/usr/local/endpoint/entrypoint.sh"]