# chatbot/Dockerfile (commit dbd2ac6 "init", by kelvin-t-lu; 794 bytes)
# Base image: CUDA 11.8 + cuDNN 8 on Ubuntu 20.04.
# The -devel variant is needed for the bitsandbytes requirement of libcudart.so;
# otherwise the -runtime variant would be sufficient.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: exported to every RUN step so package tooling does not prompt,
# but (unlike ENV) not left behind in the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Prepend /h2ogpt_conda/bin to PATH for later build steps and for the runtime.
ENV PATH="/h2ogpt_conda/bin:${PATH}"
# Kept so that `--build-arg PATH=...` remains an accepted build argument.
# An ENV always overrides an ARG of the same name, so the ENV above is the
# value RUN steps actually see.
ARG PATH="/h2ogpt_conda/bin:${PATH}"

# Runtime environment: HOME points at the application directory, CUDA_HOME at
# the CUDA 11.8 toolkit path, and VLLM_CACHE at a cache directory under /workspace.
ENV HOME=/workspace
ENV CUDA_HOME=/usr/local/cuda-11.8
ENV VLLM_CACHE=/workspace/.vllm_cache

# All following relative paths (COPY, RUN, CMD) resolve against /workspace.
WORKDIR /workspace
# Copy the entire build context into the image. Anything not excluded by a
# .dockerignore ends up in /workspace, so keep secrets and build output out of
# the context.
COPY . /workspace/

# Run the project's build script from the current WORKDIR (/workspace), then
# make /workspace readable, writable and executable for all users.
# NOTE(review): the wide-open mode is presumably so the non-root runtime user
# can write there; confirm whether a narrower chown would do.
# Both steps share one RUN so the recursive chmod does not re-record every file
# under /workspace in an additional image layer.
RUN ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace
# Identity of the unprivileged account created in the image. Each value can be
# overridden at build time, e.g. `--build-arg uid=$(id -u) --build-arg gid=$(id -g)`.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000

# Create the group first, then a user in that group with bash as login shell.
# Expansions are quoted so an unusual build-arg value cannot be word-split or
# glob-expanded by the shell.
RUN groupadd --gid "${gid}" "${group}" \
    && useradd --uid "${uid}" --gid "${group}" --shell /bin/bash "${user}"
# Ports the container is declared to listen on. EXPOSE is documentation only;
# publish them with `docker run -p ...`.
EXPOSE 8888
EXPOSE 7860
EXPOSE 5000

# Drop root for the runtime. Uses the `user` build argument so the account
# selected here always matches the one created by useradd, even when the
# default name is overridden with --build-arg.
USER ${user}

# ENTRYPOINT ["python3.10"]
# Default command: start generate.py with 8-bit loading and the GPT-J 6B base model.
# NOTE(review): in exec form no shell strips the inner single quotes, so
# generate.py receives them literally as part of the argument; confirm its
# argument parser tolerates that.
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "'EleutherAI/gpt-j-6B'"]