chatbot / Dockerfile
kelvin-t-lu's picture
Update Dockerfile
1ed6ca7
raw
history blame contribute delete
858 Bytes
# Base image: CUDA 11.8 + cuDNN 8 on Ubuntu 20.04.
# The -devel variant is needed for the bitsandbytes requirement of
# libcudart.so; otherwise the -runtime variant would be sufficient.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: suppresses interactive package-manager prompts during RUN
# steps without leaving the setting in the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Runtime environment.
#   PATH       - puts /h2ogpt_conda/bin ahead of the system directories
#   HOME       - per-user files land under /workspace
#   CUDA_HOME  - CUDA toolkit location inside the base image
#   VLLM_CACHE - cache directory kept under /workspace
ENV PATH="/h2ogpt_conda/bin:${PATH}" \
    HOME=/workspace \
    CUDA_HOME=/usr/local/cuda-11.8 \
    VLLM_CACHE=/workspace/.vllm_cache

WORKDIR /workspace

# Bring the whole build context into the image.
COPY . /workspace/

# Run the project's build script from the WORKDIR set above, then make
# /workspace readable, writable and traversable by every user: the container
# later switches to a non-root account whose HOME is /workspace.
# The permission change stays in the same layer as the build so files the
# script creates under /workspace are not stored a second time by a separate
# permission-only layer.
RUN chmod +x ./docker_build_script_ubuntu.sh \
    && ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace
# Identity of the unprivileged account. Each value is a build argument and
# can be overridden with --build-arg at build time.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000

# Create the group first so the new account can take it as its primary
# group; the account gets bash as its login shell.
RUN groupadd --gid ${gid} ${group} \
    && useradd --uid ${uid} --gid ${group} --shell /bin/bash ${user}
# Ports the container is expected to listen on. EXPOSE is documentation
# only; publish them with -p / -P when starting the container.
EXPOSE 5000 7860 8888

# Drop root for the running container. The account name comes from the
# `user` build argument so that overriding it with --build-arg still yields
# an image whose USER actually exists.
USER ${user}

# ENTRYPOINT ["python3.10"]

# Default command (exec form): start generate.py with 8-bit loading enabled
# and h2oai/h2ogpt-4096-llama2-7b-chat as the base model. Arguments given to
# `docker run` after the image name replace this command entirely.
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]