Spaces:
Paused
Paused
File size: 858 Bytes
dbd2ac6 8aedb74 dbd2ac6 1ed6ca7 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 |
# Base image: the CUDA "devel" flavour is needed because bitsandbytes requires
# libcudart.so; otherwise the smaller "runtime" flavour would be sufficient.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: visible to RUN steps in this stage (so package installs
# never prompt) but not baked into the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Put /h2ogpt_conda/bin ahead of the system directories. ENV applies both to
# the remaining build steps and to the running container.
ENV PATH="/h2ogpt_conda/bin:${PATH}"

# HOME is the application directory, CUDA_HOME follows the 11.8 toolkit
# version of the base image tag, and VLLM_CACHE lives under the workspace.
ENV HOME=/workspace
ENV CUDA_HOME=/usr/local/cuda-11.8
ENV VLLM_CACHE=/workspace/.vllm_cache
# Every following step, and the container's default working directory, is
# rooted at /workspace.
WORKDIR /workspace

# Bring the whole build context into the image (pair with a .dockerignore to
# keep .git, caches and local secrets out of it).
COPY . /workspace/

# Run the project build script, then open up permissions on /workspace
# (presumably so the unprivileged runtime user can write there).
# Doing the recursive chmod in the same RUN avoids a second layer holding
# another copy of the files the build script wrote under /workspace.
# No `cd` is needed: WORKDIR already makes /workspace the current directory.
RUN chmod +x /workspace/docker_build_script_ubuntu.sh \
    && ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace
# Identity of the unprivileged account; each value can be overridden at build
# time with --build-arg.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000

# Create the group first so it can serve as the account's primary group.
RUN groupadd --gid ${gid} ${group} \
    && useradd --uid ${uid} --gid ${group} --shell /bin/bash ${user}
# Ports the container may listen on. EXPOSE is documentation only; publish
# them with `docker run -p`.
EXPOSE 8888 7860 5000

# Drop root for the running container. The account name comes from the `user`
# build argument declared earlier in this file, so a custom
# `--build-arg user=...` still yields an image whose USER exists.
USER ${user}

# ENTRYPOINT ["python3.10"]
# Default command (exec form, so the Python process receives signals directly).
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]
|