# Spaces: Paused
# devel needed for bitsandbytes requirement of libcudart.so, otherwise runtime sufficient
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Keep Debian package tooling non-interactive.
ENV DEBIAN_FRONTEND=noninteractive

# Put /h2ogpt_conda/bin first on PATH for both build steps and the running container.
ENV PATH="/h2ogpt_conda/bin:${PATH}"
# NOTE(review): the ENV PATH above already applies to RUN steps, so this ARG looks
# redundant; kept unchanged until that is confirmed.
ARG PATH="/h2ogpt_conda/bin:${PATH}"

ENV HOME=/workspace \
    CUDA_HOME=/usr/local/cuda-11.8 \
    VLLM_CACHE=/workspace/.vllm_cache

WORKDIR /workspace
COPY . /workspace/

# WORKDIR is already /workspace, so no `cd` is needed before invoking the script.
# The recursive chmod runs in the same layer as the build script so files the script
# creates are not duplicated into a second layer just to change their mode bits.
# It grants read/write/execute on the workspace to every user.
# NOTE(review): presumably this lets the container run under an arbitrary --user;
# confirm before tightening the permissions.
RUN chmod +x /workspace/docker_build_script_ubuntu.sh \
    && ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace

# Name and numeric IDs of the unprivileged runtime account; override with --build-arg.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000
RUN groupadd -g "${gid}" "${group}" \
    && useradd -u "${uid}" -g "${group}" -s /bin/bash "${user}"

EXPOSE 8888
EXPOSE 7860
EXPOSE 5000

# Run as the account created above. Referencing the build arg (instead of a literal
# name) keeps this valid when the image is built with a non-default `user`.
USER ${user}

# ENTRYPOINT ["python3.10"]
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]