File size: 858 Bytes
dbd2ac6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8aedb74
dbd2ac6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1ed6ca7
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# Base image: NVIDIA CUDA 11.8.0 with cuDNN 8, development variant, on Ubuntu 20.04.
# The -devel variant is required because bitsandbytes needs libcudart.so;
# without that requirement the smaller -runtime variant would be sufficient.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: keep apt/dpkg from prompting during RUN steps.
# Declared as ARG (not ENV) so it is visible to RUN commands while building
# but is not baked into the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Put /h2ogpt_conda/bin ahead of the inherited PATH for both build steps and
# the running container (presumably populated by the build script - confirm).
ENV PATH="/h2ogpt_conda/bin:${PATH}"
# NOTE(review): an ENV always overrides an ARG of the same name, so this ARG
# should have no effect on RUN steps; kept only for backward compatibility.
ARG PATH="/h2ogpt_conda/bin:${PATH}"

# Runtime locations: HOME points at the workspace, CUDA_HOME at the CUDA 11.8
# toolkit path, and VLLM_CACHE at a directory inside the workspace.
ENV HOME=/workspace \
    CUDA_HOME=/usr/local/cuda-11.8 \
    VLLM_CACHE=/workspace/.vllm_cache

# Working directory for the remaining build steps and for the container's
# default command.
WORKDIR /workspace

# Copy the entire build context into the workspace. Anything not excluded by
# .dockerignore ends up in the image, and any change to the context
# invalidates the layers below.
COPY . /workspace/

# Make the build script executable, run it, then grant read/write/execute on
# the whole workspace to all users. WORKDIR is already /workspace, so no `cd`
# is needed. The permission change is done in the same RUN as the build so the
# files the script creates are not stored a second time in an extra layer.
# NOTE(review): a+rwx on the whole tree is very permissive; presumably it lets
# the non-root runtime user write under /workspace - confirm before tightening.
RUN chmod +x /workspace/docker_build_script_ubuntu.sh \
    && ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace

# Name and numeric IDs of the unprivileged account; each can be overridden
# at build time with --build-arg.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000

# Create the group first, then a user whose primary group is that group and
# whose login shell is bash. No home directory is created here.
RUN groupadd --gid ${gid} ${group} \
    && useradd \
        --uid ${uid} \
        --gid ${group} \
        --shell /bin/bash \
        ${user}

# Ports the image declares as listening ports. EXPOSE is metadata only;
# publish them at run time with -p/--publish.
EXPOSE 8888 7860 5000

# Drop root for the running container. Use the `user` build argument rather
# than a hard-coded name so that overriding it with --build-arg still selects
# the account that was actually created.
USER ${user}

# No ENTRYPOINT is set (the line below is intentionally left disabled), so the
# whole command can be replaced by passing arguments to `docker run`.
# ENTRYPOINT ["python3.10"]

# Default command, in exec form (no shell is involved): run generate.py from
# the working directory with python3.10, passing --load_8bit True and the
# h2oai/h2ogpt-4096-llama2-7b-chat base model.
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]