Updated Dockefile to use cache (#2703)
Browse files### What problem does this PR solve?
Updated Dockefile to use cache
### Type of change
- [ ] Bug Fix (non-breaking change which fixes an issue)
- [ ] New Feature (non-breaking change which adds functionality)
- [ ] Documentation Update
- [ ] Refactoring
- [ ] Performance Improvement
- [x] Other (please describe): CI
- .github/workflows/tests.yml +1 -1
- Dockerfile +21 -14
- Dockerfile.slim +21 -14
- README.md +2 -2
- README_ja.md +2 -2
- README_ko.md +2 -2
- README_zh.md +2 -2
- docs/guides/develop/build_docker_image.md +2 -2
- download_deps.py +7 -2
.github/workflows/tests.yml
CHANGED
@@ -48,7 +48,7 @@ jobs:
|
|
48 |
- name: Build ragflow:dev-slim
|
49 |
run: |
|
50 |
RUNNER_WORKSPACE_PREFIX=${RUNNER_WORKSPACE_PREFIX:-$HOME}
|
51 |
-
cp -r ${RUNNER_WORKSPACE_PREFIX}/huggingface.co .
|
52 |
sudo docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
53 |
|
54 |
- name: Build ragflow:dev
|
|
|
48 |
- name: Build ragflow:dev-slim
|
49 |
run: |
|
50 |
RUNNER_WORKSPACE_PREFIX=${RUNNER_WORKSPACE_PREFIX:-$HOME}
|
51 |
+
cp -r ${RUNNER_WORKSPACE_PREFIX}/huggingface.co ${RUNNER_WORKSPACE_PREFIX}/nltk_data .
|
52 |
sudo docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
53 |
|
54 |
- name: Build ragflow:dev
|
Dockerfile
CHANGED
@@ -6,13 +6,18 @@ ENV LIGHTEN=0
|
|
6 |
|
7 |
WORKDIR /ragflow
|
8 |
|
9 |
-
RUN
|
|
|
|
|
|
|
|
|
10 |
|
11 |
# if you located in China, you can use tsinghua mirror to speed up apt
|
12 |
RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
|
13 |
|
14 |
-
RUN apt
|
15 |
-
&& apt
|
|
|
16 |
|
17 |
RUN curl -o libssl1.deb http://archive.ubuntu.com/ubuntu/pool/main/o/openssl1.0/libssl1.0.0_1.0.2n-1ubuntu5_amd64.deb && dpkg -i libssl1.deb && rm -f libssl1.deb
|
18 |
|
@@ -22,7 +27,6 @@ ENV PYTHONDONTWRITEBYTECODE=1 DOTNET_SYSTEM_GLOBALIZATION_INVARIANT=1
|
|
22 |
ENV POETRY_NO_INTERACTION=1
|
23 |
ENV POETRY_VIRTUALENVS_IN_PROJECT=true
|
24 |
ENV POETRY_VIRTUALENVS_CREATE=true
|
25 |
-
ENV POETRY_KEYRING_ENABLED=false
|
26 |
ENV POETRY_REQUESTS_TIMEOUT=15
|
27 |
|
28 |
# builder stage
|
@@ -31,16 +35,18 @@ USER root
|
|
31 |
|
32 |
WORKDIR /ragflow
|
33 |
|
34 |
-
RUN apt
|
35 |
-
|
|
|
36 |
|
37 |
COPY web web
|
38 |
-
RUN
|
|
|
39 |
|
40 |
# install dependencies from poetry.lock file
|
41 |
COPY pyproject.toml poetry.toml poetry.lock ./
|
42 |
|
43 |
-
RUN --mount=type=cache,target=/root/.cache/pypoetry,sharing=locked \
|
44 |
if [ "$LIGHTEN" -eq 0 ]; then \
|
45 |
poetry install --sync --no-cache --no-root --with=full; \
|
46 |
else \
|
@@ -55,8 +61,9 @@ WORKDIR /ragflow
|
|
55 |
|
56 |
# Install python packages' dependencies
|
57 |
# cv2 requires libGL.so.1
|
58 |
-
RUN apt
|
59 |
-
|
|
|
60 |
|
61 |
COPY web web
|
62 |
COPY api api
|
@@ -82,16 +89,16 @@ RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \
|
|
82 |
/huggingface.co/maidalun1020/bce-reranker-base_v1 \
|
83 |
| tar -xf - --strip-components=2 -C /root/.ragflow
|
84 |
|
|
|
|
|
|
|
85 |
# Copy compiled web pages
|
86 |
COPY --from=builder /ragflow/web/dist /ragflow/web/dist
|
87 |
|
88 |
# Copy Python environment and packages
|
89 |
ENV VIRTUAL_ENV=/ragflow/.venv
|
90 |
COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
|
91 |
-
ENV PATH="${VIRTUAL_ENV}/bin
|
92 |
-
|
93 |
-
# Download nltk data
|
94 |
-
RUN python3 -m nltk.downloader wordnet punkt punkt_tab
|
95 |
|
96 |
ENV PYTHONPATH=/ragflow/
|
97 |
|
|
|
6 |
|
7 |
WORKDIR /ragflow
|
8 |
|
9 |
+
RUN rm -f /etc/apt/apt.conf.d/docker-clean \
|
10 |
+
&& echo 'Binary::apt::APT::Keep-Downloaded-Packages "true";' > /etc/apt/apt.conf.d/keep-cache
|
11 |
+
|
12 |
+
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
|
13 |
+
apt update && apt-get --no-install-recommends install -y ca-certificates
|
14 |
|
15 |
# if you located in China, you can use tsinghua mirror to speed up apt
|
16 |
RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
|
17 |
|
18 |
+
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
|
19 |
+
apt update && apt install -y curl libpython3-dev nginx libglib2.0-0 libglx-mesa0 pkg-config libicu-dev libgdiplus python3-poetry \
|
20 |
+
&& rm -rf /var/lib/apt/lists/*
|
21 |
|
22 |
RUN curl -o libssl1.deb http://archive.ubuntu.com/ubuntu/pool/main/o/openssl1.0/libssl1.0.0_1.0.2n-1ubuntu5_amd64.deb && dpkg -i libssl1.deb && rm -f libssl1.deb
|
23 |
|
|
|
27 |
ENV POETRY_NO_INTERACTION=1
|
28 |
ENV POETRY_VIRTUALENVS_IN_PROJECT=true
|
29 |
ENV POETRY_VIRTUALENVS_CREATE=true
|
|
|
30 |
ENV POETRY_REQUESTS_TIMEOUT=15
|
31 |
|
32 |
# builder stage
|
|
|
35 |
|
36 |
WORKDIR /ragflow
|
37 |
|
38 |
+
RUN --mount=type=cache,id=ragflow_builder_apt,target=/var/cache/apt,sharing=locked \
|
39 |
+
apt update && apt install -y nodejs npm cargo && \
|
40 |
+
rm -rf /var/lib/apt/lists/*
|
41 |
|
42 |
COPY web web
|
43 |
+
RUN --mount=type=cache,id=ragflow_builder_npm,target=/root/.npm,sharing=locked \
|
44 |
+
cd web && npm i --force && npm run build
|
45 |
|
46 |
# install dependencies from poetry.lock file
|
47 |
COPY pyproject.toml poetry.toml poetry.lock ./
|
48 |
|
49 |
+
RUN --mount=type=cache,id=ragflow_builder_poetry,target=/root/.cache/pypoetry,sharing=locked \
|
50 |
if [ "$LIGHTEN" -eq 0 ]; then \
|
51 |
poetry install --sync --no-cache --no-root --with=full; \
|
52 |
else \
|
|
|
61 |
|
62 |
# Install python packages' dependencies
|
63 |
# cv2 requires libGL.so.1
|
64 |
+
RUN --mount=type=cache,id=ragflow_production_apt,target=/var/cache/apt,sharing=locked \
|
65 |
+
apt update && apt install -y --no-install-recommends nginx libgl1 vim less && \
|
66 |
+
rm -rf /var/lib/apt/lists/*
|
67 |
|
68 |
COPY web web
|
69 |
COPY api api
|
|
|
89 |
/huggingface.co/maidalun1020/bce-reranker-base_v1 \
|
90 |
| tar -xf - --strip-components=2 -C /root/.ragflow
|
91 |
|
92 |
+
# Copy nltk data downloaded via download_deps.py
|
93 |
+
COPY nltk_data /root/nltk_data
|
94 |
+
|
95 |
# Copy compiled web pages
|
96 |
COPY --from=builder /ragflow/web/dist /ragflow/web/dist
|
97 |
|
98 |
# Copy Python environment and packages
|
99 |
ENV VIRTUAL_ENV=/ragflow/.venv
|
100 |
COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
|
101 |
+
ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"
|
|
|
|
|
|
|
102 |
|
103 |
ENV PYTHONPATH=/ragflow/
|
104 |
|
Dockerfile.slim
CHANGED
@@ -6,13 +6,18 @@ ENV LIGHTEN=1
|
|
6 |
|
7 |
WORKDIR /ragflow
|
8 |
|
9 |
-
RUN
|
|
|
|
|
|
|
|
|
10 |
|
11 |
# if you located in China, you can use tsinghua mirror to speed up apt
|
12 |
RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
|
13 |
|
14 |
-
RUN apt
|
15 |
-
&& apt
|
|
|
16 |
|
17 |
RUN curl -o libssl1.deb http://archive.ubuntu.com/ubuntu/pool/main/o/openssl1.0/libssl1.0.0_1.0.2n-1ubuntu5_amd64.deb && dpkg -i libssl1.deb && rm -f libssl1.deb
|
18 |
|
@@ -22,7 +27,6 @@ ENV PYTHONDONTWRITEBYTECODE=1 DOTNET_SYSTEM_GLOBALIZATION_INVARIANT=1
|
|
22 |
ENV POETRY_NO_INTERACTION=1
|
23 |
ENV POETRY_VIRTUALENVS_IN_PROJECT=true
|
24 |
ENV POETRY_VIRTUALENVS_CREATE=true
|
25 |
-
ENV POETRY_KEYRING_ENABLED=false
|
26 |
ENV POETRY_REQUESTS_TIMEOUT=15
|
27 |
|
28 |
# builder stage
|
@@ -31,16 +35,18 @@ USER root
|
|
31 |
|
32 |
WORKDIR /ragflow
|
33 |
|
34 |
-
RUN apt
|
35 |
-
|
|
|
36 |
|
37 |
COPY web web
|
38 |
-
RUN
|
|
|
39 |
|
40 |
# install dependencies from poetry.lock file
|
41 |
COPY pyproject.toml poetry.toml poetry.lock ./
|
42 |
|
43 |
-
RUN --mount=type=cache,target=/root/.cache/pypoetry,sharing=locked \
|
44 |
if [ "$LIGHTEN" -eq 0 ]; then \
|
45 |
poetry install --sync --no-cache --no-root --with=full; \
|
46 |
else \
|
@@ -55,8 +61,9 @@ WORKDIR /ragflow
|
|
55 |
|
56 |
# Install python packages' dependencies
|
57 |
# cv2 requires libGL.so.1
|
58 |
-
RUN apt
|
59 |
-
|
|
|
60 |
|
61 |
COPY web web
|
62 |
COPY api api
|
@@ -75,16 +82,16 @@ RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \
|
|
75 |
/huggingface.co/InfiniFlow/deepdoc \
|
76 |
| tar -xf - --strip-components=3 -C /ragflow/rag/res/deepdoc
|
77 |
|
|
|
|
|
|
|
78 |
# Copy compiled web pages
|
79 |
COPY --from=builder /ragflow/web/dist /ragflow/web/dist
|
80 |
|
81 |
# Copy Python environment and packages
|
82 |
ENV VIRTUAL_ENV=/ragflow/.venv
|
83 |
COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
|
84 |
-
ENV PATH="${VIRTUAL_ENV}/bin
|
85 |
-
|
86 |
-
# Download nltk data
|
87 |
-
RUN python3 -m nltk.downloader wordnet punkt punkt_tab
|
88 |
|
89 |
ENV PYTHONPATH=/ragflow/
|
90 |
|
|
|
6 |
|
7 |
WORKDIR /ragflow
|
8 |
|
9 |
+
RUN rm -f /etc/apt/apt.conf.d/docker-clean \
|
10 |
+
&& echo 'Binary::apt::APT::Keep-Downloaded-Packages "true";' > /etc/apt/apt.conf.d/keep-cache
|
11 |
+
|
12 |
+
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
|
13 |
+
apt update && apt-get --no-install-recommends install -y ca-certificates
|
14 |
|
15 |
# if you located in China, you can use tsinghua mirror to speed up apt
|
16 |
RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
|
17 |
|
18 |
+
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
|
19 |
+
apt update && apt install -y curl libpython3-dev nginx libglib2.0-0 libglx-mesa0 pkg-config libicu-dev libgdiplus python3-poetry \
|
20 |
+
&& rm -rf /var/lib/apt/lists/*
|
21 |
|
22 |
RUN curl -o libssl1.deb http://archive.ubuntu.com/ubuntu/pool/main/o/openssl1.0/libssl1.0.0_1.0.2n-1ubuntu5_amd64.deb && dpkg -i libssl1.deb && rm -f libssl1.deb
|
23 |
|
|
|
27 |
ENV POETRY_NO_INTERACTION=1
|
28 |
ENV POETRY_VIRTUALENVS_IN_PROJECT=true
|
29 |
ENV POETRY_VIRTUALENVS_CREATE=true
|
|
|
30 |
ENV POETRY_REQUESTS_TIMEOUT=15
|
31 |
|
32 |
# builder stage
|
|
|
35 |
|
36 |
WORKDIR /ragflow
|
37 |
|
38 |
+
RUN --mount=type=cache,id=ragflow_builder_apt,target=/var/cache/apt,sharing=locked \
|
39 |
+
apt update && apt install -y nodejs npm cargo && \
|
40 |
+
rm -rf /var/lib/apt/lists/*
|
41 |
|
42 |
COPY web web
|
43 |
+
RUN --mount=type=cache,id=ragflow_builder_npm,target=/root/.npm,sharing=locked \
|
44 |
+
cd web && npm i --force && npm run build
|
45 |
|
46 |
# install dependencies from poetry.lock file
|
47 |
COPY pyproject.toml poetry.toml poetry.lock ./
|
48 |
|
49 |
+
RUN --mount=type=cache,id=ragflow_builder_poetry,target=/root/.cache/pypoetry,sharing=locked \
|
50 |
if [ "$LIGHTEN" -eq 0 ]; then \
|
51 |
poetry install --sync --no-cache --no-root --with=full; \
|
52 |
else \
|
|
|
61 |
|
62 |
# Install python packages' dependencies
|
63 |
# cv2 requires libGL.so.1
|
64 |
+
RUN --mount=type=cache,id=ragflow_production_apt,target=/var/cache/apt,sharing=locked \
|
65 |
+
apt update && apt install -y --no-install-recommends nginx libgl1 vim less && \
|
66 |
+
rm -rf /var/lib/apt/lists/*
|
67 |
|
68 |
COPY web web
|
69 |
COPY api api
|
|
|
82 |
/huggingface.co/InfiniFlow/deepdoc \
|
83 |
| tar -xf - --strip-components=3 -C /ragflow/rag/res/deepdoc
|
84 |
|
85 |
+
# Copy nltk data downloaded via download_deps.py
|
86 |
+
COPY nltk_data /root/nltk_data
|
87 |
+
|
88 |
# Copy compiled web pages
|
89 |
COPY --from=builder /ragflow/web/dist /ragflow/web/dist
|
90 |
|
91 |
# Copy Python environment and packages
|
92 |
ENV VIRTUAL_ENV=/ragflow/.venv
|
93 |
COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
|
94 |
+
ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"
|
|
|
|
|
|
|
95 |
|
96 |
ENV PYTHONPATH=/ragflow/
|
97 |
|
README.md
CHANGED
@@ -220,7 +220,7 @@ This image is approximately 1 GB in size and relies on external LLM and embeddin
|
|
220 |
```bash
|
221 |
git clone https://github.com/infiniflow/ragflow.git
|
222 |
cd ragflow/
|
223 |
-
pip3 install huggingface-hub
|
224 |
python3 download_deps.py
|
225 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
226 |
```
|
@@ -232,7 +232,7 @@ This image is approximately 9 GB in size. As it includes embedding models, it re
|
|
232 |
```bash
|
233 |
git clone https://github.com/infiniflow/ragflow.git
|
234 |
cd ragflow/
|
235 |
-
pip3 install huggingface-hub
|
236 |
python3 download_deps.py
|
237 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
238 |
```
|
|
|
220 |
```bash
|
221 |
git clone https://github.com/infiniflow/ragflow.git
|
222 |
cd ragflow/
|
223 |
+
pip3 install huggingface-hub nltk
|
224 |
python3 download_deps.py
|
225 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
226 |
```
|
|
|
232 |
```bash
|
233 |
git clone https://github.com/infiniflow/ragflow.git
|
234 |
cd ragflow/
|
235 |
+
pip3 install huggingface-hub nltk
|
236 |
python3 download_deps.py
|
237 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
238 |
```
|
README_ja.md
CHANGED
@@ -202,7 +202,7 @@
|
|
202 |
```bash
|
203 |
git clone https://github.com/infiniflow/ragflow.git
|
204 |
cd ragflow/
|
205 |
-
pip3 install huggingface-hub
|
206 |
python3 download_deps.py
|
207 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
208 |
```
|
@@ -214,7 +214,7 @@ docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
|
214 |
```bash
|
215 |
git clone https://github.com/infiniflow/ragflow.git
|
216 |
cd ragflow/
|
217 |
-
pip3 install huggingface-hub
|
218 |
python3 download_deps.py
|
219 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
220 |
```
|
|
|
202 |
```bash
|
203 |
git clone https://github.com/infiniflow/ragflow.git
|
204 |
cd ragflow/
|
205 |
+
pip3 install huggingface-hub nltk
|
206 |
python3 download_deps.py
|
207 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
208 |
```
|
|
|
214 |
```bash
|
215 |
git clone https://github.com/infiniflow/ragflow.git
|
216 |
cd ragflow/
|
217 |
+
pip3 install huggingface-hub nltk
|
218 |
python3 download_deps.py
|
219 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
220 |
```
|
README_ko.md
CHANGED
@@ -204,7 +204,7 @@
|
|
204 |
```bash
|
205 |
git clone https://github.com/infiniflow/ragflow.git
|
206 |
cd ragflow/
|
207 |
-
pip3 install huggingface-hub
|
208 |
python3 download_deps.py
|
209 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
210 |
```
|
@@ -216,7 +216,7 @@ docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
|
216 |
```bash
|
217 |
git clone https://github.com/infiniflow/ragflow.git
|
218 |
cd ragflow/
|
219 |
-
pip3 install huggingface-hub
|
220 |
python3 download_deps.py
|
221 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
222 |
```
|
|
|
204 |
```bash
|
205 |
git clone https://github.com/infiniflow/ragflow.git
|
206 |
cd ragflow/
|
207 |
+
pip3 install huggingface-hub nltk
|
208 |
python3 download_deps.py
|
209 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
210 |
```
|
|
|
216 |
```bash
|
217 |
git clone https://github.com/infiniflow/ragflow.git
|
218 |
cd ragflow/
|
219 |
+
pip3 install huggingface-hub nltk
|
220 |
python3 download_deps.py
|
221 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
222 |
```
|
README_zh.md
CHANGED
@@ -204,7 +204,7 @@
|
|
204 |
```bash
|
205 |
git clone https://github.com/infiniflow/ragflow.git
|
206 |
cd ragflow/
|
207 |
-
pip3 install huggingface-hub
|
208 |
python3 download_deps.py
|
209 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
210 |
```
|
@@ -216,7 +216,7 @@ docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
|
216 |
```bash
|
217 |
git clone https://github.com/infiniflow/ragflow.git
|
218 |
cd ragflow/
|
219 |
-
pip3 install huggingface-hub
|
220 |
python3 download_deps.py
|
221 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
222 |
```
|
|
|
204 |
```bash
|
205 |
git clone https://github.com/infiniflow/ragflow.git
|
206 |
cd ragflow/
|
207 |
+
pip3 install huggingface-hub nltk
|
208 |
python3 download_deps.py
|
209 |
docker build -f Dockerfile.slim -t infiniflow/ragflow:dev-slim .
|
210 |
```
|
|
|
216 |
```bash
|
217 |
git clone https://github.com/infiniflow/ragflow.git
|
218 |
cd ragflow/
|
219 |
+
pip3 install huggingface-hub nltk
|
220 |
python3 download_deps.py
|
221 |
docker build -f Dockerfile -t infiniflow/ragflow:dev .
|
222 |
```
|
docs/guides/develop/build_docker_image.md
CHANGED
@@ -64,7 +64,7 @@ This image is approximately 1 GB in size and relies on external LLM services, as
|
|
64 |
|
65 |
On a `linux/amd64` host:
|
66 |
```bash
|
67 |
-
pip3 install huggingface-hub
|
68 |
python3 download_deps.py
|
69 |
docker build -f Dockerfile -t infiniflow/ragflow:dev-amd64 .
|
70 |
docker push infiniflow/ragflow:dev-amd64
|
@@ -72,7 +72,7 @@ docker push infiniflow/ragflow:dev-amd64
|
|
72 |
|
73 |
On a `linux/arm64` host:
|
74 |
```bash
|
75 |
-
pip3 install huggingface-hub
|
76 |
python3 download_deps.py
|
77 |
docker build -f Dockerfile -t infiniflow/ragflow:dev-arm64 .
|
78 |
docker push infiniflow/ragflow:dev-arm64
|
|
|
64 |
|
65 |
On a `linux/amd64` host:
|
66 |
```bash
|
67 |
+
pip3 install huggingface-hub nltk
|
68 |
python3 download_deps.py
|
69 |
docker build -f Dockerfile -t infiniflow/ragflow:dev-amd64 .
|
70 |
docker push infiniflow/ragflow:dev-amd64
|
|
|
72 |
|
73 |
On a `linux/arm64` host:
|
74 |
```bash
|
75 |
+
pip3 install huggingface-hub nltk
|
76 |
python3 download_deps.py
|
77 |
docker build -f Dockerfile -t infiniflow/ragflow:dev-arm64 .
|
78 |
docker push infiniflow/ragflow:dev-arm64
|
download_deps.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
#!/usr/bin/env python3
|
2 |
|
3 |
from huggingface_hub import snapshot_download
|
|
|
4 |
import os
|
5 |
|
6 |
repos = [
|
@@ -12,13 +13,17 @@ repos = [
|
|
12 |
"maidalun1020/bce-reranker-base_v1",
|
13 |
]
|
14 |
|
15 |
-
|
16 |
def download_model(repo_id):
|
17 |
-
local_dir = os.path.join("huggingface.co", repo_id)
|
18 |
os.makedirs(local_dir, exist_ok=True)
|
19 |
snapshot_download(repo_id=repo_id, local_dir=local_dir)
|
20 |
|
21 |
|
22 |
if __name__ == "__main__":
|
|
|
|
|
|
|
|
|
23 |
for repo_id in repos:
|
|
|
24 |
download_model(repo_id)
|
|
|
1 |
#!/usr/bin/env python3
|
2 |
|
3 |
from huggingface_hub import snapshot_download
|
4 |
+
import nltk
|
5 |
import os
|
6 |
|
7 |
repos = [
|
|
|
13 |
"maidalun1020/bce-reranker-base_v1",
|
14 |
]
|
15 |
|
|
|
16 |
def download_model(repo_id):
|
17 |
+
local_dir = os.path.abspath(os.path.join("huggingface.co", repo_id))
|
18 |
os.makedirs(local_dir, exist_ok=True)
|
19 |
snapshot_download(repo_id=repo_id, local_dir=local_dir)
|
20 |
|
21 |
|
22 |
if __name__ == "__main__":
|
23 |
+
local_dir = os.path.abspath('nltk_data')
|
24 |
+
for data in ['wordnet', 'punkt', 'wordnet']:
|
25 |
+
print(f"Downloading nltk {data}...")
|
26 |
+
nltk.download(data, download_dir=local_dir)
|
27 |
for repo_id in repos:
|
28 |
+
print(f"Downloading huggingface repo {repo_id}...")
|
29 |
download_model(repo_id)
|