From dd9bae29f3ba14a44f213c0ef19804358542fa7a Mon Sep 17 00:00:00 2001
From: Michele Dolfi
Date: Thu, 13 Feb 2025 13:26:11 +0100
Subject: [PATCH] update example Dockerfile with download CLI

Signed-off-by: Michele Dolfi
---
 Dockerfile | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index c863f1c2..d210b5ad 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -16,8 +16,7 @@ ENV TORCH_HOME=/tmp/
 
 COPY docs/examples/minimal.py /root/minimal.py
 
-RUN python -c 'from deepsearch_glm.utils.load_pretrained_models import load_pretrained_nlp_models; load_pretrained_nlp_models(verbose=True);'
-RUN python -c 'from docling.pipeline.standard_pdf_pipeline import StandardPdfPipeline; StandardPdfPipeline.download_models_hf(force=True);'
+RUN docling-tools models download
 
 # On container environments, always set a thread budget to avoid undesired thread congestion.
 ENV OMP_NUM_THREADS=4
@@ -25,3 +24,6 @@ ENV OMP_NUM_THREADS=4
 # On container shell:
 # > cd /root/
 # > python minimal.py
+
+# Running as `docker run -e DOCLING_ARTIFACTS_PATH=/root/.cache/docling/models` will use the
+# model weights included in the container image.