diff --git a/src/paddle_ocr/Dockerfile.cpu b/src/paddle_ocr/Dockerfile.cpu
index f9c6bab..934c537 100644
--- a/src/paddle_ocr/Dockerfile.cpu
+++ b/src/paddle_ocr/Dockerfile.cpu
@@ -34,15 +34,9 @@ ARG REC_MODEL=PP-OCRv5_server_rec
 ENV PADDLE_DET_MODEL=${DET_MODEL}
 ENV PADDLE_REC_MODEL=${REC_MODEL}
 
-# Download models during build (not at runtime)
-RUN python -c "\
-import os; \
-from paddleocr import PaddleOCR; \
-det = os.environ.get('PADDLE_DET_MODEL', 'PP-OCRv5_server_det'); \
-rec = os.environ.get('PADDLE_REC_MODEL', 'PP-OCRv5_server_rec'); \
-print(f'Downloading models: det={det}, rec={rec}'); \
-ocr = PaddleOCR(text_detection_model_name=det, text_recognition_model_name=rec); \
-print('Models downloaded successfully!')"
+# Note: models are not downloaded at build time; they are fetched at first runtime.
+# Expect the first container start to take ~30s longer while the models download.
+# Mount the paddlex-cache volume so the models persist across container restarts.
 
 # Volume for dataset and optional additional model cache
 VOLUME ["/app/dataset", "/root/.paddlex"]
diff --git a/src/paddle_ocr/Dockerfile.gpu b/src/paddle_ocr/Dockerfile.gpu
index 66573e2..9e5f1a6 100644
--- a/src/paddle_ocr/Dockerfile.gpu
+++ b/src/paddle_ocr/Dockerfile.gpu
@@ -77,15 +77,9 @@ ARG REC_MODEL=PP-OCRv5_server_rec
 ENV PADDLE_DET_MODEL=${DET_MODEL}
 ENV PADDLE_REC_MODEL=${REC_MODEL}
 
-# Download models during build (not at runtime)
-RUN python -c "\
-import os; \
-from paddleocr import PaddleOCR; \
-det = os.environ.get('PADDLE_DET_MODEL', 'PP-OCRv5_server_det'); \
-rec = os.environ.get('PADDLE_REC_MODEL', 'PP-OCRv5_server_rec'); \
-print(f'Downloading models: det={det}, rec={rec}'); \
-ocr = PaddleOCR(text_detection_model_name=det, text_recognition_model_name=rec); \
-print('Models downloaded successfully!')"
+# Note: models are fetched at first runtime (the CI runner has no GPU for a build-time download).
+# Expect the first container start to take ~30s longer while the models download.
+# Mount the paddlex-cache volume so the models persist across container restarts.
 
 # Volume for dataset and optional additional model cache
 VOLUME ["/app/dataset", "/root/.paddlex"]