From ba70828f4a4f6ed1228e0189f102655587cca576 Mon Sep 17 00:00:00 2001 From: cragwolfe Date: Sun, 27 Aug 2023 18:30:17 -0700 Subject: [PATCH] build(image): bump Dockerfile to python3.10 (#1214) --- CHANGELOG.md | 12 +++++++++++- Dockerfile | 10 +++++----- unstructured/__version__.py | 2 +- 3 files changed, 17 insertions(+), 7 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index c7a64f67b5..d09b9f96ac 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,3 +1,13 @@ +## 0.10.8 + +### Enhancements + +* Release docker image that installs Python 3.10 rather than 3.8 + +### Features + +### Fixes + ## 0.10.7 ### Enhancements @@ -19,7 +29,7 @@ * Add functionality to sort elements using `xy-cut` sorting approach in `partition_pdf` for `hi_res` and `fast` strategies * Bump unstructured-inference * Set OMP_THREAD_LIMIT to 1 if not set for better tesseract perf (0.5.17) - + ### Features * Extract coordinates from PDFs and images when using OCR only strategy and add to metadata diff --git a/Dockerfile b/Dockerfile index dd7da6a003..356bdeaab5 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,5 +1,5 @@ # syntax=docker/dockerfile:experimental -FROM quay.io/unstructured-io/base-images:rocky8.7-3 as base +FROM quay.io/unstructured-io/base-images:rocky8.7-5 as base ARG PIP_VERSION @@ -15,7 +15,7 @@ FROM base as deps # Copy and install Unstructured COPY requirements requirements -RUN python3.8 -m pip install pip==${PIP_VERSION} && \ +RUN python3.10 -m pip install pip==${PIP_VERSION} && \ dnf -y groupinstall "Development Tools" && \ pip install --no-cache -r requirements/base.txt && \ pip install --no-cache -r requirements/test.txt && \ @@ -50,14 +50,14 @@ RUN python3.8 -m pip install pip==${PIP_VERSION} && \ dnf -y groupremove "Development Tools" && \ dnf clean all -RUN python3.8 -c "import nltk; nltk.download('punkt')" && \ - python3.8 -c "import nltk; nltk.download('averaged_perceptron_tagger')" +RUN python3.10 -c "import nltk; nltk.download('punkt')" && \ + python3.10 -c "import nltk; nltk.download('averaged_perceptron_tagger')" FROM deps as code COPY example-docs example-docs COPY unstructured unstructured -RUN python3.8 -c "from unstructured.ingest.doc_processor.generalized import initialize; initialize()" +RUN python3.10 -c "from unstructured.ingest.doc_processor.generalized import initialize; initialize()" CMD ["/bin/bash"] diff --git a/unstructured/__version__.py b/unstructured/__version__.py index 9d249465b8..923fa4143a 100644 --- a/unstructured/__version__.py +++ b/unstructured/__version__.py @@ -1 +1 @@ -__version__ = "0.10.7" # pragma: no cover +__version__ = "0.10.8" # pragma: no cover