Skip to content

Fix pdfminer-six dependencies. #417

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 4 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,3 +1,7 @@
## 0.8.11-dev0

* fix: dependency resolution for `pdfminer-six` on Python 3.9

## 0.8.10

* feat: unpin `numpy` and bump minimum for `onnxruntime` to be compatible with `numpy>=2`
Expand Down
14 changes: 9 additions & 5 deletions Makefile
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
PACKAGE_NAME := unstructured_inference
PIP_VERSION := 23.2.1
PIP_VERSION := 25.0.1
CURRENT_DIR := $(shell pwd)


Expand All @@ -14,7 +14,7 @@ help: Makefile

## install-base: installs core requirements needed for text processing bricks
.PHONY: install-base
install-base: install-base-pip-packages
install-base: install-base-pip-packages requirements/base.in
python3 -m pip install -r requirements/base.txt

## install: installs all test, dev, and experimental requirements
Expand All @@ -29,17 +29,21 @@ install-base-pip-packages:
python3 -m pip install pip==${PIP_VERSION}

.PHONY: install-test
install-test: install-base
install-test: install-base requirements/test.txt
python3 -m pip install -r requirements/test.txt

.PHONY: install-dev
install-dev: install-test
install-dev: install-test requirements/dev.txt
python3 -m pip install -r requirements/dev.txt

## pip-compile: compiles all base/dev/test requirements
.PHONY: pip-compile
pip-compile:
pip-compile \
requirements/base.txt requirements/base-3.10.txt requirements/test.txt \
requirements/dev.txt \
: requirements/base.in requirements/base-3.10.in requirements/test.in requirements/dev.in
pip-compile --upgrade requirements/base.in
pip-compile --upgrade requirements/base-3.10.in -o requirements/base-3.10.txt
pip-compile --upgrade requirements/test.in
pip-compile --upgrade requirements/dev.in

Expand Down
17 changes: 17 additions & 0 deletions requirements/base-3.10.in
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
-c constraints.in
python-multipart
huggingface-hub
numpy
opencv-python!=4.7.0.68
onnx
onnxruntime ; python_version >= '3.10'
matplotlib ; python_version >= '3.10'
torch
timm
# NOTE(alan): Previously pinned (>=4.25.1) because that is when the most recent module we import appeared; now unpinned
transformers
rapidfuzz
pandas
scipy ; python_version >= '3.10'
pypdfium2
pdfminer-six>=20250327
19 changes: 11 additions & 8 deletions requirements/base.in
Original file line number Diff line number Diff line change
@@ -1,17 +1,20 @@
-c constraints.in
python-multipart
huggingface-hub
numpy
numpy==2.0.2
opencv-python!=4.7.0.68
onnx
onnxruntime>=1.18.0
matplotlib
torch
onnxruntime<1.20
matplotlib==3.9.4
contourpy==1.3.0
kiwisolver==1.4.7
torch==2.6.0
networkx==3.2.1
timm
# NOTE(alan): Pinned because this is when the most recent module we import appeared
transformers>=4.25.1
transformers
rapidfuzz
pandas
scipy
scipy==1.13.1
pypdfium2
pdfminer-six
pdfminer-six>=20250327

83 changes: 62 additions & 21 deletions requirements/base.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
#
# This file is autogenerated by pip-compile with Python 3.9
# This file is autogenerated by pip-compile with Python 3.12
# by the following command:
#
# pip-compile requirements/base.in
Expand All @@ -15,25 +15,27 @@ charset-normalizer==3.4.1
coloredlogs==15.0.1
# via onnxruntime
contourpy==1.3.0
# via matplotlib
# via
# -r requirements/base.in
# matplotlib
cryptography==44.0.2
# via pdfminer-six
cycler==0.12.1
# via matplotlib
filelock==3.17.0
filelock==3.18.0
# via
# huggingface-hub
# torch
# transformers
flatbuffers==25.2.10
# via onnxruntime
fonttools==4.56.0
fonttools==4.57.0
# via matplotlib
fsspec==2025.3.0
fsspec==2025.3.2
# via
# huggingface-hub
# torch
huggingface-hub==0.29.3
huggingface-hub==0.30.2
# via
# -r requirements/base.in
# timm
Expand All @@ -43,20 +45,22 @@ humanfriendly==10.0
# via coloredlogs
idna==3.10
# via requests
importlib-resources==6.5.2
# via matplotlib
jinja2==3.1.6
# via torch
kiwisolver==1.4.7
# via matplotlib
# via
# -r requirements/base.in
# matplotlib
markupsafe==3.0.2
# via jinja2
matplotlib==3.9.4
# via -r requirements/base.in
mpmath==1.3.0
# via sympy
networkx==3.2.1
# via torch
# via
# -r requirements/base.in
# torch
numpy==2.0.2
# via
# -r requirements/base.in
Expand All @@ -69,6 +73,40 @@ numpy==2.0.2
# scipy
# torchvision
# transformers
nvidia-cublas-cu12==12.4.5.8
# via
# nvidia-cudnn-cu12
# nvidia-cusolver-cu12
# torch
nvidia-cuda-cupti-cu12==12.4.127
# via torch
nvidia-cuda-nvrtc-cu12==12.4.127
# via torch
nvidia-cuda-runtime-cu12==12.4.127
# via torch
nvidia-cudnn-cu12==9.1.0.70
# via torch
nvidia-cufft-cu12==11.2.1.3
# via torch
nvidia-curand-cu12==10.3.5.147
# via torch
nvidia-cusolver-cu12==11.6.1.9
# via torch
nvidia-cusparse-cu12==12.3.1.170
# via
# nvidia-cusolver-cu12
# torch
nvidia-cusparselt-cu12==0.6.2
# via torch
nvidia-nccl-cu12==2.21.5
# via torch
nvidia-nvjitlink-cu12==12.4.127
# via
# nvidia-cusolver-cu12
# nvidia-cusparse-cu12
# torch
nvidia-nvtx-cu12==12.4.127
# via torch
onnx==1.17.0
# via -r requirements/base.in
onnxruntime==1.19.2
Expand All @@ -83,19 +121,19 @@ packaging==24.2
# transformers
pandas==2.2.3
# via -r requirements/base.in
pdfminer-six==20240706
pdfminer-six==20250327
# via -r requirements/base.in
pillow==11.1.0
# via
# matplotlib
# torchvision
protobuf==6.30.0
protobuf==6.30.2
# via
# onnx
# onnxruntime
pycparser==2.22
# via cffi
pyparsing==3.2.1
pyparsing==3.2.3
# via matplotlib
pypdfium2==4.30.1
# via -r requirements/base.in
Expand All @@ -105,14 +143,14 @@ python-dateutil==2.9.0.post0
# pandas
python-multipart==0.0.20
# via -r requirements/base.in
pytz==2025.1
pytz==2025.2
# via pandas
pyyaml==6.0.2
# via
# huggingface-hub
# timm
# transformers
rapidfuzz==3.12.2
rapidfuzz==3.13.0
# via -r requirements/base.in
regex==2024.11.6
# via transformers
Expand Down Expand Up @@ -147,15 +185,18 @@ tqdm==4.67.1
# via
# huggingface-hub
# transformers
transformers==4.49.0
transformers==4.51.2
# via -r requirements/base.in
typing-extensions==4.12.2
triton==3.2.0
# via torch
typing-extensions==4.13.2
# via
# huggingface-hub
# torch
tzdata==2025.1
tzdata==2025.2
# via pandas
urllib3==2.3.0
urllib3==2.4.0
# via requests
zipp==3.21.0
# via importlib-resources

# The following packages are considered to be unsafe in a requirements file:
# setuptools
3 changes: 2 additions & 1 deletion requirements/dev.in
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
-c base.txt
-c test.txt
jupyter
ipython
ipython<=8.19; python_version <= '3.9'
ipython; python_version >= '3.10'
pip-tools
matplotlib
Loading
Loading