diff --git a/Makefile b/Makefile index 528b1923d2..0d2f62f28b 100644 --- a/Makefile +++ b/Makefile @@ -103,7 +103,7 @@ install-xlsx: python3 -m pip install -r requirements/extra-xlsx.txt .PHONY: install-all-docs -install-all-docs: install-base install-csv install-docx install-epub install-odt install-pypandoc install-markdown install-msg install-pdf-image install-pptx install-xlsx install-googlevisionocr +install-all-docs: install-base install-csv install-docx install-epub install-odt install-pypandoc install-markdown install-msg install-pdf-image install-pptx install-xlsx .PHONY: install-all-ingest install-all-ingest: @@ -275,10 +275,6 @@ install-pandoc: install-paddleocr: ARCH=${ARCH} ./scripts/install-paddleocr.sh -.PHONY: install-googlevisionocr -install-googlevisionocr: - python3 -m pip install -r requirements/extra-googlevisionocr.txt - ## pip-compile: compiles all base/dev/test requirements .PHONY: pip-compile pip-compile: diff --git a/requirements/extra-googlevisionocr.in b/requirements/extra-googlevisionocr.in deleted file mode 100644 index 6a87053ede..0000000000 --- a/requirements/extra-googlevisionocr.in +++ /dev/null @@ -1,4 +0,0 @@ --c ./deps/constraints.txt --c base.txt - -google-cloud-vision diff --git a/requirements/extra-googlevisionocr.txt b/requirements/extra-googlevisionocr.txt deleted file mode 100644 index 919f4689ae..0000000000 --- a/requirements/extra-googlevisionocr.txt +++ /dev/null @@ -1,68 +0,0 @@ -# -# This file is autogenerated by pip-compile with Python 3.9 -# by the following command: -# -# pip-compile ./extra-googlevisionocr.in -# -cachetools==5.3.3 - # via google-auth -certifi==2024.2.2 - # via - # -c ././deps/constraints.txt - # -c ./base.txt - # requests -charset-normalizer==3.3.2 - # via - # -c ./base.txt - # requests -google-api-core[grpc]==2.18.0 - # via google-cloud-vision -google-auth==2.29.0 - # via - # google-api-core - # google-cloud-vision -google-cloud-vision==3.7.2 - # via -r ./extra-googlevisionocr.in -googleapis-common-protos==1.63.0 - # via - # google-api-core - # grpcio-status -grpcio==1.62.2 - # via - # google-api-core - # grpcio-status -grpcio-status==1.62.2 - # via google-api-core -idna==3.7 - # via - # -c ./base.txt - # requests -proto-plus==1.23.0 - # via - # google-api-core - # google-cloud-vision -protobuf==4.23.4 - # via - # -c ././deps/constraints.txt - # google-api-core - # google-cloud-vision - # googleapis-common-protos - # grpcio-status - # proto-plus -pyasn1==0.6.0 - # via - # pyasn1-modules - # rsa -pyasn1-modules==0.4.0 - # via google-auth -requests==2.31.0 - # via - # -c ./base.txt - # google-api-core -rsa==4.9 - # via google-auth -urllib3==1.26.18 - # via - # -c ././deps/constraints.txt - # -c ./base.txt - # requests diff --git a/requirements/extra-pdf-image.in b/requirements/extra-pdf-image.in index f6e003d1a3..b4e3f3b8ec 100644 --- a/requirements/extra-pdf-image.in +++ b/requirements/extra-pdf-image.in @@ -13,3 +13,4 @@ unstructured-inference==0.7.27 # unstructured fork of pytesseract that provides an interface to allow for multiple output formats # from one tesseract call unstructured.pytesseract>=0.3.12 +google-cloud-vision diff --git a/requirements/extra-pdf-image.txt b/requirements/extra-pdf-image.txt index 2d902f0194..2acc11122a 100644 --- a/requirements/extra-pdf-image.txt +++ b/requirements/extra-pdf-image.txt @@ -6,6 +6,8 @@ # antlr4-python3-runtime==4.9.3 # via omegaconf +cachetools==5.3.3 + # via google-auth certifi==2024.2.2 # via # -c ././deps/constraints.txt @@ -43,6 +45,24 @@ fsspec==2024.3.1 # via # huggingface-hub # torch +google-api-core[grpc]==2.18.0 + # via google-cloud-vision +google-auth==2.29.0 + # via + # google-api-core + # google-cloud-vision +google-cloud-vision==3.7.2 + # via -r ./extra-pdf-image.in +googleapis-common-protos==1.63.0 + # via + # google-api-core + # grpcio-status +grpcio==1.62.2 + # via + # google-api-core + # grpcio-status +grpcio-status==1.62.2 + # via google-api-core huggingface-hub==0.22.2 # via # timm @@ -147,11 +167,26 @@ pillow-heif==0.16.0 # via -r ./extra-pdf-image.in portalocker==2.8.2 # via iopath +proto-plus==1.23.0 + # via + # google-api-core + # google-cloud-vision protobuf==4.23.4 # via # -c ././deps/constraints.txt + # google-api-core + # google-cloud-vision + # googleapis-common-protos + # grpcio-status # onnx # onnxruntime + # proto-plus +pyasn1==0.6.0 + # via + # pyasn1-modules + # rsa +pyasn1-modules==0.4.0 + # via google-auth pycocotools==2.0.7 # via # -c ././deps/constraints.txt @@ -195,8 +230,11 @@ regex==2024.4.16 requests==2.31.0 # via # -c ./base.txt + # google-api-core # huggingface-hub # transformers +rsa==4.9 + # via google-auth safetensors==0.4.3 # via # timm