diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 185012c73..5d483b483 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -2,7 +2,7 @@ name: CI on: push: - branches: [ main ] + branches: [ '**' ] pull_request: branches: [ main ] diff --git a/requirements/base.txt b/requirements/base.txt index 63eb2dd77..4314c3e77 100644 --- a/requirements/base.txt +++ b/requirements/base.txt @@ -8,7 +8,7 @@ annotated-types==0.6.0 # via pydantic antlr4-python3-runtime==4.9.3 # via omegaconf -anyio==4.2.0 +anyio==4.3.0 # via starlette backoff==2.2.1 # via @@ -38,14 +38,14 @@ coloredlogs==15.0.1 # via onnxruntime contourpy==1.2.0 # via matplotlib -cryptography==42.0.2 +cryptography==42.0.5 # via pdfminer-six cycler==0.12.1 # via matplotlib dataclasses-json==0.6.4 - # via unstructured -dataclasses-json-speakeasy==0.5.11 - # via unstructured-client + # via + # unstructured + # unstructured-client deprecated==1.2.14 # via pikepdf effdet==0.4.1 @@ -56,18 +56,19 @@ et-xmlfile==1.1.0 # via openpyxl exceptiongroup==1.2.0 # via anyio -fastapi==0.109.2 +fastapi==0.110.0 # via -r requirements/base.in filelock==3.13.1 # via # huggingface-hub # torch # transformers + # triton filetype==1.2.0 # via unstructured flatbuffers==23.5.26 # via onnxruntime -fonttools==4.48.1 +fonttools==4.49.0 # via matplotlib fsspec==2024.2.0 # via @@ -75,7 +76,7 @@ fsspec==2024.2.0 # torch h11==0.14.0 # via uvicorn -huggingface-hub==0.20.3 +huggingface-hub==0.21.3 # via # timm # tokenizers @@ -112,12 +113,11 @@ markdown==3.5.2 # via unstructured markupsafe==2.1.5 # via jinja2 -marshmallow==3.20.2 +marshmallow==3.21.0 # via # dataclasses-json - # dataclasses-json-speakeasy # unstructured-client -matplotlib==3.8.2 +matplotlib==3.8.3 # via pycocotools mpmath==1.3.0 # via sympy @@ -147,6 +147,37 @@ numpy==1.26.4 # torchvision # transformers # unstructured +nvidia-cublas-cu12==12.1.3.1 + # via + # nvidia-cudnn-cu12 + # nvidia-cusolver-cu12 + # torch +nvidia-cuda-cupti-cu12==12.1.105 + # via torch +nvidia-cuda-nvrtc-cu12==12.1.105 + # via torch +nvidia-cuda-runtime-cu12==12.1.105 + # via torch +nvidia-cudnn-cu12==8.9.2.26 + # via torch +nvidia-cufft-cu12==11.0.2.54 + # via torch +nvidia-curand-cu12==10.3.2.106 + # via torch +nvidia-cusolver-cu12==11.4.5.107 + # via torch +nvidia-cusparse-cu12==12.1.0.106 + # via + # nvidia-cusolver-cu12 + # torch +nvidia-nccl-cu12==2.19.3 + # via torch +nvidia-nvjitlink-cu12==12.3.101 + # via + # nvidia-cusolver-cu12 + # nvidia-cusparse-cu12 +nvidia-nvtx-cu12==12.1.105 + # via torch olefile==0.47 # via msg-parser omegaconf==2.3.0 @@ -174,7 +205,7 @@ packaging==23.2 # transformers # unstructured-client # unstructured-pytesseract -pandas==2.2.0 +pandas==2.2.1 # via # layoutparser # unstructured @@ -186,9 +217,9 @@ pdfminer-six==20221105 # via # pdfplumber # unstructured -pdfplumber==0.10.3 +pdfplumber==0.10.4 # via layoutparser -pikepdf==8.12.0 +pikepdf==8.13.0 # via unstructured pillow==10.2.0 # via @@ -197,13 +228,16 @@ pillow==10.2.0 # pdf2image # pdfplumber # pikepdf + # pillow-heif # pytesseract # python-pptx # torchvision # unstructured-pytesseract +pillow-heif==0.15.0 + # via unstructured portalocker==2.8.2 # via iopath -protobuf==4.25.2 +protobuf==4.25.3 # via # onnx # onnxruntime @@ -215,34 +249,34 @@ pycparser==2.21 # via cffi pycryptodome==3.20.0 # via -r requirements/base.in -pydantic==2.6.1 +pydantic==2.6.3 # via fastapi -pydantic-core==2.16.2 +pydantic-core==2.16.3 # via pydantic -pypandoc==1.12 +pypandoc==1.13 # via unstructured pyparsing==3.1.1 # via matplotlib -pypdf==4.0.1 +pypdf==4.1.0 # via # -r requirements/base.in # unstructured -pypdfium2==4.26.0 +pypdfium2==4.27.0 # via pdfplumber pytesseract==0.3.10 # via layoutparser -python-dateutil==2.8.2 +python-dateutil==2.9.0.post0 # via # matplotlib # pandas # unstructured-client python-docx==1.1.0 # via unstructured -python-iso639==2024.1.2 +python-iso639==2024.2.7 # via unstructured python-magic==0.4.27 # via unstructured -python-multipart==0.0.7 +python-multipart==0.0.9 # via unstructured-inference python-pptx==0.6.23 # via unstructured @@ -269,7 +303,6 @@ requests==2.31.0 # via # -r requirements/base.in # huggingface-hub - # torchvision # transformers # unstructured # unstructured-client @@ -285,7 +318,7 @@ six==1.16.0 # langdetect # python-dateutil # unstructured-client -sniffio==1.3.0 +sniffio==1.3.1 # via anyio soupsieve==2.5 # via beautifulsoup4 @@ -297,22 +330,22 @@ sympy==1.12 # torch tabulate==0.9.0 # via unstructured -timm==0.9.12 +timm==0.9.16 # via effdet -tokenizers==0.15.1 +tokenizers==0.15.2 # via transformers -torch==2.2.0 +torch==2.2.1 # via # effdet # layoutparser # timm # torchvision -torchvision==0.17.0 +torchvision==0.17.1 # via # effdet # layoutparser # timm -tqdm==4.66.1 +tqdm==4.66.2 # via # huggingface-hub # iopath @@ -320,7 +353,9 @@ tqdm==4.66.1 # transformers transformers==4.37.1 # via unstructured-inference -typing-extensions==4.9.0 +triton==2.2.0 + # via torch +typing-extensions==4.10.0 # via # anyio # fastapi @@ -337,23 +372,22 @@ typing-extensions==4.9.0 typing-inspect==0.9.0 # via # dataclasses-json - # dataclasses-json-speakeasy # unstructured-client -tzdata==2023.4 +tzdata==2024.1 # via pandas -unstructured[local-inference]==0.12.3 +unstructured[local-inference]==0.12.5 # via -r requirements/base.in -unstructured-client==0.17.0 +unstructured-client==0.21.0 # via unstructured unstructured-inference==0.7.23 # via unstructured unstructured-pytesseract==0.3.12 # via unstructured -urllib3==2.2.0 +urllib3==2.2.1 # via # requests # unstructured-client -uvicorn==0.27.0.post1 +uvicorn==0.27.1 # via -r requirements/base.in wrapt==1.16.0 # via @@ -361,5 +395,5 @@ wrapt==1.16.0 # unstructured xlrd==2.0.1 # via unstructured -xlsxwriter==3.1.9 +xlsxwriter==3.2.0 # via python-pptx diff --git a/requirements/test.txt b/requirements/test.txt index 72141304e..68318fdcd 100644 --- a/requirements/test.txt +++ b/requirements/test.txt @@ -12,14 +12,12 @@ antlr4-python3-runtime==4.9.3 # via # -r requirements/base.txt # omegaconf -anyio==4.2.0 +anyio==4.3.0 # via # -r requirements/base.txt # httpx # jupyter-server # starlette -appnope==0.1.4 - # via ipykernel argon2-cffi==23.1.0 # via jupyter-server argon2-cffi-bindings==21.2.0 @@ -49,7 +47,7 @@ beautifulsoup4==4.12.3 # -r requirements/base.txt # nbconvert # unstructured -black==24.1.1 +black==24.2.0 # via -r requirements/test.in bleach==6.1.0 # via nbconvert @@ -92,9 +90,9 @@ contourpy==1.2.0 # via # -r requirements/base.txt # matplotlib -coverage[toml]==7.4.1 +coverage[toml]==7.4.3 # via pytest-cov -cryptography==42.0.2 +cryptography==42.0.5 # via # -r requirements/base.txt # pdfminer-six @@ -106,11 +104,8 @@ dataclasses-json==0.6.4 # via # -r requirements/base.txt # unstructured -dataclasses-json-speakeasy==0.5.11 - # via - # -r requirements/base.txt # unstructured-client -debugpy==1.8.0 +debugpy==1.8.1 # via ipykernel decorator==5.1.1 # via ipython @@ -142,7 +137,7 @@ execnb==0.1.5 # via nbdev executing==2.0.1 # via stack-data -fastapi==0.109.2 +fastapi==0.110.0 # via -r requirements/base.txt fastcore==1.5.29 # via @@ -157,6 +152,7 @@ filelock==3.13.1 # huggingface-hub # torch # transformers + # triton filetype==1.2.0 # via # -r requirements/base.txt @@ -167,7 +163,7 @@ flatbuffers==23.5.26 # via # -r requirements/base.txt # onnxruntime -fonttools==4.48.1 +fonttools==4.49.0 # via # -r requirements/base.txt # matplotlib @@ -185,13 +181,13 @@ h11==0.14.0 # -r requirements/base.txt # httpcore # uvicorn -httpcore==1.0.2 +httpcore==1.0.4 # via httpx -httpx==0.26.0 +httpx==0.27.0 # via # -r requirements/test.in # jupyterlab -huggingface-hub==0.20.3 +huggingface-hub==0.21.3 # via # -r requirements/base.txt # timm @@ -216,14 +212,14 @@ iopath==0.1.10 # via # -r requirements/base.txt # layoutparser -ipykernel==6.29.1 +ipykernel==6.29.3 # via # ipywidgets # jupyter # jupyter-console # jupyterlab # qtconsole -ipython==8.21.0 +ipython==8.22.2 # via # execnb # ipykernel @@ -249,7 +245,7 @@ joblib==1.3.2 # via # -r requirements/base.txt # nltk -json5==0.9.14 +json5==0.9.20 # via jupyterlab-server jsonpath-python==1.0.6 # via @@ -288,9 +284,9 @@ jupyter-core==5.7.1 # qtconsole jupyter-events==0.9.0 # via jupyter-server -jupyter-lsp==2.2.2 +jupyter-lsp==2.2.3 # via jupyterlab -jupyter-server==2.12.5 +jupyter-server==2.13.0 # via # jupyter-lsp # jupyterlab @@ -299,15 +295,15 @@ jupyter-server==2.12.5 # notebook-shim jupyter-server-terminals==0.5.2 # via jupyter-server -jupyterlab==4.1.0 +jupyterlab==4.1.2 # via notebook jupyterlab-pygments==0.3.0 # via nbconvert -jupyterlab-server==2.25.2 +jupyterlab-server==2.25.3 # via # jupyterlab # notebook -jupyterlab-widgets==3.0.9 +jupyterlab-widgets==3.0.10 # via ipywidgets kiwisolver==1.4.5 # via @@ -337,13 +333,12 @@ markupsafe==2.1.5 # -r requirements/base.txt # jinja2 # nbconvert -marshmallow==3.20.2 +marshmallow==3.21.0 # via # -r requirements/base.txt # dataclasses-json - # dataclasses-json-speakeasy # unstructured-client -matplotlib==3.8.2 +matplotlib==3.8.3 # via # -r requirements/base.txt # pycocotools @@ -374,7 +369,7 @@ mypy-extensions==1.0.0 # unstructured-client nbclient==0.9.0 # via nbconvert -nbconvert==7.15.0 +nbconvert==7.16.2 # via # jupyter # jupyter-server @@ -396,9 +391,9 @@ nltk==3.8.1 # via # -r requirements/base.txt # unstructured -notebook==7.0.7 +notebook==7.1.1 # via jupyter -notebook-shim==0.2.3 +notebook-shim==0.2.4 # via # jupyterlab # notebook @@ -417,6 +412,58 @@ numpy==1.26.4 # torchvision # transformers # unstructured +nvidia-cublas-cu12==12.1.3.1 + # via + # -r requirements/base.txt + # nvidia-cudnn-cu12 + # nvidia-cusolver-cu12 + # torch +nvidia-cuda-cupti-cu12==12.1.105 + # via + # -r requirements/base.txt + # torch +nvidia-cuda-nvrtc-cu12==12.1.105 + # via + # -r requirements/base.txt + # torch +nvidia-cuda-runtime-cu12==12.1.105 + # via + # -r requirements/base.txt + # torch +nvidia-cudnn-cu12==8.9.2.26 + # via + # -r requirements/base.txt + # torch +nvidia-cufft-cu12==11.0.2.54 + # via + # -r requirements/base.txt + # torch +nvidia-curand-cu12==10.3.2.106 + # via + # -r requirements/base.txt + # torch +nvidia-cusolver-cu12==11.4.5.107 + # via + # -r requirements/base.txt + # torch +nvidia-cusparse-cu12==12.1.0.106 + # via + # -r requirements/base.txt + # nvidia-cusolver-cu12 + # torch +nvidia-nccl-cu12==2.19.3 + # via + # -r requirements/base.txt + # torch +nvidia-nvjitlink-cu12==12.3.101 + # via + # -r requirements/base.txt + # nvidia-cusolver-cu12 + # nvidia-cusparse-cu12 +nvidia-nvtx-cu12==12.1.105 + # via + # -r requirements/base.txt + # torch olefile==0.47 # via # -r requirements/base.txt @@ -468,7 +515,7 @@ packaging==23.2 # transformers # unstructured-client # unstructured-pytesseract -pandas==2.2.0 +pandas==2.2.1 # via # -r requirements/base.txt # layoutparser @@ -489,13 +536,13 @@ pdfminer-six==20221105 # -r requirements/base.txt # pdfplumber # unstructured -pdfplumber==0.10.3 +pdfplumber==0.10.4 # via # -r requirements/base.txt # layoutparser pexpect==4.9.0 # via ipython -pikepdf==8.12.0 +pikepdf==8.13.0 # via # -r requirements/base.txt # unstructured @@ -507,10 +554,15 @@ pillow==10.2.0 # pdf2image # pdfplumber # pikepdf + # pillow-heif # pytesseract # python-pptx # torchvision # unstructured-pytesseract +pillow-heif==0.15.0 + # via + # -r requirements/base.txt + # unstructured platformdirs==4.2.0 # via # black @@ -521,13 +573,13 @@ portalocker==2.8.2 # via # -r requirements/base.txt # iopath -prometheus-client==0.19.0 +prometheus-client==0.20.0 # via jupyter-server prompt-toolkit==3.0.43 # via # ipython # jupyter-console -protobuf==4.25.2 +protobuf==4.25.3 # via # -r requirements/base.txt # onnx @@ -554,11 +606,11 @@ pycparser==2.21 # cffi pycryptodome==3.20.0 # via -r requirements/base.txt -pydantic==2.6.1 +pydantic==2.6.3 # via # -r requirements/base.txt # fastapi -pydantic-core==2.16.2 +pydantic-core==2.16.3 # via # -r requirements/base.txt # pydantic @@ -570,7 +622,7 @@ pygments==2.17.2 # jupyter-console # nbconvert # qtconsole -pypandoc==1.12 +pypandoc==1.13 # via # -r requirements/base.txt # unstructured @@ -578,11 +630,11 @@ pyparsing==3.1.1 # via # -r requirements/base.txt # matplotlib -pypdf==4.0.1 +pypdf==4.1.0 # via # -r requirements/base.txt # unstructured -pypdfium2==4.26.0 +pypdfium2==4.27.0 # via # -r requirements/base.txt # pdfplumber @@ -590,7 +642,7 @@ pytesseract==0.3.10 # via # -r requirements/base.txt # layoutparser -pytest==8.0.0 +pytest==8.0.2 # via # pytest-cov # pytest-mock @@ -598,7 +650,7 @@ pytest-cov==4.1.0 # via -r requirements/test.in pytest-mock==3.12.0 # via -r requirements/test.in -python-dateutil==2.8.2 +python-dateutil==2.9.0.post0 # via # -r requirements/base.txt # arrow @@ -610,7 +662,7 @@ python-docx==1.1.0 # via # -r requirements/base.txt # unstructured -python-iso639==2024.1.2 +python-iso639==2024.2.7 # via # -r requirements/base.txt # unstructured @@ -620,7 +672,7 @@ python-magic==0.4.27 # via # -r requirements/base.txt # unstructured -python-multipart==0.0.7 +python-multipart==0.0.9 # via # -r requirements/base.txt # unstructured-inference @@ -675,7 +727,6 @@ requests==2.31.0 # -r requirements/base.txt # huggingface-hub # jupyterlab-server - # torchvision # transformers # unstructured # unstructured-client @@ -687,7 +738,7 @@ rfc3986-validator==0.1.1 # via # jsonschema # jupyter-events -rpds-py==0.17.1 +rpds-py==0.18.0 # via # jsonschema # referencing @@ -713,7 +764,7 @@ six==1.16.0 # python-dateutil # rfc3339-validator # unstructured-client -sniffio==1.3.0 +sniffio==1.3.1 # via # -r requirements/base.txt # anyio @@ -741,13 +792,13 @@ terminado==0.18.0 # via # jupyter-server # jupyter-server-terminals -timm==0.9.12 +timm==0.9.16 # via # -r requirements/base.txt # effdet tinycss2==1.2.1 # via nbconvert -tokenizers==0.15.1 +tokenizers==0.15.2 # via # -r requirements/base.txt # transformers @@ -758,14 +809,14 @@ tomli==2.0.1 # jupyterlab # mypy # pytest -torch==2.2.0 +torch==2.2.1 # via # -r requirements/base.txt # effdet # layoutparser # timm # torchvision -torchvision==0.17.0 +torchvision==0.17.1 # via # -r requirements/base.txt # effdet @@ -779,7 +830,7 @@ tornado==6.4 # jupyterlab # notebook # terminado -tqdm==4.66.1 +tqdm==4.66.2 # via # -r requirements/base.txt # huggingface-hub @@ -807,9 +858,13 @@ transformers==4.37.1 # via # -r requirements/base.txt # unstructured-inference +triton==2.2.0 + # via + # -r requirements/base.txt + # torch types-python-dateutil==2.8.19.20240106 # via arrow -typing-extensions==4.9.0 +typing-extensions==4.10.0 # via # -r requirements/base.txt # anyio @@ -831,15 +886,14 @@ typing-inspect==0.9.0 # via # -r requirements/base.txt # dataclasses-json - # dataclasses-json-speakeasy # unstructured-client -tzdata==2023.4 +tzdata==2024.1 # via # -r requirements/base.txt # pandas -unstructured[local-inference]==0.12.3 +unstructured[local-inference]==0.12.5 # via -r requirements/base.txt -unstructured-client==0.17.0 +unstructured-client==0.21.0 # via # -r requirements/base.txt # unstructured @@ -853,12 +907,12 @@ unstructured-pytesseract==0.3.12 # unstructured uri-template==1.3.0 # via jsonschema -urllib3==2.2.0 +urllib3==2.2.1 # via # -r requirements/base.txt # requests # unstructured-client -uvicorn==0.27.0.post1 +uvicorn==0.27.1 # via -r requirements/base.txt watchdog==4.0.0 # via nbdev @@ -874,7 +928,7 @@ websocket-client==1.7.0 # via jupyter-server wheel==0.42.0 # via astunparse -widgetsnbextension==4.0.9 +widgetsnbextension==4.0.10 # via ipywidgets wrapt==1.16.0 # via @@ -885,7 +939,7 @@ xlrd==2.0.1 # via # -r requirements/base.txt # unstructured -xlsxwriter==3.1.9 +xlsxwriter==3.2.0 # via # -r requirements/base.txt # python-pptx