diff --git a/comps/third_parties/pathway/src/requirements-cpu.txt b/comps/third_parties/pathway/src/requirements-cpu.txt index f6bd103a47..806aef910f 100644 --- a/comps/third_parties/pathway/src/requirements-cpu.txt +++ b/comps/third_parties/pathway/src/requirements-cpu.txt @@ -1,15 +1,15 @@ # This file was autogenerated by uv via the following command: # uv pip compile --python=/usr/local/bin/python3.11 --index-strategy unsafe-best-match ./comps/third_parties/pathway/src/requirements.in --universal -o ./comps/third_parties/pathway/src/requirements-cpu.txt -accelerate==1.10.1 +accelerate==1.12.0 # via # docling # docling-ibm-models # unstructured-inference -aiofiles==24.1.0 +aiofiles==25.1.0 # via unstructured-client aiohappyeyeballs==2.6.1 # via aiohttp -aiohttp==3.13.0 +aiohttp==3.13.2 # via # aiohttp-cors # instructor @@ -21,13 +21,13 @@ aiohttp-cors==0.8.1 # via pathway aiosignal==1.4.0 # via aiohttp -aiosqlite==0.21.0 +aiosqlite==0.22.1 # via llama-index-core annotated-types==0.7.0 # via pydantic antlr4-python3-runtime==4.9.3 # via omegaconf -anyio==4.11.0 +anyio==4.12.0 # via # httpx # mcp @@ -36,7 +36,7 @@ anyio==4.11.0 # starlette appdirs==1.4.4 # via fs -asttokens==3.0.0 +asttokens==3.0.1 # via stack-data async-lru==2.0.5 # via pathway @@ -47,7 +47,7 @@ attrs==25.4.0 # jsonlines # jsonschema # referencing -authlib==1.6.5 +authlib==1.6.6 # via fastmcp backoff==2.2.1 # via unstructured @@ -55,25 +55,25 @@ banks==2.2.0 # via llama-index-core beartype==0.15.0 # via pathway -beautifulsoup4==4.14.2 +beautifulsoup4==4.14.3 # via # docling # unstructured -bleach==6.2.0 +bleach==6.3.0 # via panel -bokeh==3.8.0 +bokeh==3.8.1 # via # jupyter-bokeh # panel -boto3==1.40.48 +boto3==1.42.18 # via pathway -botocore==1.40.48 +botocore==1.42.18 # via # boto3 # s3transfer -cachetools==6.2.0 +cachetools==6.2.4 # via google-auth -certifi==2025.10.5 +certifi==2025.11.12 # via # docling # httpcore @@ -81,44 +81,51 @@ certifi==2025.10.5 # requests cffi==2.0.0 ; platform_python_implementation != 'PyPy' # via cryptography -charset-normalizer==3.4.3 +cfgv==3.5.0 + # via pre-commit +charset-normalizer==3.4.4 # via # pdfminer-six # requests # unstructured -click==8.3.0 +click==8.3.1 # via # litellm # nltk + # ocrmac # pathway # python-oxmsg # typer # uvicorn -cohere==5.18.0 +cohere==5.20.1 # via pathway colorama==0.4.6 # via # click + # colorlog # griffe # ipython # tqdm coloredlogs==15.0.1 # via onnxruntime +colorlog==6.10.1 + # via rapidocr comm==0.2.3 # via ipywidgets contourpy==1.3.3 # via # bokeh # matplotlib -cryptography==46.0.2 +cryptography==46.0.3 # via # authlib # msoffcrypto-tool # pdfminer-six + # pyjwt # unstructured-client cycler==0.12.1 # via matplotlib -cyclopts==3.24.0 +cyclopts==4.4.3 # via fastmcp dataclasses-json==0.6.7 # via @@ -129,7 +136,7 @@ decorator==5.2.1 # via ipython deltalake==0.17.4 # via pathway -deprecated==1.2.18 +deprecated==1.3.1 # via # banks # llama-index-core @@ -143,29 +150,29 @@ diskcache==5.6.3 # via # instructor # pathway +distlib==0.4.0 + # via virtualenv distro==1.9.0 # via openai dnspython==2.8.0 # via email-validator -docling==2.55.1 +docling==2.66.0 # via -r ./comps/third_parties/pathway/src/requirements.in -docling-core==2.48.4 +docling-core==2.57.0 # via # docling # docling-ibm-models # docling-parse -docling-ibm-models==3.9.1 +docling-ibm-models==3.10.3 # via docling -docling-parse==4.5.0 +docling-parse==4.7.2 # via docling docstring-parser==0.17.0 # via # cyclopts # instructor -docutils==0.22.2 +docutils==0.22.4 # via rich-rst -easyocr==1.7.2 - # via docling effdet==0.4.1 # via unstructured email-validator==2.3.0 @@ -174,30 +181,31 @@ emoji==2.15.0 # via unstructured et-xmlfile==2.0.0 # via openpyxl -exceptiongroup==1.3.0 +exceptiongroup==1.3.1 # via fastmcp executing==2.2.1 # via stack-data -faker==37.11.0 +faker==40.1.0 # via polyfactory -fastavro==1.12.0 +fastavro==1.12.1 # via cohere fastmcp==2.12.4 # via pathway -fastuuid==0.13.5 +fastuuid==0.14.0 # via litellm -filelock==3.20.0 +filelock==3.20.1 # via # huggingface-hub # transformers + # virtualenv filetype==1.2.0 # via # docling # llama-index-core # unstructured -flatbuffers==25.9.23 +flatbuffers==25.12.19 # via onnxruntime -fonttools==4.60.1 +fonttools==4.61.1 # via matplotlib frozenlist==1.8.0 # via @@ -205,7 +213,7 @@ frozenlist==1.8.0 # aiosignal fs==2.4.16 # via pathway -fsspec==2025.9.0 +fsspec==2025.12.0 # via # huggingface-hub # llama-index-core @@ -229,11 +237,11 @@ google-api-core==2.24.2 # google-cloud-vision # google-generativeai # pathway -google-api-python-client==2.184.0 +google-api-python-client==2.187.0 # via # google-generativeai # pathway -google-auth==2.41.1 +google-auth==2.45.0 # via # google-ai-generativelanguage # google-api-core @@ -244,38 +252,39 @@ google-auth==2.41.1 # google-cloud-pubsub # google-cloud-vision # google-generativeai -google-auth-httplib2==0.2.0 +google-auth-httplib2==0.3.0 # via google-api-python-client google-cloud-bigquery==3.29.0 # via pathway -google-cloud-core==2.4.3 +google-cloud-core==2.5.0 # via google-cloud-bigquery -google-cloud-pubsub==2.31.1 +google-cloud-pubsub==2.34.0 # via pathway -google-cloud-vision==3.10.2 +google-cloud-vision==3.11.0 # via unstructured -google-crc32c==1.7.1 +google-crc32c==1.8.0 # via google-resumable-media -google-generativeai==0.8.5 +google-generativeai==0.8.6 # via pathway -google-resumable-media==2.7.2 +google-resumable-media==2.8.0 # via google-cloud-bigquery -googleapis-common-protos==1.70.0 +googleapis-common-protos==1.72.0 # via # google-api-core # grpc-google-iam-v1 # grpcio-status # opentelemetry-exporter-otlp-proto-grpc -greenlet==3.2.4 +greenlet==3.3.0 # via sqlalchemy -griffe==1.14.0 +griffe==1.15.0 # via banks -grpc-google-iam-v1==0.14.2 +grpc-google-iam-v1==0.14.3 # via google-cloud-pubsub -grpcio==1.75.1 +grpcio==1.76.0 # via # google-api-core # google-cloud-pubsub + # google-cloud-vision # googleapis-common-protos # grpc-google-iam-v1 # grpcio-status @@ -288,9 +297,9 @@ h11==0.16.0 # via # httpcore # uvicorn -h3==4.3.1 +h3==4.4.1 # via pathway -hf-xet==1.1.10 ; platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64' +hf-xet==1.2.0 ; platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64' # via huggingface-hub html5lib==1.1 # via unstructured @@ -312,12 +321,11 @@ httpx==0.28.1 # mcp # openai # unstructured-client -httpx-sse==0.4.0 +httpx-sse==0.4.3 # via - # cohere # langchain-community # mcp -huggingface-hub==0.35.3 +huggingface-hub==0.36.0 # via # accelerate # docling @@ -330,26 +338,26 @@ huggingface-hub==0.35.3 # unstructured-inference humanfriendly==10.0 # via coloredlogs -idna==3.10 +identify==2.6.15 + # via pre-commit +idna==3.11 # via # anyio # email-validator # httpx # requests # yarl -imageio==2.37.0 - # via scikit-image -importlib-metadata==8.7.0 +importlib-metadata==8.7.1 # via # litellm # opentelemetry-api -instructor==1.11.3 +instructor==1.12.0 # via pathway -ipython==9.6.0 +ipython==9.8.0 # via ipywidgets ipython-pygments-lexers==1.1.1 # via ipython -ipywidgets==8.1.7 +ipywidgets==8.1.8 # via jupyter-bokeh isodate==0.7.2 # via openapi-core @@ -370,11 +378,11 @@ jmespath==1.0.1 # boto3 # botocore # pathway -joblib==1.5.2 +joblib==1.5.3 # via # nltk # scikit-learn -jsonlines==3.1.0 +jsonlines==4.0.0 # via docling-ibm-models jsonpatch==1.33 # via langchain-core @@ -400,7 +408,7 @@ jsonschema-specifications==2025.9.1 # openapi-schema-validator jupyter-bokeh==4.0.5 # via pathway -jupyterlab-widgets==3.0.15 +jupyterlab-widgets==3.0.16 # via ipywidgets kiwisolver==1.4.9 # via matplotlib @@ -413,8 +421,9 @@ langchain-community==0.3.31 # via # -r ./comps/third_parties/pathway/src/requirements.in # pathway -langchain-core==0.3.78 +langchain-core==0.3.81 # via + # -r ./comps/third_parties/pathway/src/requirements.in # langchain # langchain-community # langchain-huggingface @@ -425,15 +434,13 @@ langchain-text-splitters==0.3.11 # via langchain langdetect==1.0.9 # via unstructured -langsmith==0.4.33 +langsmith==0.5.1 # via # langchain # langchain-community # langchain-core latex2mathml==3.78.1 # via docling-core -lazy-loader==0.4 - # via scikit-image lazy-object-proxy==1.12.0 # via openapi-spec-validator linkify-it-py==2.0.3 @@ -445,7 +452,7 @@ llama-index-core==0.12.52.post1 # llama-index-readers-pathway # llama-index-retrievers-pathway # pathway -llama-index-instrumentation==0.4.1 +llama-index-instrumentation==0.4.2 # via llama-index-workflows llama-index-readers-pathway==0.3.0 # via pathway @@ -453,14 +460,14 @@ llama-index-retrievers-pathway==0.3.0 # via pathway llama-index-workflows==1.3.0 # via llama-index-core -lxml==5.4.0 +lxml==6.0.2 # via # docling # pikepdf # python-docx # python-pptx # unstructured -markdown==3.9 +markdown==3.10 # via # panel # unstructured @@ -469,25 +476,27 @@ markdown-it-py==4.0.0 # mdit-py-plugins # panel # rich -marko==2.2.0 +marko==2.2.1 # via docling markupsafe==3.0.3 # via # jinja2 # werkzeug -marshmallow==3.26.1 +marshmallow==3.26.2 # via dataclasses-json -matplotlib==3.10.7 +matplotlib==3.10.8 # via unstructured-inference -matplotlib-inline==0.1.7 +matplotlib-inline==0.2.1 # via ipython -mcp==1.16.0 - # via fastmcp +mcp==1.25.0 + # via + # -r ./comps/third_parties/pathway/src/requirements.in + # fastmcp mdit-py-plugins==0.5.0 # via panel mdurl==0.1.2 # via markdown-it-py -ml-dtypes==0.5.3 +ml-dtypes==0.5.4 # via onnx more-itertools==10.8.0 # via openapi-core @@ -505,30 +514,29 @@ multiprocess==0.70.18 # via mpire mypy-extensions==1.1.0 # via typing-inspect -narwhals==2.7.0 - # via bokeh +narwhals==2.14.0 + # via + # bokeh + # panel nest-asyncio==1.6.0 # via llama-index-core -networkx==3.5 +networkx==3.6.1 # via # llama-index-core # pathway - # scikit-image # unstructured -ninja==1.13.0 - # via easyocr nltk==3.9.2 # via # llama-index-core # unstructured -numpy==2.3.3 +nodeenv==1.10.0 + # via pre-commit +numpy==2.4.0 # via # accelerate # bokeh # contourpy # docling-ibm-models - # easyocr - # imageio # langchain-community # llama-index-core # matplotlib @@ -536,30 +544,32 @@ numpy==2.3.3 # onnx # onnxruntime # opencv-python - # opencv-python-headless # pandas # pathway # pycocotools + # rapidocr # safetensors - # scikit-image # scikit-learn # scipy # shapely - # tifffile # transformers # unstructured # unstructured-inference +ocrmac==1.0.0 ; sys_platform == 'darwin' + # via docling olefile==0.47 # via # msoffcrypto-tool # python-oxmsg omegaconf==2.3.0 - # via effdet -onnx==1.19.0 + # via + # effdet + # rapidocr +onnx==1.20.0 # via # unstructured # unstructured-inference -onnxruntime==1.23.1 +onnxruntime==1.23.2 # via # unstructured # unstructured-inference @@ -569,7 +579,7 @@ openai==1.109.1 # instructor # litellm # pathway -openapi-core==0.19.5 +openapi-core==0.22.0 # via fastmcp openapi-pydantic==0.5.1 # via fastmcp @@ -580,38 +590,36 @@ openapi-schema-validator==0.6.3 openapi-spec-validator==0.7.2 # via openapi-core opencv-python==4.11.0.86 - # via unstructured-inference -opencv-python-headless==4.11.0.86 # via - # docling-ibm-models - # easyocr + # rapidocr + # unstructured-inference openpyxl==3.1.5 # via # docling # unstructured -opentelemetry-api==1.37.0 +opentelemetry-api==1.39.1 # via # google-cloud-pubsub # opentelemetry-exporter-otlp-proto-grpc # opentelemetry-sdk # opentelemetry-semantic-conventions # pathway -opentelemetry-exporter-otlp-proto-common==1.37.0 +opentelemetry-exporter-otlp-proto-common==1.39.1 # via opentelemetry-exporter-otlp-proto-grpc -opentelemetry-exporter-otlp-proto-grpc==1.37.0 +opentelemetry-exporter-otlp-proto-grpc==1.39.1 # via pathway -opentelemetry-proto==1.37.0 +opentelemetry-proto==1.39.1 # via # opentelemetry-exporter-otlp-proto-common # opentelemetry-exporter-otlp-proto-grpc -opentelemetry-sdk==1.37.0 +opentelemetry-sdk==1.39.1 # via # google-cloud-pubsub # opentelemetry-exporter-otlp-proto-grpc # pathway -opentelemetry-semantic-conventions==0.58b0 +opentelemetry-semantic-conventions==0.60b1 # via opentelemetry-sdk -orjson==3.11.3 ; platform_python_implementation != 'PyPy' +orjson==3.11.5 ; platform_python_implementation != 'PyPy' # via langsmith packaging==25.0 # via @@ -621,13 +629,12 @@ packaging==25.0 # huggingface-hub # langchain-core # langsmith - # lazy-loader # marshmallow # matplotlib # onnxruntime # panel # pikepdf - # scikit-image + # safetensors # transformers # unstructured-pytesseract pandas==2.3.3 @@ -639,23 +646,21 @@ pandas==2.3.3 # pathway # unstructured # unstructured-inference -panel==1.8.2 +panel==1.8.4 # via pathway -param==2.2.1 +param==2.3.1 # via # panel # pyviz-comms -parse==1.20.2 - # via openapi-core parso==0.8.5 # via jedi pathable==0.4.4 # via jsonschema-path -pathway==0.26.3 +pathway==0.27.1 # via -r ./comps/third_parties/pathway/src/requirements.in pdf2image==1.17.0 # via unstructured -pdfminer-six==20250506 +pdfminer-six==20251229 # via # unstructured # unstructured-inference @@ -663,7 +668,7 @@ pexpect==4.9.0 ; sys_platform != 'emscripten' and sys_platform != 'win32' # via ipython pi-heif==1.1.1 # via unstructured -pikepdf==9.11.0 +pikepdf==10.1.0 # via unstructured pillow==11.3.0 # via @@ -672,32 +677,33 @@ pillow==11.3.0 # docling-core # docling-ibm-models # docling-parse - # easyocr - # imageio # llama-index-core # matplotlib + # ocrmac # pdf2image # pi-heif # pikepdf # python-pptx - # scikit-image - # sentence-transformers + # rapidocr # unstructured-pytesseract -platformdirs==4.5.0 +platformdirs==4.5.1 # via # banks # llama-index-core + # virtualenv pluggy==1.6.0 # via docling -polyfactory==2.22.2 +polyfactory==3.2.0 # via docling +pre-commit==4.5.1 + # via instructor prompt-toolkit==3.0.52 # via ipython propcache==0.4.1 # via # aiohttp # yarl -proto-plus==1.26.1 +proto-plus==1.27.0 # via # google-ai-generativelanguage # google-api-core @@ -717,7 +723,7 @@ protobuf==5.29.5 # onnxruntime # opentelemetry-proto # proto-plus -psutil==7.1.0 +psutil==7.2.1 # via # accelerate # unstructured @@ -737,13 +743,13 @@ pyasn1==0.6.1 # rsa pyasn1-modules==0.4.2 # via google-auth -pyclipper==1.3.0.post6 - # via easyocr -pycocotools==2.0.10 +pyclipper==1.4.0 + # via rapidocr +pycocotools==2.0.11 # via effdet pycparser==2.23 ; implementation_name != 'PyPy' and platform_python_implementation != 'PyPy' # via cffi -pydantic==2.12.0 +pydantic==2.12.5 # via # banks # cohere @@ -767,12 +773,12 @@ pydantic==2.12.0 # pathway # pydantic-settings # unstructured-client -pydantic-core==2.41.1 +pydantic-core==2.41.5 # via # cohere # instructor # pydantic -pydantic-settings==2.11.0 +pydantic-settings==2.12.0 # via # docling # langchain-community @@ -783,15 +789,34 @@ pygments==2.19.2 # ipython-pygments-lexers # mpire # rich +pyjwt==2.10.1 + # via mcp pylatexenc==2.10 # via docling -pypandoc==1.15 +pyobjc-core==12.1 ; sys_platform == 'darwin' + # via + # pyobjc-framework-cocoa + # pyobjc-framework-coreml + # pyobjc-framework-quartz + # pyobjc-framework-vision +pyobjc-framework-cocoa==12.1 ; sys_platform == 'darwin' + # via + # pyobjc-framework-coreml + # pyobjc-framework-quartz + # pyobjc-framework-vision +pyobjc-framework-coreml==12.1 ; sys_platform == 'darwin' + # via pyobjc-framework-vision +pyobjc-framework-quartz==12.1 ; sys_platform == 'darwin' + # via pyobjc-framework-vision +pyobjc-framework-vision==12.1 ; sys_platform == 'darwin' + # via ocrmac +pypandoc==1.16.2 # via unstructured -pyparsing==3.2.5 +pyparsing==3.3.1 # via # httplib2 # matplotlib -pypdf==6.1.1 +pypdf==6.5.0 # via # unstructured # unstructured-client @@ -803,8 +828,6 @@ pyperclip==1.11.0 # via fastmcp pyreadline3==3.5.4 ; sys_platform == 'win32' # via humanfriendly -python-bidi==0.6.6 - # via easyocr python-dateutil==2.9.0.post0 # via # botocore @@ -815,16 +838,16 @@ python-docx==1.2.0 # via # docling # unstructured -python-dotenv==1.1.1 +python-dotenv==1.2.1 # via # fastmcp # litellm # pydantic-settings -python-iso639==2025.2.18 +python-iso639==2025.11.16 # via unstructured python-magic==0.4.27 # via unstructured -python-multipart==0.0.20 +python-multipart==0.0.21 # via # mcp # unstructured-inference @@ -834,7 +857,7 @@ python-pptx==1.0.2 # via # docling # unstructured -python-sat==1.8.dev23 +python-sat==1.8.dev26 # via pathway pytz==2025.2 # via pandas @@ -850,7 +873,6 @@ pyyaml==6.0.3 # accelerate # bokeh # docling-core - # easyocr # huggingface-hub # jsonschema-path # langchain @@ -858,18 +880,22 @@ pyyaml==6.0.3 # langchain-core # llama-index-core # omegaconf + # pre-commit + # rapidocr # timm # transformers -rapidfuzz==3.14.1 +rapidfuzz==3.14.3 # via # unstructured # unstructured-inference +rapidocr==3.4.5 + # via docling referencing==0.36.2 # via # jsonschema # jsonschema-path # jsonschema-specifications -regex==2025.9.18 +regex==2025.11.3 # via # nltk # tiktoken @@ -891,6 +917,7 @@ requests==2.32.5 # llama-index-retrievers-pathway # panel # pathway + # rapidocr # requests-toolbelt # tiktoken # transformers @@ -901,7 +928,7 @@ requests-toolbelt==1.0.0 # unstructured-client rfc3339-validator==0.1.4 # via openapi-schema-validator -rich==14.1.0 +rich==14.2.0 # via # cyclopts # fastmcp @@ -909,9 +936,9 @@ rich==14.1.0 # pathway # rich-rst # typer -rich-rst==1.3.1 +rich-rst==1.3.2 # via cyclopts -rpds-py==0.27.1 +rpds-py==0.30.0 # via # jsonschema # referencing @@ -921,31 +948,27 @@ rtree==1.4.1 # via # docling # docling-ibm-models -s3transfer==0.14.0 +s3transfer==0.16.0 # via boto3 -safetensors==0.6.2 +safetensors==0.7.0 # via # accelerate # docling-ibm-models # timm # transformers -scikit-image==0.25.2 - # via easyocr -scikit-learn==1.7.2 +scikit-learn==1.8.0 # via # pathway # sentence-transformers -scipy==1.16.2 +scipy==1.16.3 # via # docling - # easyocr - # scikit-image # scikit-learn # sentence-transformers # unstructured-inference semchunk==2.2.2 # via docling-core -sentence-transformers==5.1.1 +sentence-transformers==5.2.0 # via -r ./comps/third_parties/pathway/src/requirements.in setuptools==80.9.0 # via @@ -953,8 +976,8 @@ setuptools==80.9.0 # llama-index-core shapely==2.1.2 # via - # easyocr # pathway + # rapidocr shellingham==1.5.4 # via typer six==1.17.0 @@ -964,26 +987,28 @@ six==1.17.0 # langdetect # python-dateutil # python-sat + # rapidocr # rfc3339-validator smmap==5.0.2 # via gitdb sniffio==1.3.1 - # via - # anyio - # openai -soupsieve==2.8 + # via openai +soupsieve==2.8.1 # via beautifulsoup4 -sqlalchemy==2.0.43 +sqlalchemy==2.0.45 # via # langchain # langchain-community # llama-index-core -sse-starlette==3.0.2 +sse-starlette==3.1.1 # via mcp stack-data==0.6.3 # via ipython -starlette==0.48.0 - # via mcp +starlette==0.50.0 + # via + # -r ./comps/third_parties/pathway/src/requirements.in + # mcp + # sse-starlette sympy==1.14.0 # via # onnxruntime @@ -1000,15 +1025,13 @@ tenacity==9.1.2 # pathway threadpoolctl==3.6.0 # via scikit-learn -tifffile==2025.10.4 - # via scikit-image tiktoken==0.12.0 # via # -r ./comps/third_parties/pathway/src/requirements.in # litellm # llama-index-core # pathway -timm==1.0.20 +timm==1.0.22 # via # effdet # unstructured-inference @@ -1018,7 +1041,7 @@ tokenizers==0.22.1 # langchain-huggingface # litellm # transformers -tornado==6.5.2 ; sys_platform != 'emscripten' +tornado==6.5.4 ; sys_platform != 'emscripten' # via bokeh tqdm==4.67.1 # via @@ -1031,6 +1054,7 @@ tqdm==4.67.1 # nltk # openai # panel + # rapidocr # semchunk # sentence-transformers # transformers @@ -1040,12 +1064,24 @@ traitlets==5.14.3 # ipython # ipywidgets # matplotlib-inline -transformers==4.57.0 +transformers==4.57.3 # via # docling-core # docling-ibm-models # sentence-transformers # unstructured-inference +tree-sitter==0.25.2 + # via docling-core +tree-sitter-c==0.24.1 + # via docling-core +tree-sitter-java==0.23.5 + # via docling-core +tree-sitter-javascript==0.25.0 + # via docling-core +tree-sitter-python==0.25.0 + # via docling-core +tree-sitter-typescript==0.23.2 + # via docling-core typer==0.19.2 # via # docling @@ -1056,7 +1092,6 @@ types-requests==2.32.4.20250913 typing-extensions==4.15.0 # via # aiosignal - # aiosqlite # anyio # beautifulsoup4 # cohere @@ -1069,6 +1104,7 @@ typing-extensions==4.15.0 # langchain-core # llama-index-core # llama-index-workflows + # mcp # onnx # openai # openapi-core @@ -1098,42 +1134,48 @@ typing-inspect==0.9.0 # llama-index-core typing-inspection==0.4.2 # via + # mcp # pydantic # pydantic-settings -tzdata==2025.2 +tzdata==2025.3 # via # faker # pandas uc-micro-py==1.0.3 # via linkify-it-py -unstructured==0.18.15 +unstructured==0.18.21 # via -r ./comps/third_parties/pathway/src/requirements.in -unstructured-client==0.42.3 +unstructured-client==0.42.6 # via unstructured -unstructured-inference==1.0.5 +unstructured-inference==1.1.1 # via unstructured unstructured-pytesseract==0.3.15 # via unstructured uritemplate==4.2.0 # via google-api-python-client -urllib3==2.5.0 +urllib3==2.6.2 # via + # -r ./comps/third_parties/pathway/src/requirements.in # botocore # requests # types-requests -uvicorn==0.37.0 ; sys_platform != 'emscripten' +uuid-utils==0.12.0 + # via langsmith +uvicorn==0.40.0 ; sys_platform != 'emscripten' # via mcp +virtualenv==20.35.4 + # via pre-commit wcwidth==0.2.14 # via prompt-toolkit webencodings==0.5.1 # via # bleach # html5lib -werkzeug==3.1.1 +werkzeug==3.1.4 # via openapi-core -widgetsnbextension==4.0.14 +widgetsnbextension==4.0.15 # via ipywidgets -wrapt==1.17.3 +wrapt==2.0.1 # via # deprecated # llama-index-core @@ -1142,7 +1184,7 @@ xlrd==2.0.2 # via unstructured xlsxwriter==3.2.9 # via python-pptx -xyzservices==2025.4.0 +xyzservices==2025.11.0 # via bokeh yarl==1.22.0 # via aiohttp diff --git a/comps/third_parties/pathway/src/requirements-gpu.txt b/comps/third_parties/pathway/src/requirements-gpu.txt index e3f5bbe16b..de4af6cf16 100644 --- a/comps/third_parties/pathway/src/requirements-gpu.txt +++ b/comps/third_parties/pathway/src/requirements-gpu.txt @@ -1,12 +1,15 @@ # This file was autogenerated by uv via the following command: # uv pip compile --python=/usr/local/bin/python3.11 ./comps/third_parties/pathway/src/requirements.in --universal -o ./comps/third_parties/pathway/src/requirements-gpu.txt -accelerate==1.10.1 - # via unstructured-inference -aiofiles==24.1.0 +accelerate==1.12.0 + # via + # docling + # docling-ibm-models + # unstructured-inference +aiofiles==25.1.0 # via unstructured-client aiohappyeyeballs==2.6.1 # via aiohttp -aiohttp==3.13.0 +aiohttp==3.13.2 # via # aiohttp-cors # instructor @@ -18,13 +21,13 @@ aiohttp-cors==0.8.1 # via pathway aiosignal==1.4.0 # via aiohttp -aiosqlite==0.21.0 +aiosqlite==0.22.1 # via llama-index-core annotated-types==0.7.0 # via pydantic antlr4-python3-runtime==4.9.3 # via omegaconf -anyio==4.11.0 +anyio==4.12.0 # via # httpx # mcp @@ -33,7 +36,7 @@ anyio==4.11.0 # starlette appdirs==1.4.4 # via fs -asttokens==3.0.0 +asttokens==3.0.1 # via stack-data async-lru==2.0.5 # via pathway @@ -41,9 +44,10 @@ attrs==25.4.0 # via # aiohttp # cyclopts + # jsonlines # jsonschema # referencing -authlib==1.6.5 +authlib==1.6.6 # via fastmcp backoff==2.2.1 # via unstructured @@ -51,67 +55,77 @@ banks==2.2.0 # via llama-index-core beartype==0.15.0 # via pathway -beautifulsoup4==4.14.2 - # via unstructured -bleach==6.2.0 +beautifulsoup4==4.14.3 + # via + # docling + # unstructured +bleach==6.3.0 # via panel -bokeh==3.8.0 +bokeh==3.8.1 # via # jupyter-bokeh # panel -boto3==1.40.48 +boto3==1.42.18 # via pathway -botocore==1.40.48 +botocore==1.42.18 # via # boto3 # s3transfer -cachetools==6.2.0 +cachetools==6.2.4 # via google-auth -certifi==2025.10.5 +certifi==2025.11.12 # via + # docling # httpcore # httpx # requests cffi==2.0.0 ; platform_python_implementation != 'PyPy' # via cryptography -charset-normalizer==3.4.3 +cfgv==3.5.0 + # via pre-commit +charset-normalizer==3.4.4 # via # pdfminer-six # requests # unstructured -click==8.3.0 +click==8.3.1 # via # litellm # nltk + # ocrmac # pathway # python-oxmsg # typer # uvicorn -cohere==5.18.0 +cohere==5.20.1 # via pathway colorama==0.4.6 # via # click + # colorlog # griffe # ipython # tqdm coloredlogs==15.0.1 # via onnxruntime +colorlog==6.10.1 + # via rapidocr comm==0.2.3 # via ipywidgets contourpy==1.3.3 # via # bokeh # matplotlib -cryptography==46.0.2 +cryptography==46.0.3 # via # authlib # msoffcrypto-tool # pdfminer-six + # pyjwt # unstructured-client cycler==0.12.1 # via matplotlib -cyclopts==3.24.0 +cyclopts==4.4.3 # via fastmcp dataclasses-json==0.6.7 # via @@ -122,27 +136,42 @@ decorator==5.2.1 # via ipython deltalake==0.17.4 # via pathway -deprecated==1.2.18 +deprecated==1.3.1 # via # banks # llama-index-core # llama-index-instrumentation # pikepdf +dill==0.4.0 + # via multiprocess dirtyjson==1.0.8 # via llama-index-core diskcache==5.6.3 # via # instructor # pathway +distlib==0.4.0 + # via virtualenv distro==1.9.0 # via openai dnspython==2.8.0 # via email-validator +docling==2.66.0 + # via -r ./comps/third_parties/pathway/src/requirements.in +docling-core==2.57.0 + # via + # docling + # docling-ibm-models + # docling-parse +docling-ibm-models==3.10.3 + # via docling +docling-parse==4.7.2 + # via docling docstring-parser==0.17.0 # via # cyclopts # instructor -docutils==0.22.2 +docutils==0.22.4 # via rich-rst effdet==0.4.1 # via unstructured @@ -152,28 +181,32 @@ emoji==2.15.0 # via unstructured et-xmlfile==2.0.0 # via openpyxl -exceptiongroup==1.3.0 +exceptiongroup==1.3.1 # via fastmcp executing==2.2.1 # via stack-data -fastavro==1.12.0 +faker==40.1.0 + # via polyfactory +fastavro==1.12.1 # via cohere fastmcp==2.12.4 # via pathway -fastuuid==0.13.5 +fastuuid==0.14.0 # via litellm -filelock==3.20.0 +filelock==3.20.1 # via # huggingface-hub # torch # transformers + # virtualenv filetype==1.2.0 # via + # docling # llama-index-core # unstructured -flatbuffers==25.9.23 +flatbuffers==25.12.19 # via onnxruntime -fonttools==4.60.1 +fonttools==4.61.1 # via matplotlib frozenlist==1.8.0 # via @@ -181,7 +214,7 @@ frozenlist==1.8.0 # aiosignal fs==2.4.16 # via pathway -fsspec==2025.9.0 +fsspec==2025.12.0 # via # huggingface-hub # llama-index-core @@ -206,11 +239,11 @@ google-api-core==2.24.2 # google-cloud-vision # google-generativeai # pathway -google-api-python-client==2.184.0 +google-api-python-client==2.187.0 # via # google-generativeai # pathway -google-auth==2.41.1 +google-auth==2.45.0 # via # google-ai-generativelanguage # google-api-core @@ -221,38 +254,39 @@ google-auth==2.41.1 # google-cloud-pubsub # google-cloud-vision # google-generativeai -google-auth-httplib2==0.2.0 +google-auth-httplib2==0.3.0 # via google-api-python-client google-cloud-bigquery==3.29.0 # via pathway -google-cloud-core==2.4.3 +google-cloud-core==2.5.0 # via google-cloud-bigquery -google-cloud-pubsub==2.31.1 +google-cloud-pubsub==2.34.0 # via pathway -google-cloud-vision==3.10.2 +google-cloud-vision==3.11.0 # via unstructured -google-crc32c==1.7.1 +google-crc32c==1.8.0 # via google-resumable-media -google-generativeai==0.8.5 +google-generativeai==0.8.6 # via pathway -google-resumable-media==2.7.2 +google-resumable-media==2.8.0 # via google-cloud-bigquery -googleapis-common-protos==1.70.0 +googleapis-common-protos==1.72.0 # via # google-api-core # grpc-google-iam-v1 # grpcio-status # opentelemetry-exporter-otlp-proto-grpc -greenlet==3.2.4 +greenlet==3.3.0 # via sqlalchemy -griffe==1.14.0 +griffe==1.15.0 # via banks -grpc-google-iam-v1==0.14.2 +grpc-google-iam-v1==0.14.3 # via google-cloud-pubsub -grpcio==1.75.1 +grpcio==1.76.0 # via # google-api-core # google-cloud-pubsub + # google-cloud-vision # googleapis-common-protos # grpc-google-iam-v1 # grpcio-status @@ -265,9 +299,9 @@ h11==0.16.0 # via # httpcore # uvicorn -h3==4.3.1 +h3==4.4.1 # via pathway -hf-xet==1.1.10 ; platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64' +hf-xet==1.2.0 ; platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64' # via huggingface-hub html5lib==1.1 # via unstructured @@ -289,14 +323,15 @@ httpx==0.28.1 # mcp # openai # unstructured-client -httpx-sse==0.4.0 +httpx-sse==0.4.3 # via - # cohere # langchain-community # mcp -huggingface-hub==0.35.3 +huggingface-hub==0.36.0 # via # accelerate + # docling + # docling-ibm-models # langchain-huggingface # sentence-transformers # timm @@ -305,24 +340,26 @@ huggingface-hub==0.35.3 # unstructured-inference humanfriendly==10.0 # via coloredlogs -idna==3.10 +identify==2.6.15 + # via pre-commit +idna==3.11 # via # anyio # email-validator # httpx # requests # yarl -importlib-metadata==8.7.0 +importlib-metadata==8.7.1 # via # litellm # opentelemetry-api -instructor==1.11.3 +instructor==1.12.0 # via pathway -ipython==9.6.0 +ipython==9.8.0 # via ipywidgets ipython-pygments-lexers==1.1.1 # via ipython -ipywidgets==8.1.7 +ipywidgets==8.1.8 # via jupyter-bokeh isodate==0.7.2 # via openapi-core @@ -344,16 +381,21 @@ jmespath==1.0.1 # boto3 # botocore # pathway -joblib==1.5.2 +joblib==1.5.3 # via # nltk # scikit-learn +jsonlines==4.0.0 + # via docling-ibm-models jsonpatch==1.33 # via langchain-core jsonpointer==3.0.0 # via jsonpatch +jsonref==1.1.0 + # via docling-core jsonschema==4.25.1 # via + # docling-core # litellm # mcp # openapi-core @@ -369,7 +411,7 @@ jsonschema-specifications==2025.9.1 # openapi-schema-validator jupyter-bokeh==4.0.5 # via pathway -jupyterlab-widgets==3.0.15 +jupyterlab-widgets==3.0.16 # via ipywidgets kiwisolver==1.4.9 # via matplotlib @@ -382,8 +424,9 @@ langchain-community==0.3.31 # via # -r ./comps/third_parties/pathway/src/requirements.in # pathway -langchain-core==0.3.78 +langchain-core==0.3.81 # via + # -r ./comps/third_parties/pathway/src/requirements.in # langchain # langchain-community # langchain-huggingface @@ -394,11 +437,13 @@ langchain-text-splitters==0.3.11 # via langchain langdetect==1.0.9 # via unstructured -langsmith==0.4.33 +langsmith==0.5.1 # via # langchain # langchain-community # langchain-core +latex2mathml==3.78.1 + # via docling-core lazy-object-proxy==1.12.0 # via openapi-spec-validator linkify-it-py==2.0.3 @@ -410,7 +455,7 @@ llama-index-core==0.12.52.post1 # llama-index-readers-pathway # llama-index-retrievers-pathway # pathway -llama-index-instrumentation==0.4.1 +llama-index-instrumentation==0.4.2 # via llama-index-workflows llama-index-readers-pathway==0.3.0 # via pathway @@ -420,11 +465,12 @@ llama-index-workflows==1.3.0 # via llama-index-core lxml==6.0.2 # via + # docling # pikepdf # python-docx # python-pptx # unstructured -markdown==3.9 +markdown==3.10 # via # panel # unstructured @@ -433,26 +479,32 @@ markdown-it-py==4.0.0 # mdit-py-plugins # panel # rich +marko==2.2.1 + # via docling markupsafe==3.0.3 # via # jinja2 # werkzeug -marshmallow==3.26.1 +marshmallow==3.26.2 # via dataclasses-json -matplotlib==3.10.7 +matplotlib==3.10.8 # via unstructured-inference -matplotlib-inline==0.1.7 +matplotlib-inline==0.2.1 # via ipython -mcp==1.16.0 - # via fastmcp +mcp==1.25.0 + # via + # -r ./comps/third_parties/pathway/src/requirements.in + # fastmcp mdit-py-plugins==0.5.0 # via panel mdurl==0.1.2 # via markdown-it-py -ml-dtypes==0.5.3 +ml-dtypes==0.5.4 # via onnx more-itertools==10.8.0 # via openapi-core +mpire==2.10.2 + # via semchunk mpmath==1.3.0 # via sympy msoffcrypto-tool==5.4.2 @@ -461,13 +513,17 @@ multidict==6.7.0 # via # aiohttp # yarl +multiprocess==0.70.18 + # via mpire mypy-extensions==1.1.0 # via typing-inspect -narwhals==2.7.0 - # via bokeh +narwhals==2.14.0 + # via + # bokeh + # panel nest-asyncio==1.6.0 # via llama-index-core -networkx==3.5 +networkx==3.6.1 # via # llama-index-core # pathway @@ -477,11 +533,14 @@ nltk==3.9.2 # via # llama-index-core # unstructured -numpy==2.3.3 +nodeenv==1.10.0 + # via pre-commit +numpy==2.4.0 # via # accelerate # bokeh # contourpy + # docling-ibm-models # langchain-community # llama-index-core # matplotlib @@ -492,6 +551,8 @@ numpy==2.3.3 # pandas # pathway # pycocotools + # rapidocr + # safetensors # scikit-learn # scipy # shapely @@ -526,7 +587,7 @@ nvidia-cusparse-cu12==12.5.8.93 ; platform_machine == 'x86_64' and sys_platform # torch nvidia-cusparselt-cu12==0.7.1 ; platform_machine == 'x86_64' and sys_platform == 'linux' # via torch -nvidia-nccl-cu12==2.27.3 ; platform_machine == 'x86_64' and sys_platform == 'linux' +nvidia-nccl-cu12==2.27.5 ; platform_machine == 'x86_64' and sys_platform == 'linux' # via torch nvidia-nvjitlink-cu12==12.8.93 ; platform_machine == 'x86_64' and sys_platform == 'linux' # via @@ -534,19 +595,25 @@ nvidia-nvjitlink-cu12==12.8.93 ; platform_machine == 'x86_64' and sys_platform = # nvidia-cusolver-cu12 # nvidia-cusparse-cu12 # torch +nvidia-nvshmem-cu12==3.3.20 ; platform_machine == 'x86_64' and sys_platform == 'linux' + # via torch nvidia-nvtx-cu12==12.8.90 ; platform_machine == 'x86_64' and sys_platform == 'linux' # via torch +ocrmac==1.0.0 ; sys_platform == 'darwin' + # via docling olefile==0.47 # via # msoffcrypto-tool # python-oxmsg omegaconf==2.3.0 - # via effdet -onnx==1.19.0 + # via + # effdet + # rapidocr +onnx==1.20.0 # via # unstructured # unstructured-inference -onnxruntime==1.23.1 +onnxruntime==1.23.2 # via # unstructured # unstructured-inference @@ -556,7 +623,7 @@ openai==1.109.1 # instructor # litellm # pathway -openapi-core==0.19.5 +openapi-core==0.22.0 # via fastmcp openapi-pydantic==0.5.1 # via fastmcp @@ -567,32 +634,36 @@ openapi-schema-validator==0.6.3 openapi-spec-validator==0.7.2 # via openapi-core opencv-python==4.11.0.86 - # via unstructured-inference + # via + # rapidocr + # unstructured-inference openpyxl==3.1.5 - # via unstructured -opentelemetry-api==1.37.0 + # via + # docling + # unstructured +opentelemetry-api==1.39.1 # via # google-cloud-pubsub # opentelemetry-exporter-otlp-proto-grpc # opentelemetry-sdk # opentelemetry-semantic-conventions # pathway -opentelemetry-exporter-otlp-proto-common==1.37.0 +opentelemetry-exporter-otlp-proto-common==1.39.1 # via opentelemetry-exporter-otlp-proto-grpc -opentelemetry-exporter-otlp-proto-grpc==1.37.0 +opentelemetry-exporter-otlp-proto-grpc==1.39.1 # via pathway -opentelemetry-proto==1.37.0 +opentelemetry-proto==1.39.1 # via # opentelemetry-exporter-otlp-proto-common # opentelemetry-exporter-otlp-proto-grpc -opentelemetry-sdk==1.37.0 +opentelemetry-sdk==1.39.1 # via # google-cloud-pubsub # opentelemetry-exporter-otlp-proto-grpc # pathway -opentelemetry-semantic-conventions==0.58b0 +opentelemetry-semantic-conventions==0.60b1 # via opentelemetry-sdk -orjson==3.11.3 ; platform_python_implementation != 'PyPy' +orjson==3.11.5 ; platform_python_implementation != 'PyPy' # via langsmith packaging==25.0 # via @@ -607,32 +678,33 @@ packaging==25.0 # onnxruntime # panel # pikepdf + # safetensors # transformers # unstructured-pytesseract pandas==2.3.3 # via # bokeh + # docling + # docling-core # panel # pathway # unstructured # unstructured-inference -panel==1.8.2 +panel==1.8.4 # via pathway -param==2.2.1 +param==2.3.1 # via # panel # pyviz-comms -parse==1.20.2 - # via openapi-core parso==0.8.5 # via jedi pathable==0.4.4 # via jsonschema-path -pathway==0.26.3 +pathway==0.27.1 # via -r ./comps/third_parties/pathway/src/requirements.in pdf2image==1.17.0 # via unstructured -pdfminer-six==20250506 +pdfminer-six==20251229 # via # unstructured # unstructured-inference @@ -640,31 +712,43 @@ pexpect==4.9.0 ; sys_platform != 'emscripten' and sys_platform != 'win32' # via ipython pi-heif==1.1.1 # via unstructured -pikepdf==9.11.0 +pikepdf==10.1.0 # via unstructured pillow==11.3.0 # via # bokeh + # docling + # docling-core + # docling-ibm-models + # docling-parse # llama-index-core # matplotlib + # ocrmac # pdf2image # pi-heif # pikepdf # python-pptx - # sentence-transformers + # rapidocr # torchvision # unstructured-pytesseract -platformdirs==4.5.0 +platformdirs==4.5.1 # via # banks # llama-index-core + # virtualenv +pluggy==1.6.0 + # via docling +polyfactory==3.2.0 + # via docling +pre-commit==4.5.1 + # via instructor prompt-toolkit==3.0.52 # via ipython propcache==0.4.1 # via # aiohttp # yarl -proto-plus==1.26.1 +proto-plus==1.27.0 # via # google-ai-generativelanguage # google-api-core @@ -684,7 +768,7 @@ protobuf==5.29.5 # onnxruntime # opentelemetry-proto # proto-plus -psutil==7.1.0 +psutil==7.2.1 # via # accelerate # unstructured @@ -704,14 +788,20 @@ pyasn1==0.6.1 # rsa pyasn1-modules==0.4.2 # via google-auth -pycocotools==2.0.10 +pyclipper==1.4.0 + # via rapidocr +pycocotools==2.0.11 # via effdet pycparser==2.23 ; implementation_name != 'PyPy' and platform_python_implementation != 'PyPy' # via cffi -pydantic==2.12.0 +pydantic==2.12.5 # via # banks # cohere + # docling + # docling-core + # docling-ibm-models + # docling-parse # fastmcp # google-generativeai # instructor @@ -728,32 +818,57 @@ pydantic==2.12.0 # pathway # pydantic-settings # unstructured-client -pydantic-core==2.41.1 +pydantic-core==2.41.5 # via # cohere # instructor # pydantic -pydantic-settings==2.11.0 +pydantic-settings==2.12.0 # via + # docling # langchain-community # mcp pygments==2.19.2 # via # ipython # ipython-pygments-lexers + # mpire # rich -pypandoc==1.15 +pyjwt==2.10.1 + # via mcp +pylatexenc==2.10 + # via docling +pyobjc-core==12.1 ; sys_platform == 'darwin' + # via + # pyobjc-framework-cocoa + # pyobjc-framework-coreml + # pyobjc-framework-quartz + # pyobjc-framework-vision +pyobjc-framework-cocoa==12.1 ; sys_platform == 'darwin' + # via + # pyobjc-framework-coreml + # pyobjc-framework-quartz + # pyobjc-framework-vision +pyobjc-framework-coreml==12.1 ; sys_platform == 'darwin' + # via pyobjc-framework-vision +pyobjc-framework-quartz==12.1 ; sys_platform == 'darwin' + # via pyobjc-framework-vision +pyobjc-framework-vision==12.1 ; sys_platform == 'darwin' + # via ocrmac +pypandoc==1.16.2 # via unstructured -pyparsing==3.2.5 +pyparsing==3.3.1 # via # httplib2 # matplotlib -pypdf==6.1.1 +pypdf==6.5.0 # via # unstructured # unstructured-client pypdfium2==4.30.0 - # via unstructured-inference + # via + # docling + # unstructured-inference pyperclip==1.11.0 # via fastmcp pyreadline3==3.5.4 ; sys_platform == 'win32' @@ -765,36 +880,44 @@ python-dateutil==2.9.0.post0 # matplotlib # pandas python-docx==1.2.0 - # via unstructured -python-dotenv==1.1.1 + # via + # docling + # unstructured +python-dotenv==1.2.1 # via # fastmcp # litellm # pydantic-settings -python-iso639==2025.2.18 +python-iso639==2025.11.16 # via unstructured python-magic==0.4.27 # via unstructured -python-multipart==0.0.20 +python-multipart==0.0.21 # via # mcp # unstructured-inference python-oxmsg==0.0.2 # via unstructured python-pptx==1.0.2 - # via unstructured -python-sat==1.8.dev23 + # via + # docling + # unstructured +python-sat==1.8.dev26 # via pathway pytz==2025.2 # via pandas pyviz-comms==3.0.6 # via panel pywin32==311 ; sys_platform == 'win32' - # via mcp + # via + # docling-parse + # mcp + # mpire pyyaml==6.0.3 # via # accelerate # bokeh + # docling-core # huggingface-hub # jsonschema-path # langchain @@ -802,18 +925,22 @@ pyyaml==6.0.3 # langchain-core # llama-index-core # omegaconf + # pre-commit + # rapidocr # timm # transformers -rapidfuzz==3.14.1 +rapidfuzz==3.14.3 # via # unstructured # unstructured-inference +rapidocr==3.4.5 + # via docling referencing==0.36.2 # via # jsonschema # jsonschema-path # jsonschema-specifications -regex==2025.9.18 +regex==2025.11.3 # via # nltk # tiktoken @@ -821,6 +948,7 @@ regex==2025.9.18 requests==2.32.5 # via # cohere + # docling # google-api-core # google-cloud-bigquery # huggingface-hub @@ -834,6 +962,7 @@ requests==2.32.5 # llama-index-retrievers-pathway # panel # pathway + # rapidocr # requests-toolbelt # tiktoken # transformers @@ -844,7 +973,7 @@ requests-toolbelt==1.0.0 # unstructured-client rfc3339-validator==0.1.4 # via openapi-schema-validator -rich==14.1.0 +rich==14.2.0 # via # cyclopts # fastmcp @@ -852,40 +981,49 @@ rich==14.1.0 # pathway # rich-rst # typer -rich-rst==1.3.1 +rich-rst==1.3.2 # via cyclopts -rpds-py==0.27.1 +rpds-py==0.30.0 # via # jsonschema # referencing rsa==4.9.1 # via google-auth -s3transfer==0.14.0 +rtree==1.4.1 + # via + # docling + # docling-ibm-models +s3transfer==0.16.0 # via boto3 -safetensors==0.6.2 +safetensors==0.7.0 # via # accelerate + # docling-ibm-models # timm # transformers -scikit-learn==1.7.2 +scikit-learn==1.8.0 # via # pathway # sentence-transformers -scipy==1.16.2 +scipy==1.16.3 # via + # docling # scikit-learn # sentence-transformers # unstructured-inference -sentence-transformers==5.1.1 +semchunk==2.2.2 + # via docling-core +sentence-transformers==5.2.0 # via -r ./comps/third_parties/pathway/src/requirements.in setuptools==80.9.0 # via # fs # llama-index-core # torch - # triton shapely==2.1.2 - # via pathway + # via + # pathway + # rapidocr shellingham==1.5.4 # via typer six==1.17.0 @@ -895,30 +1033,36 @@ six==1.17.0 # langdetect # python-dateutil # python-sat + # rapidocr # rfc3339-validator smmap==5.0.2 # via gitdb sniffio==1.3.1 - # via - # anyio - # openai -soupsieve==2.8 + # via openai +soupsieve==2.8.1 # via beautifulsoup4 -sqlalchemy==2.0.43 +sqlalchemy==2.0.45 # via # langchain # langchain-community # llama-index-core -sse-starlette==3.0.2 +sse-starlette==3.1.1 # via mcp stack-data==0.6.3 # via ipython -starlette==0.48.0 - # via mcp +starlette==0.50.0 + # via + # -r ./comps/third_parties/pathway/src/requirements.in + # mcp + # sse-starlette sympy==1.14.0 # via # onnxruntime # torch +tabulate==0.9.0 + # via + # docling-core + # docling-parse tenacity==9.1.2 # via # instructor @@ -934,7 +1078,7 @@ tiktoken==0.12.0 # litellm # llama-index-core # pathway -timm==1.0.20 +timm==1.0.22 # via # effdet # unstructured-inference @@ -944,28 +1088,36 @@ tokenizers==0.22.1 # langchain-huggingface # litellm # transformers -torch==2.8.0 +torch==2.9.1 # via # accelerate + # docling-ibm-models # effdet + # safetensors # sentence-transformers # timm # torchvision # unstructured-inference -torchvision==0.23.0 +torchvision==0.24.1 # via + # docling-ibm-models # effdet # timm -tornado==6.5.2 ; sys_platform != 'emscripten' +tornado==6.5.4 ; sys_platform != 'emscripten' # via bokeh tqdm==4.67.1 # via + # docling + # docling-ibm-models # google-generativeai # huggingface-hub # llama-index-core + # mpire # nltk # openai # panel + # rapidocr + # semchunk # sentence-transformers # transformers # unstructured @@ -974,23 +1126,40 @@ traitlets==5.14.3 # ipython # ipywidgets # matplotlib-inline -transformers==4.57.0 +transformers==4.57.3 # via + # docling-core + # docling-ibm-models # sentence-transformers # unstructured-inference -triton==3.4.0 ; platform_machine == 'x86_64' and sys_platform == 'linux' +tree-sitter==0.25.2 + # via docling-core +tree-sitter-c==0.24.1 + # via docling-core +tree-sitter-java==0.23.5 + # via docling-core +tree-sitter-javascript==0.25.0 + # via docling-core +tree-sitter-python==0.25.0 + # via docling-core +tree-sitter-typescript==0.23.2 + # via docling-core +triton==3.5.1 ; platform_machine == 'x86_64' and sys_platform == 'linux' # via torch typer==0.19.2 - # via instructor + # via + # docling + # docling-core + # instructor types-requests==2.32.4.20250913 # via cohere typing-extensions==4.15.0 # via # aiosignal - # aiosqlite # anyio # beautifulsoup4 # cohere + # docling-core # exceptiongroup # google-generativeai # grpcio @@ -999,6 +1168,7 @@ typing-extensions==4.15.0 # langchain-core # llama-index-core # llama-index-workflows + # mcp # onnx # openai # openapi-core @@ -1008,6 +1178,7 @@ typing-extensions==4.15.0 # opentelemetry-semantic-conventions # panel # pathway + # polyfactory # pydantic # pydantic-core # python-docx @@ -1028,40 +1199,48 @@ typing-inspect==0.9.0 # llama-index-core typing-inspection==0.4.2 # via + # mcp # pydantic # pydantic-settings -tzdata==2025.2 - # via pandas +tzdata==2025.3 + # via + # faker + # pandas uc-micro-py==1.0.3 # via linkify-it-py -unstructured==0.18.15 +unstructured==0.18.21 # via -r ./comps/third_parties/pathway/src/requirements.in -unstructured-client==0.42.3 +unstructured-client==0.42.6 # via unstructured -unstructured-inference==1.0.5 +unstructured-inference==1.1.1 # via unstructured unstructured-pytesseract==0.3.15 # via unstructured uritemplate==4.2.0 # via google-api-python-client -urllib3==2.5.0 +urllib3==2.6.2 # via + # -r ./comps/third_parties/pathway/src/requirements.in # botocore # requests # types-requests -uvicorn==0.37.0 ; sys_platform != 'emscripten' +uuid-utils==0.12.0 + # via langsmith +uvicorn==0.40.0 ; sys_platform != 'emscripten' # via mcp +virtualenv==20.35.4 + # via pre-commit wcwidth==0.2.14 # via prompt-toolkit webencodings==0.5.1 # via # bleach # html5lib -werkzeug==3.1.1 +werkzeug==3.1.4 # via openapi-core -widgetsnbextension==4.0.14 +widgetsnbextension==4.0.15 # via ipywidgets -wrapt==1.17.3 +wrapt==2.0.1 # via # deprecated # llama-index-core @@ -1070,7 +1249,7 @@ xlrd==2.0.2 # via unstructured xlsxwriter==3.2.9 # via python-pptx -xyzservices==2025.4.0 +xyzservices==2025.11.0 # via bokeh yarl==1.22.0 # via aiohttp diff --git a/comps/third_parties/pathway/src/requirements.in b/comps/third_parties/pathway/src/requirements.in index 449190ec01..ae1787a1f7 100644 --- a/comps/third_parties/pathway/src/requirements.in +++ b/comps/third_parties/pathway/src/requirements.in @@ -1,9 +1,13 @@ langchain +langchain-core>=0.3.81 langchain-community langchain-huggingface docling +mcp>=1.23.0 openai pathway[xpack-llm] sentence-transformers +starlette>=0.49.1 tiktoken unstructured[all-docs] >= 0.16 +urllib3>=2.6.0