-
Notifications
You must be signed in to change notification settings - Fork 7
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Clean up requirements.txt, removed all related to ingest
- Loading branch information
Showing
2 changed files
with
128 additions
and
117 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,59 +1,67 @@ | ||
# On Apple Silicon: pip uninstall grpcio -y; conda install grpcio -y | ||
nomic==2.0.14 | ||
Flask==3.0.0 | ||
flask-cors==4.0.0 | ||
gunicorn==21.2.0 | ||
protobuf==4.25.0 | ||
langchain==0.0.331 | ||
langchainhub==0.1.14 | ||
click==8.1.7 | ||
aiohttp==3.8.6 | ||
wheel==0.41.3 | ||
click==8.1.7 | ||
MarkupSafe==2.1.3 | ||
Werkzeug==3.0.1 | ||
mkdocstrings[python]==0.23.0 | ||
mkdocs-material==9.4.7 | ||
itsdangerous==2.1.2 | ||
wheel==0.41.3 | ||
Flask==3.0.0 | ||
gunicorn==21.2.0 | ||
tiktoken==0.5.1 | ||
Jinja2==3.1.2 | ||
python-dotenv==1.0.0 | ||
flask-cors==4.0.0 | ||
qdrant-client==1.7.3 | ||
mkdocs==1.5.3 | ||
openai==0.28.1 | ||
supabase==2.0.2 | ||
SQLAlchemy==2.0.22 | ||
boto3==1.28.79 | ||
PyMuPDF==1.23.6 | ||
tabulate==0.9.0 | ||
typing-inspect==0.9.0 | ||
typing_extensions==4.8.0 | ||
pysrt==1.1.2 | ||
docx2txt==0.8 | ||
pydub==0.25.1 | ||
ffmpeg-python==0.2.0 | ||
ffprobe==0.5 | ||
ffmpeg==1.4 | ||
beautifulsoup4==4.12.2 | ||
canvasapi==3.2.0 | ||
GitPython==3.1.40 | ||
|
||
# Utils | ||
tiktoken==0.5.1 | ||
python-dotenv==1.0.0 | ||
pydantic==1.10.13 # pydantic v1 works better for ray | ||
flask-executor==1.0.0 | ||
|
||
# AI & core services | ||
nomic==2.0.14 | ||
openai==0.28.1 | ||
langchain==0.0.331 | ||
langchainhub==0.1.14 | ||
|
||
# Data | ||
boto3==1.28.79 | ||
qdrant-client==1.7.3 | ||
supabase==2.0.2 | ||
|
||
# Logging | ||
posthog==3.1.0 | ||
sentry-sdk==1.39.1 | ||
|
||
# Not currently supporting coursera ingest | ||
# cs-dlp @ git+https://github.com/raffaem/[email protected] # previously called coursera-dl | ||
|
||
# removed due to /ingest in Beam | ||
# canvasapi==3.2.0 | ||
# GitPython==3.1.40 | ||
# pysrt==1.1.2 | ||
# docx2txt==0.8 | ||
# pydub==0.25.1 | ||
# ffmpeg-python==0.2.0 | ||
# ffprobe==0.5 | ||
# ffmpeg==1.4 | ||
# beautifulsoup4==4.12.2 | ||
# PyMuPDF==1.23.6 | ||
# pytesseract==0.3.10 # image OCR | ||
# openpyxl==3.1.2 # excel | ||
# networkx==3.2.1 # unused part of excel partitioning :( | ||
# python-pptx==0.6.23 | ||
# unstructured==0.10.29 # causes huge ~5.3 GB of installs. Probbably from onnx: https://github.com/Unstructured-IO/unstructured/blob/ad14321016533dc03c1782f6ebea00bc9c804846/requirements/extra-pdf-image.in#L4 | ||
|
||
# pdf packages for unstructured | ||
# pdf2image==1.16.3 | ||
# pdfminer.six==20221105 | ||
# opencv-python-headless==4.8.1.78 | ||
# unstructured.pytesseract==0.3.12 | ||
# unstructured-inference==0.7.11 # this is the real large one :( | ||
pytesseract==0.3.10 # image OCR | ||
openpyxl==3.1.2 # excel | ||
networkx==3.2.1 # unused part of excel partitioning :( | ||
python-pptx==0.6.23 | ||
unstructured==0.10.29 # causes huge ~5.3 GB of installs. Probbably from onnx: https://github.com/Unstructured-IO/unstructured/blob/ad14321016533dc03c1782f6ebea00bc9c804846/requirements/extra-pdf-image.in#L4 | ||
# unstructured[xlsx,image,pptx]==0.10.29 # causes huge ~5.3 GB of installs. Probbably from onnx: https://github.com/Unstructured-IO/unstructured/blob/ad14321016533dc03c1782f6ebea00bc9c804846/requirements/extra-pdf-image.in#L4 | ||
|
||
# Not currently supporting coursera ingest | ||
# cs-dlp @ git+https://github.com/raffaem/[email protected] # previously called coursera-dl | ||
pydantic==1.10.13 # pydantic v1 works better for ray | ||
posthog==3.1.0 | ||
sentry-sdk==1.39.1 | ||
# ray==2.8.1 | ||
# newrelic==9.3.0 |