@@ -75,15 +75,8 @@ faiss-cpu = "^1.8.0"
7575[tool .poetry .group .processors ]
7676
7777[tool .poetry .group .processors .dependencies ]
78- scrapy = " ^2.11.2"
79- unstructured = {version = " 0.15.0" , python =" >=3.10,<3.13" }
8078google-generativeai = " 0.7.2"
81- scrapy-playwright = {version =" ^0.0.33" }
8279pillow-heif = {version =" ^0.15.0" }
83- opencv-python-headless = {version =" ^4.10.0.84" }
84- unstructured-inference = {version =" ^0.7.23" }
85- unstructured-pytesseract = {version =" ^0.3.12" }
86- python-docx = {version =" ^1.1.0" }
8780cohere = {version =" 5.5.4" }
8881google-cloud-speech = {version =" ^2.26.0" }
8982mysqlclient = {version =" ^2.2.4" }
@@ -93,29 +86,40 @@ pydub = {version = "^0.25.1" }
9386boto3 = {version = " ^1.26.122" }
9487botocore = {version = " ^1.29.122" }
9588yt-dlp = " ^2024.5.27"
96- pdf2image = {version = " ^1.16.3" }
97- pdfminer-six = {version = " ^20221105" }
9889markdown = {version = " ^3.4.4" }
99- python-pptx = {version = " ^0.6.21" }
100- python-magic = {version = " ^0.4.27" }
10190anthropic = " ^0.30.0"
10291pypdf = " ^4.2.0"
10392pikepdf = " ^9.0.0"
104- llama-index-readers-file = " 0.1.30"
105- llama-index-vector-stores-chroma = " ^0.1.10"
10693websockets = " ^12.0"
107- chromadb = " ^0.5.3"
10894pynacl = " ^1.5.0"
109- llama-index-core = " ^0.10.51"
11095beautifulsoup4 = {version = " ^4.12.2" }
11196sqlalchemy = " ^2.0.31"
11297websockify = " ^0.12.0"
113- spacy = " ^3.7.5"
98+ playwright = " 1.45.0"
99+
100+ [tool .poetry .group .data ]
101+
102+ [tool .poetry .group .data .dependencies ]
103+ chromadb = " ^0.5.3"
104+ llama-index-readers-file = " 0.1.30"
105+ llama-index-vector-stores-chroma = " ^0.1.10"
106+ llama-index-core = " ^0.10.51"
114107llama-index-vector-stores-pinecone = {version =" ^0.1.8" , python =" >=3.10,<3.13" }
115108llama-index-vector-stores-qdrant = {version =" ^0.2.13" , python =" >=3.10,<3.13" }
116109llama-index-embeddings-azure-openai = " ^0.1.11"
117110llama-index-embeddings-openai = " ^0.1.11"
118- playwright = " 1.45.0"
111+ opencv-python-headless = {version =" ^4.10.0.84" }
112+ pdf2image = {version = " ^1.16.3" }
113+ pdfminer-six = {version = " ^20221105" }
114+ python-docx = {version =" ^1.1.0" }
115+ python-magic = {version = " ^0.4.27" }
116+ python-pptx = {version = " ^0.6.21" }
117+ scrapy = " ^2.11.2"
118+ scrapy-playwright = {version =" ^0.0.33" }
119+ spacy = " ^3.7.5"
120+ unstructured = {version = " 0.15.0" , python =" >=3.10,<3.13" }
121+ unstructured-inference = {version =" ^0.7.23" }
122+ unstructured-pytesseract = {version =" ^0.3.12" }
119123weaviate-client = " ^4.7.1"
120124
121125
0 commit comments