File tree Expand file tree Collapse file tree 11 files changed +1412
-161
lines changed
docs/docs/integrations/document_loaders Expand file tree Collapse file tree 11 files changed +1412
-161
lines changed Load Diff Large diffs are not rendered by default.
Original file line number Diff line number Diff line change @@ -41,7 +41,7 @@ jq>=1.4.1,<2
4141jsonschema>1
4242keybert>=0.8.5
4343langchain_openai>=0.2.1
44- litellm>=1.30,<=1.39.5
44+ litellm>=1.30
4545lxml>=4.9.3,<6.0
4646markdownify>=0.11.6,<0.12
4747motor>=3.3.1,<4
@@ -62,6 +62,7 @@ pandas>=2.0.1,<3
6262pdfminer-six==20231228
6363pdfplumber>=0.11
6464pgvector>=0.1.6,<0.2
65+ pillow>=10.4
6566playwright>=1.48.0,<2
6667praw>=7.7.1,<8
6768premai>=0.3.25,<0.4,!=0.3.100
@@ -74,6 +75,7 @@ pymupdf>=1.22.3,<2
7475pypdf>=3.4.0,<5
7576pypdfium2>=4.10.0,<5
7677pyspark>=3.4.0,<4
78+ py-zerox>=0.0.7
7779rank-bm25>=0.2.2,<0.3
7880rapidfuzz>=3.1.1,<4
7981rapidocr-onnxruntime>=1.3.2,<2
Original file line number Diff line number Diff line change 360360 PyPDFium2Loader ,
361361 PyPDFLoader ,
362362 UnstructuredPDFLoader ,
363+ ZeroxPDFLoader ,
363364 )
364365 from langchain_community .document_loaders .pebblo import (
365366 PebbloSafeLoader ,
732733 "YoutubeAudioLoader" : "langchain_community.document_loaders.blob_loaders" ,
733734 "YoutubeLoader" : "langchain_community.document_loaders.youtube" ,
734735 "YuqueLoader" : "langchain_community.document_loaders.yuque" ,
736+ "ZeroxPDFLoader" : "langchain_community.document_loaders.pdf" ,
735737}
736738
737739
@@ -940,4 +942,5 @@ def __getattr__(name: str) -> Any:
940942 "YoutubeAudioLoader" ,
941943 "YoutubeLoader" ,
942944 "YuqueLoader" ,
945+ "ZeroxPDFLoader" ,
943946]
Original file line number Diff line number Diff line change 3232 PyMuPDFParser ,
3333 PyPDFium2Parser ,
3434 PyPDFParser ,
35+ ZeroxPDFParser ,
3536 )
3637 from langchain_community .document_loaders .parsers .vsdx import (
3738 VsdxParser ,
5556 "RapidOCRBlobParser" : "langchain_community.document_loaders.parsers.images" ,
5657 "TesseractBlobParser" : "langchain_community.document_loaders.parsers.images" ,
5758 "VsdxParser" : "langchain_community.document_loaders.parsers.vsdx" ,
59+ "ZeroxPDFParser" : "langchain_community.document_loaders.parsers.pdf" ,
5860}
5961
6062
@@ -82,4 +84,5 @@ def __getattr__(name: str) -> Any:
8284 "RapidOCRBlobParser" ,
8385 "TesseractBlobParser" ,
8486 "VsdxParser" ,
87+ "ZeroxPDFParser" ,
8588]
You can’t perform that action at this time.
0 commit comments