Skip to content

Commit 91d8166

Browse files
committed
add pdf marker loader support
1 parent 06939ec commit 91d8166

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

bcorag/bcorag.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@
1818
from llama_index.core.node_parser import SemanticSplitterNodeParser
1919
from llama_index.readers.github import GithubRepositoryReader, GithubClient # type: ignore
2020
from llama_index.readers.file import PDFReader # type: ignore
21+
from llama_index.readers.pdf_marker import PDFMarkerReader # type: ignore
2122
from llama_index.core.postprocessor import SentenceTransformerRerank
2223
from dotenv import load_dotenv
2324
import tiktoken
@@ -220,6 +221,9 @@ def __init__(
220221
# pdf_loader = download_loader("PDFReader")
221222
pdf_loader = PDFReader()
222223
paper_documents = pdf_loader.load_data(file=Path(self._file_path))
224+
case "PDFMarker":
225+
pdf_loader = PDFMarkerReader()
226+
paper_documents = pdf_loader.load_data(file=Path(self._file_path))
223227

224228
documents = paper_documents # type: ignore
225229
if self._git_data is not None:

0 commit comments

Comments
 (0)