Skip to content

Commit ed2af51

Browse files
committed
update the chunk size
1 parent 3bf5f57 commit ed2af51

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

scrapegraphai/nodes/parse_node.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -74,24 +74,24 @@ def execute(self, state: dict) -> dict:
7474
docs_transformed = docs_transformed[0]
7575

7676
chunks = chunk(text=docs_transformed.page_content,
77-
chunk_size= self.node_config.get("chunk_size", 4096),
77+
chunk_size= self.node_config.get("chunk_size", 4096)-250,
7878
token_counter=lambda x: len(x.split()),
7979
memoize=False)
8080
else:
8181
docs_transformed = docs_transformed[0]
8282

8383
if type(docs_transformed) == Document:
8484
chunks = chunk(text=docs_transformed.page_content,
85-
chunk_size= self.node_config.get("chunk_size", 4096),
85+
chunk_size= self.node_config.get("chunk_size", 4096)-250,
8686
token_counter=lambda x: len(x.split()),
8787
memoize=False)
8888
else:
89-
89+
9090
chunks = chunk(text=docs_transformed,
91-
chunk_size= self.node_config.get("chunk_size", 4096),
91+
chunk_size= self.node_config.get("chunk_size", 4096)-250,
9292
token_counter=lambda x: len(x.split()),
9393
memoize=False)
94-
94+
9595
state.update({self.output[0]: chunks})
9696

9797
return state

0 commit comments

Comments
 (0)