Skip to content

Commit 42dc73e

Browse files
fix: remove the schema check before union to avoid Ray's duplicate execution
1 parent c42b604 commit 42dc73e

File tree

1 file changed

+0
-4
lines changed

1 file changed

+0
-4
lines changed

graphgen/engine.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -84,10 +84,6 @@ def _get_input_dataset(
8484

8585
main_ds = self.datasets[deps[0]]
8686
other_dss = [self.datasets[d] for d in deps[1:]]
87-
if not all(ds.schema() == main_ds.schema() for ds in other_dss):
88-
raise ValueError(
89-
f"Union requires all datasets to have the same schema for node {node.id}"
90-
)
9187
return main_ds.union(*other_dss)
9288

9389
def _execute_node(self, node: Node, initial_ds: ray.data.Dataset):

0 commit comments

Comments
 (0)