Skip to content

Commit d0eedd5

Browse files
authored
Fix for load_dataset function to restore ability to use custom loading of dataset (#8184)
1 parent 6ee1317 commit d0eedd5

File tree

1 file changed

+10
-10
lines changed

1 file changed

+10
-10
lines changed

swift/dataset/loader.py

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -297,16 +297,6 @@ def load_dataset(
297 297   num_proc = None
298 298   train_datasets = []
299 299   val_datasets = []
300     - loader = DatasetLoader(
301     - num_proc=num_proc,
302     - load_from_cache_file=load_from_cache_file,
303     - streaming=streaming,
304     - hub_token=hub_token,
305     - strict=strict,
306     - download_mode=download_mode,
307     - columns=columns, # columns_mapping
308     - remove_unused_columns=remove_unused_columns,
309     - )
310 300
311 301   use_hf_default = use_hf
312 302   if use_hf_default is None:
@@ -324,6 +314,16 @@ def load_dataset(
324 314   dataset_syntax.dataset = dataset_meta.hf_dataset_id if use_hf else dataset_meta.ms_dataset_id
325 315   else:
326 316   dataset_meta = dataset_syntax.get_dataset_meta(use_hf)
    317 + loader = dataset_meta.loader(
    318 + num_proc=num_proc,
    319 + load_from_cache_file=load_from_cache_file,
    320 + streaming=streaming,
    321 + hub_token=hub_token,
    322 + strict=strict,
    323 + download_mode=download_mode,
    324 + columns=columns, # columns_mapping
    325 + remove_unused_columns=remove_unused_columns,
    326 + )
327 327   train_dataset = loader.load(dataset_syntax, dataset_meta, use_hf=use_hf)
328 328   train_dataset, val_dataset = loader.post_process(
329 329   train_dataset,

0 commit comments

Comments
 (0)