We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 668b994, commit 7995954 (Copy full SHA for 7995954)
data/generate_sft_verl.py
@@ -2,7 +2,7 @@
2
import argparse
3
from datasets import Dataset, load_dataset
4
from tqdm import tqdm
5
-
+from pprint import pprint
6
7
def make_map_fn(split):
8
def process_fn(example, idx):
@@ -36,5 +36,8 @@ def process_fn(example, idx):
36
# Apply mapping to Verl format
37
dataset = dataset.map(function=make_map_fn(args.split), with_indices=True)
38
39
+ # Pretty preview the first sample
40
os.makedirs(args.output_dir, exist_ok=True)
41
dataset.to_parquet(os.path.join(args.output_dir, f"{args.split}.parquet"))
42
+
43
+ pprint(dataset[0])
0 commit comments