Skip to content

Commit ec55ad9

Browse files
committed
Update filtered list for rft healthbench
1 parent 774578d commit ec55ad9

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

examples/fine-tuned_qa/reinforcement_finetuning_healthbench.ipynb

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -144,7 +144,7 @@
144 144
},
145 145
{
146 146
"cell_type": "code",
147-
"execution_count": 19,
147+
"execution_count": 4,
148 148
"id": "4f02e651",
149 149
"metadata": {},
150 150
"outputs": [],
@@ -191,7 +191,7 @@
191 191
"\n",
192 192
"# Only include examples that have been pre-filtered to make the RFT job simple to run and evaluate\n",
193 193
"filter_indices = set(\n",
194-
" [0, 1, 2, 7, 8, 9, 10, 12, 15, 20, 21, 25, 26, 27, 30, 33, 35, 38, 39, 41, 44, 45, 47, 49, 50]\n",
194+
" [0, 1, 2, 7, 8, 9, 10, 12, 15, 20, 21, 26, 27, 30, 35, 38, 39, 41, 44, 45, 47, 49, 50]\n",
195 195
")\n",
196 196
"filtered_data = []\n",
197 197
"for i, datapoint in enumerate(data):\n",
@@ -272,15 +272,15 @@
272 272
},
273 273
{
274 274
"cell_type": "code",
275-
"execution_count": 7,
275+
"execution_count": 18,
276 276
"id": "07c3f15f",
277 277
"metadata": {},
278 278
"outputs": [],
279 279
"source": [
280 280
"# Split data\n",
281 281
"train_datapoints = [{\"messages\": data[\"prompt\"][1:]} for data in filtered_data][:12]\n",
282-
"val_datapoints = [{\"messages\": data[\"prompt\"][1:]} for data in filtered_data][12:22]\n",
283-
"test_datapoints = [{\"messages\": data[\"prompt\"][1:], \"completion\": data[\"completion\"]} for data in filtered_data][22:]\n",
282+
"val_datapoints = [{\"messages\": data[\"prompt\"][1:]} for data in filtered_data][12:20]\n",
283+
"test_datapoints = [{\"messages\": data[\"prompt\"][1:], \"completion\": data[\"completion\"]} for data in filtered_data][20:]\n",
284 284
"\n",
285 285
"# Write to files\n",
286 286
"train_path = 'local_cache/rft_train.jsonl'\n",

0 commit comments

Comments
 (0)