Update biencoder example config to use a Hugging Face dataset

oliverholworthy · oliverholworthy · commit a68425747ceb · 2026-02-25T22:03:01.000Z
Signed-off-by: Oliver Holworthy <1216955+oliverholworthy@users.noreply.github.com>
diff --git a/examples/biencoder/llama3_2_1b_biencoder.yaml b/examples/biencoder/llama3_2_1b_biencoder.yaml
@@ -53,9 +53,7 @@ dataloader:
   dataset:
     _target_: nemo_automodel.components.datasets.llm.make_retrieval_dataset
     data_dir_list:
-      - /adasif/retriever_models_research/training_datasets/nqsh_shuffled_50k.json
-      - /adasif/retriever_models_research/training_datasets/mldr_en_perc95_small.json
-      - /adasif/retriever_models_research/training_datasets/miracl_train_es_llama3_1b_4m_512len.json
+      - hf://nvidia/embed-nemotron-dataset-v1/FEVER
     data_type: train
     train_n_passages: 5
     eval_negative_size: 4