Skip to content

Commit 5ad3ea4

Browse files
committed
s
Signed-off-by: Alexandros Koumparoulis <akoumparouli@nvidia.com>
1 parent d18d802 commit 5ad3ea4

File tree

1 file changed

+11
-17
lines changed

1 file changed

+11
-17
lines changed

tests/unit_tests/datasets/llm/test_retrieval_dataset.py

Lines changed: 11 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -808,24 +808,18 @@ def test_retrieval_dataset_cli_smoke(tmp_path, monkeypatch, capsys):
808 808
assert "Dataset loading completed successfully" in capsys.readouterr().out
809 809

810 810

811-
def test_retrieval_dataset_inline_cli_smoke(tmp_path, monkeypatch, capsys):
811+
def test_retrieval_dataset_inline_smoke(tmp_path):
812 812
f = tmp_path / "inline.jsonl"
813 813
f.write_text(json.dumps({"query": "Q", "pos_doc": "P", "neg_doc": ["N"]}))
814 814

815-
monkeypatch.setattr(
816-
sys,
817-
"argv",
818-
[
819-
"prog",
820-
"--data_dir_list",
821-
str(f),
822-
"--data_type",
823-
"train",
824-
"--train_n_passages",
825-
"2",
826-
"--max_train_samples",
827-
"1",
828-
],
815+
ds = rdi.make_retrieval_dataset(
816+
data_dir_list=str(f),
817+
data_type="train",
818+
train_n_passages=2,
819+
do_shuffle=False,
820+
max_train_samples=1,
829 821
)
830-
runpy.run_module("nemo_automodel.components.datasets.llm.retrieval_dataset_inline", run_name="__main__")
831-
assert "Dataset loading completed successfully" in capsys.readouterr().out
822+
ex = ds[0]
823+
assert ex["question"] == "Q"
824+
assert ex["doc_text"] == ["P", "N"]
825+
assert ex["doc_image"] == ["", ""]

0 commit comments

Comments (0)