|
| 1 | +import os.path |
| 2 | + |
1 | 3 | import bed_reader
|
2 | 4 | import numpy as np
|
3 | 5 | import numpy.testing as nt
|
@@ -61,6 +63,51 @@ def test_bad_file_type(self, path):
|
61 | 63 | with pytest.raises(ValueError, match="Invalid BED file magic bytes"):
|
62 | 64 | plink.BedReader(path, 1, 1)
|
63 | 65 |
|
@pytest.mark.parametrize(
    ("num_variants", "num_samples"),
    [
        (1, 1),
        (1, 2),
        (1, 3),
        (1, 4),
        (1, 5),
        (1, 6),
        (1, 7),
        (1, 8),
        (1, 9),
        (2, 1),
        (3, 1),
        (10, 1),
        (100, 1),
        (10, 2),
        (10, 3),
        (10, 4),
        (10, 5),
        (20, 20),
        (30, 3),
    ],
)
def test_generated_bed_files(self, tmp_path, num_variants, num_samples):
    """Write a synthetic genotype matrix with bed_reader and decode it back.

    A repeating 0, 1, 2, -127 pattern is laid out over a
    (num_variants, num_samples) grid, written to a temporary BED file,
    and then checked in two ways: the file size on disk, and the
    per-call output of ``plink.BedReader.decode``.
    """
    bed_file = tmp_path / "a_file.bed"

    # Cycle through the four codes in flat order; the fourth code (3) is
    # rewritten to -127 (presumably bed_reader's missing marker - confirm).
    total_calls = num_variants * num_samples
    codes = np.arange(total_calls, dtype=int) % 4
    codes[codes == 3] = -127
    codes = codes.reshape((num_variants, num_samples))

    # to_bed is handed the transpose, i.e. a (num_samples, num_variants) array.
    bed_reader.to_bed(bed_file, codes.T, num_threads=1)

    # Four samples are packed per byte (rounded up) for each variant, and
    # three extra bytes precede the variant data.
    bytes_per_variant = (num_samples + 3) // 4
    assert os.path.getsize(bed_file) == 3 + bytes_per_variant * num_variants

    # Expected decoded pair for every code written above.
    expected_calls = {0: (0, 0), 1: (0, 1), 2: (1, 1), -127: (-1, -1)}
    decoded = plink.BedReader(bed_file, num_variants, num_samples).decode(
        0, num_variants
    )
    assert decoded.shape == (num_variants, num_samples, 2)

    # Visit every (variant, sample) cell in row-major order.
    for cell in np.ndindex(num_variants, num_samples):
        assert expected_calls[codes[cell]] == tuple(decoded[cell])
| 110 | + |
64 | 111 |
|
65 | 112 | class TestSmallExample:
|
66 | 113 | @pytest.fixture(scope="class")
|
|
0 commit comments