From 94f7fb42643233c9adcbd16a47cf03a5cf8a126f Mon Sep 17 00:00:00 2001 From: jonbrenas <51911846+jonbrenas@users.noreply.github.com> Date: Wed, 8 Jan 2025 16:41:47 +0100 Subject: [PATCH] First prototype --- malariagen_data/anoph/base_params.py | 9 +++++++++ malariagen_data/anoph/pca.py | 2 +- 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/malariagen_data/anoph/base_params.py b/malariagen_data/anoph/base_params.py index 87e7a704e..c338c00b4 100644 --- a/malariagen_data/anoph/base_params.py +++ b/malariagen_data/anoph/base_params.py @@ -10,6 +10,8 @@ single_contig_param_type, single_region_param_type, chunks_param_type, + zarr_chunks_type, + dask_chunks_type, ) contig: TypeAlias = Annotated[ @@ -256,6 +258,13 @@ def validate_sample_selection_params( # amounts of data. native_chunks: chunks = "native" + +def call_chunks_func(zarr_chunks: zarr_chunks_type) -> dask_chunks_type: + return tuple([10 * i for i in zarr_chunks]) + + +call_chunks: chunks = call_chunks_func + gff_attributes: TypeAlias = Annotated[ Optional[Union[Sequence[str], str]], """ diff --git a/malariagen_data/anoph/pca.py b/malariagen_data/anoph/pca.py index 18cd0bdb3..7f2e0012d 100644 --- a/malariagen_data/anoph/pca.py +++ b/malariagen_data/anoph/pca.py @@ -76,7 +76,7 @@ def pca( fit_exclude_samples: Optional[base_params.samples] = None, random_seed: base_params.random_seed = 42, inline_array: base_params.inline_array = base_params.inline_array_default, - chunks: base_params.chunks = base_params.native_chunks, + chunks: base_params.chunks = base_params.call_chunks, ) -> Tuple[pca_params.df_pca, pca_params.evr]: # Change this name if you ever change the behaviour of this function, to # invalidate any previously cached data.