Skip to content

Commit c710d7c

Browse files
committed
Add script for cloud download of 2021Wu_human_breast_cancer_sc
1 parent 7257e4a commit c710d7c

File tree

1 file changed

+45
-0
lines changed

1 file changed

+45
-0
lines changed
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
#!/bin/bash
2+
3+
# get the root of the directory
4+
REPO_ROOT=$(git rev-parse --show-toplevel)
5+
6+
# ensure that the command below is run from the root of the repository
7+
cd "$REPO_ROOT"
8+
9+
set -e
10+
11+
publish_dir="s3://openproblems-data/resources/datasets"
12+
13+
# Note that the current download script and processing workflow have a specific default parameter set for the given dataset.
14+
# No additional datasets are supported by that component/workflow. Therefore the default parameters are used and don't need
15+
# to be specified here.
16+
17+
cat > /tmp/params.yaml << HERE
18+
param_list:
19+
- id: wu_human_breast_cancer_sc/2021Wu_human_breast_cancer_sc
20+
cancer_subtypes:
21+
- HER2+
22+
- TNBC
23+
- ER+
24+
25+
keep_files: false
26+
27+
output_dataset: "\$id/dataset.h5ad"
28+
output_meta: "\$id/dataset_meta.yaml"
29+
output_state: "\$id/state.yaml"
30+
publish_dir: "$publish_dir"
31+
HERE
32+
33+
tw launch https://github.com/openproblems-bio/task_ist_preprocessing.git \
34+
--revision build/main \
35+
--pull-latest \
36+
--main-script target/nextflow/datasets/workflows/process_wu_human_breast_cancer_sc/main.nf \
37+
--workspace 53907369739130 \
38+
--compute-env 6TeIFgV5OY4pJCk8I0bfOh \
39+
--params-file /tmp/params.yaml \
40+
--config common/nextflow_helpers/labels_tw.config \
41+
--labels datasets,wu_human_breast_cancer_sc
42+
43+
aws s3 sync \
44+
s3://openproblems-data/resources/datasets/wu_human_breast_cancer_sc/2021Wu_human_breast_cancer_sc \
45+
resources/datasets/wu_human_breast_cancer_sc/2021Wu_human_breast_cancer_sc

0 commit comments

Comments
 (0)