Skip to content

Commit 93469ce

Browse files
authored
Merge pull request #264 from ENCODE-DCC/dev
v2.1.4
2 parents a0e1504 + 3b918b6 commit 93469ce

File tree

53 files changed

+219
-215
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

53 files changed

+219
-215
lines changed

.circleci/config.yml

Lines changed: 9 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ defaults: &defaults
77

88
machine_defaults: &machine_defaults
99
machine:
10-
image: ubuntu-1604:202007-01
10+
image: ubuntu-2004:202010-01
1111
working_directory: ~/chip-seq-pipeline2
1212

1313
make_tag: &make_tag
@@ -16,37 +16,17 @@ make_tag: &make_tag
1616
echo "export TAG=encodedcc/chip-seq-pipeline:${CIRCLE_BRANCH}_${CIRCLE_WORKFLOW_ID}" > ${BASH_ENV}
1717
1818
commands:
19-
download_task_test_data:
20-
description: "Download task test data. This is based on py2 so run this before installing py3."
21-
steps:
22-
- run:
23-
command: |
24-
cd dev/test/test_task/
25-
rm -rf chip-seq-pipeline-test-data
26-
export BOTO_CONFIG=/dev/null
27-
gsutil -m cp -r gs://encode-pipeline-test-samples/encode-chip-seq-pipeline/chip-seq-pipeline-test-data .
28-
2919
install_python3_caper_gcs:
3020
description: "Install py3, caper and gcs. Set py3 as default python."
3121
steps:
3222
- run:
3323
command: |
3424
sudo apt-get update && sudo apt-get install software-properties-common git wget curl -y
25+
sudo apt-get install -y software-properties-common git wget curl python3 python3-pip default-jre
3526
36-
# install java 11
37-
sudo add-apt-repository ppa:openjdk-r/ppa -y
38-
sudo apt-get update && sudo apt-get install openjdk-11-jdk -y
39-
# automatically set 11 as default java
40-
sudo update-java-alternatives -a
41-
42-
sudo add-apt-repository ppa:deadsnakes/ppa -y
43-
sudo apt-get update && sudo apt-get install python3.6 -y
44-
sudo wget --no-check-certificate https://bootstrap.pypa.io/get-pip.py
45-
sudo python3.6 get-pip.py
46-
sudo ln -s /usr/bin/python3.6 /usr/local/bin/python3
47-
48-
pip3 install --upgrade pip
49-
pip3 install caper google-cloud-storage
27+
sudo python3 -m pip install --upgrade pip
28+
sudo pip3 install PyYAML --ignore-installed
29+
sudo pip3 install caper google-cloud-storage
5030
5131
run_workflow_test:
5232
description: "Run workflow test. This requires an env var INPUT as input JSON's basename."
@@ -86,7 +66,7 @@ jobs:
8666
name: build image
8767
command: |
8868
source ${BASH_ENV}
89-
export DOCKER_CACHE_TAG=v1.8.1
69+
export DOCKER_CACHE_TAG=v2.1.0
9070
echo "pulling ${DOCKER_CACHE_TAG}!"
9171
docker pull encodedcc/chip-seq-pipeline:${DOCKER_CACHE_TAG}
9272
docker login -u=${DOCKERHUB_USER} -p=${DOCKERHUB_PASS}
@@ -97,7 +77,6 @@ jobs:
9777
<<: *machine_defaults
9878
steps:
9979
- checkout
100-
- download_task_test_data
10180
- install_python3_caper_gcs
10281
- run: *make_tag
10382
- run:
@@ -106,6 +85,9 @@ jobs:
10685
source ${BASH_ENV}
10786
cd dev/test/test_task/
10887
88+
echo ${GCLOUD_SERVICE_ACCOUNT_SECRET_JSON} > tmp_secret_key.json
89+
export GOOGLE_APPLICATION_CREDENTIALS=$PWD/tmp_secret_key.json
90+
10991
# unittest for wrapper .py
11092
docker run ${TAG} bash -c "cd /software/chip-seq-pipeline/dev/test/test_py/; pytest -vv"
11193

.gitignore

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -125,3 +125,5 @@ tmp_db*
125125
temp_db*
126126

127127
cromwell.out
128+
cromwell.out.*
129+

README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -127,8 +127,8 @@ You cannot use these input JSON files directly. Go to the destination directory
127127
We have a separate project on DNANexus to provide example FASTQs and `genome_tsv` for `hg38` and `mm10` (also chr19-only version of those two. Use chr19-only versions for testing). We recommend to make copies of these directories on your own project.
128128

129129
`genome_tsv`
130-
- AWS: https://platform.dnanexus.com/projects/BKpvFg00VBPV975PgJ6Q03v6/data/pipeline-genome-data/genome_tsv/v3
131-
- Azure: https://platform.dnanexus.com/projects/F6K911Q9xyfgJ36JFzv03Z5J/data/pipeline-genome-data/genome_tsv/v3
130+
- AWS: https://platform.dnanexus.com/projects/BKpvFg00VBPV975PgJ6Q03v6/data/pipeline-genome-data/genome_tsv/v4
131+
- Azure: https://platform.dnanexus.com/projects/F6K911Q9xyfgJ36JFzv03Z5J/data/pipeline-genome-data/genome_tsv/v4
132132

133133
Example FASTQs
134134
- AWS: https://platform.dnanexus.com/projects/BKpvFg00VBPV975PgJ6Q03v6/data/pipeline-test-samples/encode-chip-seq-pipeline/ENCSR000DYI/fastq_subsampled

chip.wdl

Lines changed: 10 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -7,10 +7,10 @@ struct RuntimeEnvironment {
77
}
88

99
workflow chip {
10-
String pipeline_ver = 'v2.1.2'
10+
String pipeline_ver = 'v2.1.4'
1111

1212
meta {
13-
version: 'v2.1.2'
13+
version: 'v2.1.4'
1414

1515
author: 'Jin wook Lee'
1616
@@ -19,8 +19,8 @@ workflow chip {
1919

2020
specification_document: 'https://docs.google.com/document/d/1lG_Rd7fnYgRpSIqrIfuVlAz2dW1VaSQThzk836Db99c/edit?usp=sharing'
2121

22-
default_docker: 'encodedcc/chip-seq-pipeline:v2.1.2'
23-
default_singularity: 'https://encode-pipeline-singularity-image.s3.us-west-2.amazonaws.com/chip-seq-pipeline_v2.1.2.sif'
22+
default_docker: 'encodedcc/chip-seq-pipeline:v2.1.4'
23+
default_singularity: 'https://encode-pipeline-singularity-image.s3.us-west-2.amazonaws.com/chip-seq-pipeline_v2.1.4.sif'
2424
croo_out_def: 'https://storage.googleapis.com/encode-pipeline-output-definition/chip.croo.v5.json'
2525

2626
parameter_group: {
@@ -71,8 +71,8 @@ workflow chip {
7171
}
7272
input {
7373
# group: runtime_environment
74-
String docker = 'encodedcc/chip-seq-pipeline:v2.1.2'
75-
String singularity = 'https://encode-pipeline-singularity-image.s3.us-west-2.amazonaws.com/chip-seq-pipeline_v2.1.2.sif'
74+
String docker = 'encodedcc/chip-seq-pipeline:v2.1.4'
75+
String singularity = 'https://encode-pipeline-singularity-image.s3.us-west-2.amazonaws.com/chip-seq-pipeline_v2.1.4.sif'
7676
String conda = 'encode-chip-seq-pipeline'
7777
String conda_macs2 = 'encode-chip-seq-pipeline-macs2'
7878
String conda_spp = 'encode-chip-seq-pipeline-spp'
@@ -2096,6 +2096,7 @@ workflow chip {
20962096
ctl_paired_ends = ctl_paired_end_,
20972097
pipeline_type = pipeline_type,
20982098
aligner = aligner_,
2099+
no_dup_removal = no_dup_removal,
20992100
peak_caller = peak_caller_,
21002101
cap_num_peak = cap_num_peak_,
21012102
idr_thresh = idr_thresh,
@@ -3046,6 +3047,7 @@ task qc_report {
30463047
Array[Boolean] ctl_paired_ends
30473048
String pipeline_type
30483049
String aligner
3050+
Boolean no_dup_removal
30493051
String peak_caller
30503052
Int cap_num_peak
30513053
Float idr_thresh
@@ -3105,6 +3107,7 @@ task qc_report {
31053107
command {
31063108
set -e
31073109
python3 $(which encode_task_qc_report.py) \
3110+
--pipeline-prefix chip \
31083111
${'--pipeline-ver ' + pipeline_ver} \
31093112
${"--title '" + sub(title,"'","_") + "'"} \
31103113
${"--desc '" + sub(description,"'","_") + "'"} \
@@ -3114,6 +3117,7 @@ task qc_report {
31143117
--ctl-paired-ends ${sep=' ' ctl_paired_ends} \
31153118
--pipeline-type ${pipeline_type} \
31163119
--aligner ${aligner} \
3120+
${if (no_dup_removal) then '--no-dup-removal ' else ''} \
31173121
--peak-caller ${peak_caller} \
31183122
${'--cap-num-peak ' + cap_num_peak} \
31193123
--idr-thresh ${idr_thresh} \
Binary file not shown.
Binary file not shown.
Binary file not shown.

0 commit comments

Comments
 (0)