Skip to content

Commit 02dfe36

Browse files
author
weichan
committed
small adjustments
1 parent 97d3993 commit 02dfe36

File tree

5 files changed

+27
-16
lines changed

5 files changed

+27
-16
lines changed

config/config_CD19_28z.yml

Lines changed: 17 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# Long-read data
2-
experiment: "28z"
2+
experiment: "28z_with_mod"
33
samples:
44
MK028_28z: "/home/weichan/permanent/Projects/VIS/Data/VIS_MPX_pooled/VIS_MPX_MK028_28z_pooled.bam"
55
MK014_28z: "/home/weichan/permanent/Projects/VIS/Data/VIS_MPX_pooled/VIS_MPX_MK014_28z_pooled.bam"
@@ -27,26 +27,30 @@ ref_genome_ctrl: "/home/weichan/permanent/Projects/VIS/Data/VIS_Magdeburg_withBa
2727
#ucsc_H3K27Ac: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_LayeredH3K27Ac_02_24"
2828
#ucsc_H3K4Me3: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_LayeredH3K4Me3_02_24"
2929
#ucsc_DNaseH: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_DNaseClusters_02_24_cut"
30-
ucsc_TF: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_TFClusters_processed.bed"
30+
annotate_ucsc_tf: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_TFClusters_processed.bed"
3131
#annotation_1: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODEV44_processed.bed"
32-
annotation_1: "/home/weichan/permanent/Projects/VIS/dev/UCSC/new_UCSC_GENCODEV44_processed.bed"
32+
annotate_gencode: "/home/weichan/permanent/Projects/VIS/dev/UCSC/new_UCSC_GENCODEV44_processed.bed"
3333
#ucsc_Genes_gtf: "/home/weichan/permanent/Projects/VIS/dev/UCSC/gencode.v44.annotation.gtf"
3434
#ucsc exons
35-
ucsc_exons: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE_V44_Exons"
36-
ucsc_introns: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE_V44_Introns"
35+
annotate_ucsc_exons: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE_V44_Exons"
36+
annotate_ucsc_introns: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE_V44_Introns"
37+
#promoters
38+
annotate_ucsc_promoter: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_Promoters_EPDnew"
39+
#enhancer
40+
annotate_ucsc_enhancer: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_VISTA_Enhancer_02_2025.bed"
41+
#enhancer fantom5
42+
annotate_fantom5_enhancer: "/home/weichan/permanent/Projects/VIS/dev/FANTOM5/F5.hg38.enhancers.bed"
3743
#sedb
3844
#sedb_cd4: "/home/weichan/permanent/Projects/VIS/dev/SEdb/sedb_cd4_closest_gene.bed"
3945
#sedb_cd8: "/home/weichan/permanent/Projects/VIS/dev/SEdb/sedb_cd8_closest_gene.bed"
4046
#tss
4147
#ucsc_tss: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_TSS_peaks_processed_sorted.bed"
4248
#miRNA
43-
#ucsc_mirna: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_miRNA_processed_sorted.bed"
49+
annotate_ucsc_mirna: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_miRNA_processed_sorted.bed"
4450
#cancer genes
45-
cosmic_genes: "/home/weichan/permanent/Projects/VIS/dev/COSMIC/Cosmic_CancerGeneCensus_Tsv_v101_GRCh38/Cosmic_CancerGeneCensus_v101_GRCh38_processed.bed"
46-
#promoters
47-
ucsc_promoter: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_Promoters_EPDnew"
51+
annotate_cosmic_genes: "/home/weichan/permanent/Projects/VIS/dev/COSMIC/Cosmic_CancerGeneCensus_Tsv_v101_GRCh38/Cosmic_CancerGeneCensus_v101_GRCh38_processed.bed"
4852
#hiC
49-
encode_hic: "/home/weichan/permanent/Projects/VIS/dev/ENCODE/HiC_Tcells/HiC_processed.bed"
53+
annotate_encode_hic: "/home/weichan/permanent/Projects/VIS/dev/ENCODE/HiC_Tcells/HiC_processed.bed"
5054
#VIS detection
5155
detection: "rules/detection.smk"
5256
#qc rule collection
@@ -61,3 +65,6 @@ downstream: "rules/downstream.smk"
6165
#epigenetics: "rules/epigenetics.smk"
6266
#variants rule collection WIP
6367
#variants: "rules/variants.smk"
68+
base_modifications: "rules/base_modifications.smk"
69+
plot_functional_genomics: "rules/plot_functional_genomics.smk"
70+
threads: 10

config/config_CD19_BBz.yml

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# Long-read data
2-
experiment: "annotation_test_cmod"
2+
experiment: "BBz_with_mod"
33
samples:
44
MK028_BBz: "/home/weichan/permanent/Projects/VIS/Data/VIS_MPX_pooled/VIS_MPX_MK028_BBz_pooled.bam"
55
MK014_BBz: "/home/weichan/permanent/Projects/VIS/Data/VIS_MPX_pooled/VIS_MPX_MK014_BBz_pooled.bam"
@@ -36,6 +36,10 @@ annotate_ucsc_exons: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE
3636
annotate_ucsc_introns: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_GENCODE_V44_Introns"
3737
#promoters
3838
annotate_ucsc_promoter: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_Promoters_EPDnew"
39+
#enhancer fantom5
40+
annotate_fantom5_enhancer: "/home/weichan/permanent/Projects/VIS/dev/FANTOM5/F5.hg38.enhancers.bed"
41+
#enhancer refTSS
42+
annotate_refTSS_tss: "/home/weichan/permanent/Projects/VIS/dev/refTSS/refTSS_v4.1_human_coordinate.hg38.bed"
3943
#enhancer
4044
annotate_ucsc_enhancer: "/home/weichan/permanent/Projects/VIS/dev/UCSC/UCSC_VISTA_Enhancer_02_2025.bed"
4145
#sedb

workflow/Snakefile

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,9 +3,9 @@ import os
33
from pathlib import Path
44

55
env_name = os.getenv('CONDA_DEFAULT_ENV')
6-
print(f"Current environment (should be either 'VIS_minimal' or 'VIS_full'): {env_name}")
6+
#print(f"Current environment (should be either 'VIS_minimal' or 'VIS_full'): {env_name}")
77

8-
CONFIG = "config/config_CD19_BBz.yml"
8+
CONFIG = "config/config_CD19_28z.yml"
99
configfile: CONFIG
1010
#SRC=config["source_dir"] #only in use for r script scirp, will be removed sooner or later
1111
SAMPLES = expand(config["samples"])
@@ -65,4 +65,4 @@ rule all:
6565
#expand(f"{outdir}/intermediate/blastn/Filtered_Annotated_{fragmentsize}_InsertionMatches_{{sample}}.gff", sample=SAMPLES),
6666
#expand(f"{outdir}/final/functional_genomics/localization/{fragmentsize}_{{sample}}", sample=SAMPLES),
6767
# for msa
68-
#expand(f"{outdir}/intermediate/fasta/Inserted_sequence_{{sample}}.fa", sample=SAMPLES)
68+
#expand(f"{outdir}/intermediate/fasta/Inserted_sequence_{{sample}}.fa", sample=SAMPLES)

workflow/rules/base_modifications.smk

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ rule readnames_final:
2626
rule only_keep_filtered_insertions:
2727
input:
2828
isobam=f"{outdir}/intermediate/mapping/Precut_{{sample}}_sorted.bam",
29-
readnames=f"{outdir}/intermediate/cmod/final_insertion_readnames_{{sample}}.txt"
29+
readnames=f"{outdir}/intermediate/base_modifications/final_insertion_readnames_{{sample}}.txt"
3030
log:
3131
log=f"{outdir}/intermediate/log/base_modifications/only_keep_filtered_insertions/{{sample}}.log"
3232
output:

workflow/rules/functional_genomics.smk

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ rule calc_distance_to_elements:
3535
output:
3636
f"{outdir}/final/functional_genomics/Functional_distances_to_Insertions_{{sample}}.bed"
3737
run:
38-
vhf.calculate_element_distance(input.insertions, output[0], log.log, params.annotation_files)
38+
vhf_fg.calculate_element_distance(input.insertions, output[0], log.log, params.annotation_files)
3939

4040
#kinda 'hacky' solution for flexibility: Now it does not matter if one annotation or 20 are defined.
4141
rule annotation_overlap_insertion:

0 commit comments

Comments
 (0)