-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_calculate_conversion_rate.smk
33 lines (26 loc) · 1.14 KB
/
run_calculate_conversion_rate.smk
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import os
from pathlib import Path
# Directory scanned for per-sample conversion files (the rule inputs).
INPUT_DIR = "/SAN/vyplab/alb_projects/data/4su_full_ward_tdp_kd_ipsc/HISAT3N/"
# Directory that receives the per-sample result tables.
OUTPUT_DIR = "/SAN/vyplab/alb_projects/data/4su_full_ward_tdp_kd_ipsc/HISAT3N_perbase_conv/"
# BED file of regions handed to `tabix -R` by the per-sample rule.
INPUT_BED = "/SAN/vyplab/vyplab_reference_genomes/annotation/human/GRCh38/gencode.v40_all_introns_unique.bed"

# File-name suffix that identifies a conversion file inside INPUT_DIR.
conversion_suffix = '.conversion.fake.bed.gz'

# BED file name without its final extension; embedded in every output name.
basenameBed = Path(INPUT_BED).stem

# One sample per conversion file found in INPUT_DIR.
# Only the trailing suffix is sliced off: str.replace() would also delete an
# occurrence of the suffix text elsewhere in the file name. The list is sorted
# because os.listdir() returns entries in arbitrary order, which would make
# the target list differ between runs.
SAMPLES = sorted(
    file_name[: -len(conversion_suffix)]
    for file_name in os.listdir(INPUT_DIR)
    if file_name.endswith(conversion_suffix)
)
rule all:
input:
expand(OUTPUT_DIR + "{sample}" + "_" + basenameBed + "_perbase_cov.tsv", sample = SAMPLES)
rule calculate_splice_stability:
input:
conversion_file = INPUT_DIR + "{sample}" + conversion_suffix
output:
outputfile = OUTPUT_DIR + "{sample}" + "_" + basenameBed + "_perbase_cov.tsv"
params:
bed = INPUT_BED,
t_out = OUTPUT_DIR + "{sample}" + "_" + basenameBed + "TEMP_perbase_cov.tsv"
shell:
"""
tabix {input.conversion_file}\
-R {params.bed} > {params.t_out}
scripts/rateMawk.sh {params.t_out} {output.outputfile}
rm {params.t_out}
"""