From 44749dd3a520d949b3ec1967b0370d74a6a57bda Mon Sep 17 00:00:00 2001 From: riasc Date: Thu, 20 Jun 2024 22:02:53 -0500 Subject: [PATCH] catch errors when rnaseq is not provided (exitron/altsplicing calling) and add reference genome index as input for indel calling (htcaller) --- workflow/rules/common.smk | 17 +++++++++++------ workflow/rules/germline.smk | 3 ++- 2 files changed, 13 insertions(+), 7 deletions(-) diff --git a/workflow/rules/common.smk b/workflow/rules/common.smk index 75ec9a5..9a2a295 100644 --- a/workflow/rules/common.smk +++ b/workflow/rules/common.smk @@ -124,6 +124,7 @@ def all_identical(l): # load up the config config['data'] = data_structure(config['data']) +print(config) ########### PREPROCESSING ########## def get_raw_reads(wildcards): @@ -734,18 +735,22 @@ def get_prioritization_long_indels(wildcards): def get_prioritization_exitrons(wildcards): exitrons = [] if config["exitronsplicing"]["activate"]: - exitrons += expand("results/{sample}/annotation/exitrons.vcf", - sample=config["data"]["name"]) - + if len(config["data"]["rnaseq"]) != 0: + exitrons += expand("results/{sample}/annotation/exitrons.vcf", + sample=config["data"]["name"]) + else: + print('rnaseq data has not been specified in the config file, but exitron calling is activated - skipping...') return exitrons def get_prioritization_altsplicing(wildcards): altsplicing = [] if config["altsplicing"]["activate"]: - altsplicing += expand("results/{sample}/annotation/altsplicing.vcf", - sample=config["data"]["name"]) - + if len(config["data"]["rnaseq"]) != 0: + altsplicing += expand("results/{sample}/annotation/altsplicing.vcf", + sample=config["data"]["name"]) + else: + print('rnaseq data has not been specified in the config file, but alternative splicing calling is activated - skipping...') return altsplicing def get_prioritization_custom(wildcards): diff --git a/workflow/rules/germline.smk b/workflow/rules/germline.smk index 2081405..0cd912f 100644 --- a/workflow/rules/germline.smk +++ b/workflow/rules/germline.smk @@ -73,7 +73,8 @@ rule detect_variants_htc_first_round: input: bam="results/{sample}/{seqtype}/align/{group}_final_BWA_split/{chr}.bam", idx="results/{sample}/{seqtype}/align/{group}_final_BWA_split/{chr}.bam.bai", - ref="resources/refs/genome.fasta" + ref="resources/refs/genome.fasta", + ref_idx="resources/refs/genome.fasta.fai" output: vcf="results/{sample}/{seqtype}/indel/htcaller/{group}_variants.1rd/{chr}.vcf" message: