forked from lukfor/pipeline-umi-amplicon
-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.yml
executable file
·53 lines (36 loc) · 1.32 KB
/
config.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# Name of output folder
sample_name: example_egfr_single_read_run
# Input FASTQ files. Can be a (zipped) FASTQ file or a folder containing (zipped) FASTQ files
input_fastq: data/example_egfr_single_cluster.fastq
# Reference genome
reference_fasta: "data/example_egfr_reference.fasta"
# BED file containing intervals with regions that are going to be analysed
targets_bed: data/example_egfr_amplicon.bed
############################
######### Optional #########
############################
#
# Max differences between UMI in read and UMI pattern
umi_errors: 3
# Min number of reads required for a consensus read
min_reads_per_cluster: 20
# Max number of 1D used for a consensus read
max_reads_per_cluster: 60
# Min overlap with target region
min_overlap: 0.90
# Balance forward and reverse 1D reads in clusters
balance_strands: True
# Medaka model used to compute consensus reads
medaka_model: "r941_min_high_g360"
# Forward tail of primer (Ftail...UMI...primer)
fwd_context: "GTATCGTGTAGAGACTGCGTAGG"
# Reverse tail of primer (Rtail...UMI...primer)
rev_context: "AGTGATCGAGTCAGTGCGAGTG"
# Forward UMI (Ftail...UMI...primer)
fwd_umi: "TTTVVVVTTVVVVTTVVVVTTVVVVTTT"
# Reverse UMI (Rtail...UMI...primer)
rev_umi: "AAABBBBAABBBBAABBBBAABBBBAAA"
# Minimum combined UMI length
min_length: 40
# Maximum combined UMI length
max_length: 60