-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathconfig_template.yaml
79 lines (59 loc) · 2.58 KB
/
config_template.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
---
#############################
#### REQUIRED PARAMETERS ####
#############################
# All paths are relative to the current working directory unless noted otherwise
samples: path/to/samples_table.tsv
#### GENOME RESOURCES #####
# All genome resources have to match the source/organism
# of all samples in the sample table
genome_file: path/to/gzipped/ensembl/genome.fa.gz
gtf_file: path/to/gzipped/ensembl/gene_annotations.gtf.gz
mirna_file: path/to/unzipped/mirbase/mirna_annotations.gff3
bed_file: path/to/pileups/genomic_regions.bed
# Tab-separated mappings table between UCSC (column 1)
# and Ensembl (coulm 2) chromosome names
# Available at: https://github.com/dpryan79/ChromosomeMappings
map_chr_file: path/to/ucsc_ensembl_mappings.tsv
###############################
#### "OPTIONAL" PARAMETERS ####
###############################
# The below parameters only need to be changed if the default behavior of
# MIRFLOWZ is to be changed; however, they still need to be present!
#### DIRECTORIES ####
output_dir: results/
pileups_dir: results/pileups
intermediates_dir: results/intermediates
local_log: logs/local/
cluster_log: logs/cluster/
scripts_dir: ../scripts/
#### PROCESSING PARAMETERS ####
# annotation modifications
extension: 6 # extension of the mature miRNA start and end coordinates in bp
# quality filter
q_value: 10 # Q (Phred) score; minimum quality score to keep
p_value: 50 # minimum % of bases that must have Q quality
# adapter removal
error_rate: 0.1 # fraction of allowed errors
minimum_length: 15 # discard processed reads shorter than the indicated length
overlap: 3 # minimum overlap length of adapter and read to trim the bases
max_n: 0 # discard reads containing more than the indicated number of N bases
# mapping
max_length_reads: 30 # maximum length of processed reads to map with oligomap
nh: 100 # discard reads with more mappings than the indicated number
#### QUANTIFICATION PARAMETERS ####
# Types of miRNAs to quantify
# Remove miRNA types you are not interested in.
# If 'isomir' and 'mirna' are both in the list, a single table with both types
# is made.
mir_list: ['isomir', 'mirna', 'pri-mir']
#### ASCII-STYLE ALIGNMENT PILEUPS PARAMETERS ####
# Dictionary with the list of library names to aggregate when performing the
# pileups as values and the condition as keys. Library names must match the
# ones in the samples table `sample` column. The dictionary keys will be used
# as the pileup's output directory name.
# e.g. lib_dict: {"group_A": ["lib_1", "lib_3"], "group_B": ["lib_2"]}
#
# Leave as an empty dictionary if no pileups are desired.
lib_dict: {}
...