forked from karel-brinda/MiniPhy
-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.yaml
71 lines (52 loc) Β· 2.02 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
########################
# SNAKEMAKE PARAMETERS #
########################
# (1) Directories for individual stages of the workflow
input_dir: input
intermediate_dir: intermediate
output_dir: output
conda_dir: .conda
# (2) Parameters for Snakemake execution
threads: all # use all available cores
use_conda: True # build conda environments automatically by Snakemake
####################################
# COMPRESSION PROTOCOLS TO INCLUDE #
####################################
# Protocol 1: compr. of genome assemblies
protocol_asm: True
# Protocol 2: compr. of dBGs (w/o k-mer propagation; pre-propagation simplitigs)
protocol_pre: False
# Protocol 3: compr. of dBGs (w/ k-mer propagation; post-propagation simplitigs)
protocol_post: False
############################
# DATA ANALYSES TO INCLUDE #
############################
# Calculate #seqs and their cumulative length
sequence_statistics: True
# Include analyses based on k-mer counts (using JellyFish 2)
kmer_statistics: False
##############
# PARAMETERS #
##############
# (1) General parameters; notes:
# - kmer length defines k for dBGs in Protocols 2 and 3
# - the same k-mer length is used also for k-mer counting (all protocols)
# - converting sequences to upper case is used in Protocol 1
# - if trees_required is true, then the workflow will insist on user-provided trees
kmer_length: 31
asms_to_uppercase: True
trees_required: False
# (2) XZ parameters; notes:
# - best compression is always achieved with 1 thread
# - increasing xz_threads is useful for acceleration, but the files get >2x bigger
# - for all XZ params, see 'man xz'
xz_threads: 1
xz_params: "-9"
# (3) Attotree parameters; notes:
# - sketch size should be at least 10k to achieve a sufficient resolution
attotree_threads: 8
attotree_kmer_length: 21
attotree_sketch_size: 10000
# (4) Jellyfish parameters
jellyfish_threads: 8
jellyfish_size: "40M"