-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathconfig.yaml
86 lines (73 loc) · 2.73 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
# workdir must have a directory named "alignments" with each multiple-sequence alignments in a seperate fasta file.
workdir: "datasmall"
# options are ["nuc", "prot"]
chartype: "nuc"
# options are:
# "de-novo": backbone species will be selected using mainlines (see the mainlines_config below)
# "tree": workdir/backbone.nwk is used as the backbone. Therefore genetreeinfer&refine_bb will be skipped
# "list": workdir/species.txt is used as the list of backbone species. therefore mainlines will be skipped. However,
# genetreeinfer&refine will still run to get a backbone tree.
backbone: "de-novo"
resources:
# MBs
large_memory: 16000
# cores used in monolithic tasks such as decompose and prep_backbone_alignments
cores: 4
trim_config:
# sites with less non-gap fraction than below will be removed
percent_nongap: 0.05
mainlines_config:
# target number of taxa
n: 100
# concatenation alignment length
length: 5000
# backbone filtering is recommended if backbone contains misplaced or noisy sequences
backbone_filtering: False
apples_config:
# [FM, OLS]
method: FM
# float. [0-infinity)
filter: 0.2
# integer. [5-infinity)
base: 25
# minimum overlap fraction. Default is 0.001
overlap: 0.05
prep_config:
# cluster must have a minimum diameter
edge_thr: 0.02
# approximate cluster size (no guarantees)
# if "auto", uDance determines the size using standard formula
# Min[Round[8 Sqrt[n] + 3 Sqrt[m], 100], 2500]
# otherwise, this number can be any integer.
cluster_size: "auto"
#cluster_size: 50
# minimum subtree alignment length
sublength: 100
# minimum fragment length
fraglength: 75
# large clusters are pruned. ASTRAL's limit is around 9000 for 400+ genes.
pruneafter: 9000
# experimental. when number of queries landed on a partition are less than or equal to this number
# the partition will be skipped to save running time
min_placements: 0
infer_config:
# [raxml-ng,iqtree,raxml-8]
method: "raxml-8"
# number of starting trees
numstart: 2
# number of starting tree instances that run concurrently
# this number should not exceeed "numstart"
numthread: 1
refine_config:
# contract low support branches threshold. 0.9 for iqtree -abayes
contract: 0.33
# gene occupancy threshold for inclusion
occupancy: 2
# 1D k-means-based (k=2) outlier gene detection parameter. Limit for outlier size fraction.
# Larger clusters cannot be designated as outliers
outlier_sizelimit: 0.2
# 1D k-means-based (k=2) outlier gene detection parameter. Centroid difference must be
# larger than this value to designate the first cluster as outliers.
outlier_difference: 0.1
# Experimental. Infer branch lengths in substitution unit using ASTRAL. [True, False]
infer_branchlen: True