-
Notifications
You must be signed in to change notification settings - Fork 12
Expand file tree
/
Copy pathdefaults.config
More file actions
211 lines (159 loc) · 6.7 KB
/
defaults.config
File metadata and controls
211 lines (159 loc) · 6.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
/*
Required / Default Parameters.
This parameters must always be set
*/
params {
/*
DB DOWNLOAD WORKFLOW
*/
// Trigger database download and formatting workflow? --> will not run annotation
// Will download and format a database inside {output} parameter
get_dbs = false
force_update = false
get_zenodo_db = false // download pre-built database
/*
ANNOTATION INPUTS
*/
// Input data mus be given inside a well-formated samplesheet.
// We provide a well-formated example at: https://github.com/fmalmeida/test_datasets/raw/main/bacannot_testing_samplesheets/samplesheet.yaml
//
// Please read the example samplesheet so you can understand how to properly fill it.
//
// It is also documented in the main manual: https://bacannot.readthedocs.io/en/latest/samplesheet
input = null
// Enable reads deduplication for assembly? (If input has reads)
enable_deduplication = false
// path to directory containing databases used by bacannot
// you can download databases with:
// nextflow run fmalmeida/bacannot --get_dbs --output bacannot_dbs -profile <docker/conda/singularity>
bacannot_db = null
/*
GENERAL PARAMETERS
*/
// Main output folder name. More than one bacannot annotation can be redirected
// to the same output parameter. It is good to keep related annotations together.
// A subdirectory with the filename will be created inside this directory.
output = 'results'
// Number of minimum overlapping base pairs required for merging
// Negative values, such as -20, means the number of required overlapping bases for merging.
// Positive values, such as 5, means the maximum distance accepted between features for merging.
// By default (if Blank), this process is not executed. For execution the user needs to provide a value
bedtools_merge_distance = null
/*
* Bakta optional
*/
// If user set path to an existing bakta database, the pipeline will use bakta instead of prokka
bakta_db = null
/*
* Prokka optional parameters
*/
// Include comprehensive PGAP hmm database in prokka annotation instead of TIGRFAM.
// PGAP is big and using it may have higher running times but better results
prokka_use_pgap = false
// Annotation mode: Archaea|Bacteria|Mitochondria|Viruses (default 'Bacteria')
prokka_kingdom = null
// Translation table code. Must be set if the above is set.
// Example: params.prokka_genetic.code = 11
prokka_genetic_code = null
// Use rnammer instead of Barrnap? False or True?
prokka_use_rnammer = false
/*
* Resfinder species panel
*/
// Species panel to be used when annotating with Resfinder.
// It sets a default for all samples in the samplesheet.
// If a sample has a different value inside the samplesheet it will overwrite the value for that sample
// If blank it will not be executed.
// It must be identical (without the *) as written in their webservice https://cge.cbs.dtu.dk/services/ResFinder/.
// E.g. 'Escherichia coli'; 'Klebsiella' ...
resfinder_species = null
/*
* Handling the execution of processes
*
* By default, all processes are executed. These
* parameters tells wheter NOT to run a process.
*
* Which means: false will allow its execution
* while true will create a barrier and skip a process.
*/
// (NOT RUN?) Plasmids annotation (controls PlasmidFinder execution)
skip_plasmid_search = false
// (NOT RUN?) General Virulence annotation (controls VFDB and Victors scan)
skip_virulence_search = false
// (NOT RUN?) Resistance annotation (controls AMRfinder and RGI)
skip_resistance_search = false
// (NOT RUN?) ICE annotation (controls ICEberg annotation)
skip_iceberg_search = false
// (NOT RUN?) prophage annotation (controls PHAST and Phigaro)
skip_prophage_search = false
// (NOT RUN?) KO (KEGG Orthology) annotation
skip_kofamscan = false
// (NOT RUN?) antiSMASH (secondary metabolite) annotation
skip_antismash = false
// (NOT RUN?) sourmash
skip_sourmash = false
// (NOT RUN?) integron finder tool
skip_integron_finder = false
// (NOT RUN?) CIRCOS tool
skip_circos = false
/*
* Custom databases can be used to annotate additional genes in the genome.
* It runs a BLAST alignment against the genome, therefore, the custom database
* More than one custom database can be given separated by commas.
* Gene headers must be properly formated as described in the
* documentation: https://bacannot.readthedocs.io/en/latest/custom-db
*/
// Custom fastas (PROT / NUCL)
custom_db = null
// Custom annotation using list of NCBI protein accs
ncbi_proteins = null
/*
* Annotation thresholds to be used when scanning specific databases and features
* Select a combination of thresholds that is meaningful for your data. Some of
* the databases are protein-only, others are nucleotide only. We cannnot control
* that and the databases will be scanned either if blastp or blastn using these
* thresholds described here.
*/
// Identity threshold for plasmid annotation
plasmids_minid = 90
// Coverage threshold for plasmid annotation
plasmids_mincov = 60
// Virulence genes identity threshold
blast_virulence_minid = 90
// Virulence genes coverage threshold
blast_virulence_mincov = 90
// AMR genes identity threshold
blast_resistance_minid= 90
// AMR genes coverage threshold
blast_resistance_mincov = 90
// MGEs (ICEs and Phages) identity threshold
blast_MGEs_minid = 85
// MGEs (ICEs and Phages) coverage threshold
blast_MGEs_mincov = 85
// User's custom database identity threshold
blast_custom_minid = 65
// User's custom database coverage threshold
blast_custom_mincov = 65
/*
* Sourmash configuration
*/
// kmer size (21, 31 or 51)
sourmash_kmer = 31
// scale, e.g. a scale 1000 on a 5Mb genome will generate 5000 hashes
// 1000 is generally recommended by the tool's developers
sourmash_scale = 1000
/*
* Resources allocation configuration
* Defaults only, expecting to be overwritten
*/
// Select versions of bioconda quay.io additional tools
// Tools that are not part of the core of the pipeline,
// but can eventually be used by users
unicycler_version = '0.5.0--py310h6cc9453_3'
flye_version = '2.9--py39h6935b12_1'
bakta_version = '1.7.0--pyhdfd78af_1'
// Max resource options
max_memory = '20.GB'
max_cpus = 16
max_time = '40.h'
}