forked from nf-core/sarek
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathnextflow.config
270 lines (237 loc) · 8.39 KB
/
nextflow.config
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
/*
* -------------------------------------------------
* nf-core/sarek Nextflow config file
* -------------------------------------------------
* Default config options for all environments.
*/
// Global default params, used in configs
params {
// Workflow flags
annotateTools = null // Only with --step annotate
genome = 'GRCh38_PGP_UK'
input = null // No default input
noGVCF = null // g.vcf are produced by HaplotypeCaller
noStrelkaBP = null // Strelka will use Manta candidateSmallIndels if available
no_intervals = null // Intervals will be built from the fasta file
skipQC = null // All QC tools are used
step = 'mapping' // Starts with mapping
tools = null // No default Variant Calling or Annotation tools
vepFile = 's3://lifebit-featured-datasets/pipelines/genomechronicler/no_vepFile.txt'
// Workflow settings
annotation_cache = null // Annotation cache disabled
cadd_cache = null // CADD cache disabled
genesplicer = null // genesplicer disabled
markdup_java_options = '"-Xms4000m -Xmx7g"' //Established values for markDuplicate memory consumption, see https://github.com/SciLifeLab/Sarek/pull/689 for details
nucleotidesPerSecond = 1000.0 // Default interval size
split_fastq = null // Fastq files will not be split by default
outdir = './results'
publishDirMode = 'copy' // Default PublishDirMode (same as other nf-core pipelines)
saveGenomeIndex = null // Built Indexes not saved
sequencing_center = null // No sequencing center to be written in BAM header in MapReads process
sentieon = null // Not using Sentieon by default
// Optional files/directory
cadd_InDels = false // No CADD InDels file
cadd_InDels_tbi = false // No CADD InDels index
cadd_WG_SNVs = false // No CADD SNVs file
cadd_WG_SNVs_tbi = false // No CADD SNVs index
pon = false // No default PON (Panel of Normals) file for GATK Mutect2 / Sentieon TNscope
pon_index = false // No default PON index for GATK Mutect2 / Sentieon TNscope
snpEff_cache = null // No directory for snpEff cache
targetBED = false // No default TargetBED file for targeted sequencing
vep_cache = null // No directory for VEP cache
// Custom config
config_profile_contact = false
config_profile_description = false
config_profile_url = false
custom_config_version = 'master'
custom_config_base = "https://raw.githubusercontent.com/nf-core/configs/${params.custom_config_version}"
// Reference genomes
igenomesIgnore = false
igenomes_base = 's3://ngi-igenomes/igenomes/'
// Default
help = false
hostnames = false
monochrome_logs = false // Monochrome logs disabled
multiqc_config = "${baseDir}/assets/multiqc_config.yaml" // Default multiqc config
name = false // No default name
tracedir = "${params.outdir}/pipeline_info"
// email
email = false // No default email
maxMultiqcEmailFileSize = 25.MB
plaintext_email = false // Plaintext email disabled
// Base specifications
cpus = 8
max_cpus = 16
max_memory = 128.GB
max_time = 240.h
max_forks = 96
med_resources_fraction = 0.50
singleCPUMem = 7.GB
bwa_cpus_fraction = 0.6
bwa_cpus = null
sort_cpus = null
// Deprecated params
annotateVCF = null
genomeDict = null
genomeFile = null
genomeIndex = null
noReports = null
sample = null
sampleDir = null
}
// Container slug
// Stable releases should specify release tag (ie: `2.5`)
// Developmental code should specify dev
process.container = 'nfcore/sarek:2.5.2'
process {
withLabel: forks_max {
cpus = {params.max_forks}
maxForks = 96
}
withLabel: cpus_max {
cpus = {params.max_cpus}
maxForks = 2
}
withLabel: memory_max {
memory = {params.max_memory}
}
withLabel: med_resources {
cpus = { alloc_med_resource(params.max_cpus) }
//maxForks = { alloc_med_resource(params.max_forks) }
memory = { alloc_med_resource(params.max_memory) }
}
withName: BaseRecalibratorSpark {
container = "broadinstitute/gatk:4.1.4.0"
maxForks = 64
}
withName: MarkDuplicatesSpark {
container = "broadinstitute/gatk:4.1.3.0"
maxForks = 2
}
withName: RunGenomeChronicler {
container = "lifebitai/genomechronicler:pgp-uk-5513c6f"
}
withName: ApplyBQSRSpark {
container = "broadinstitute/gatk:4.1.4.0"
maxForks = 96
}
withName: HaplotypeCaller {
container = "broadinstitute/gatk:4.1.4.0"
cpus = 1
maxForks = 96
}
withName: Mutect2 {
container = "broadinstitute/gatk:4.1.4.0"
}
withName: PileupSummariesForMutect2 {
container = "broadinstitute/gatk:4.1.4.0"
}
withName: MultiQC {
errorStrategy = 'retry'
maxRetries = 4
}
}
// Load base.config by default for all pipelines
includeConfig 'conf/base.config'
// Load nf-core custom profiles from different Institutions
try {
includeConfig "${params.custom_config_base}/nfcore_custom.config"
} catch (Exception e) {
System.err.println("WARNING: Could not load nf-core/config profiles: ${params.custom_config_base}/nfcore_custom.config")
}
// Load nf-core/sarek custom profiles from different Institutions
try {
includeConfig "${params.custom_config_base}/pipeline/sarek.config"
} catch (Exception e) {
System.err.println("WARNING: Could not load nf-core/config/sarek profiles: ${params.custom_config_base}/pipeline/sarek.config")
}
profiles {
standard { includeConfig 'conf/test.config'
}
conda {
docker.enabled = false
process.conda = "$baseDir/environment.yml"
singularity.enabled = false
}
debug { process.beforeScript = 'echo $HOSTNAME' }
docker {
docker {
enabled = true
fixOwnership = true
runOptions = "-u \$(id -u):\$(id -g)"
}
singularity.enabled = false
}
singularity {
docker.enabled = false
singularity.autoMounts = true
singularity.enabled = true
}
test { includeConfig 'conf/test.config' }
test_annotation { includeConfig 'conf/test_annotation.config' }
test_splitfastq { includeConfig 'conf/test_splitfastq.config' }
test_targeted { includeConfig 'conf/test_targeted.config' }
test_tool { includeConfig 'conf/test_tool.config' }
}
// Load genomes.config or igenomes.config
if (!params.igenomesIgnore) {
includeConfig 'conf/igenomes.config'
} else {
includeConfig 'conf/genomes.config'
}
// Capture exit codes from upstream processes when piping
process.shell = ['/bin/bash', '-euo', 'pipefail']
timeline {
enabled = true
file = "${params.tracedir}/execution_timeline.html"
}
report {
enabled = true
file = "${params.tracedir}/execution_report.html"
}
trace {
enabled = true
file = "${params.tracedir}/execution_trace.txt"
}
dag {
enabled = true
file = "${params.tracedir}/pipeline_dag.svg"
}
manifest {
name = 'nf-core/sarek'
author = 'Maxime Garcia, Szilveszter Juhos'
homePage = 'https://github.com/nf-core/sarek'
description = 'An open-source analysis pipeline to detect germline or somatic variants from whole genome or targeted sequencing'
mainScript = 'main.nf'
nextflowVersion = '>=19.10.0'
version = '2.5.2'
}
// Return the minimum between requirements and a maximum limit to ensure that resource requirements don't go over
def check_resource(obj) {
try {
if (obj.getClass() == nextflow.util.MemoryUnit && obj.compareTo(params.max_memory as nextflow.util.MemoryUnit) == 1)
return params.max_memory as nextflow.util.MemoryUnit
else if (obj.getClass() == nextflow.util.Duration && obj.compareTo(params.max_time as nextflow.util.Duration) == 1)
return params.max_time as nextflow.util.Duration
else if (obj.getClass() == java.lang.Integer)
return Math.min(obj, params.max_cpus as int)
else if (obj.getClass() == java.lang.Integer)
return Math.min(obj, params.max_forks as int)
else
return obj
} catch (all) {
println " ### ERROR ### Max params max_memory:'${params.max_memory}', max_time:'${params.max_time}' or max_cpus:'${params.max_cpus}' is not valid! Using default value: $obj"
}
}
def alloc_med_resource(obj) {
try {
if (obj.getClass() == java.lang.String)
return ( (obj as nextflow.util.MemoryUnit) * (params.med_resources_fraction as float) )
else if (obj.getClass() == java.lang.Integer)
return ( (obj as int) * (params.med_resources_fraction as float) as int)
else
return obj
} catch (all) {
println " ### ERROR ### Max params max_memory:'${params.max_memory}', or max_cpus:'${params.max_cpus}' or max_cpus:'${params.max_forks}' is not valid! Using default value: $obj"
}
}