2021-10-29 17:21:34 +01:00
|
|
|
// Runs `gatk GenomicsDBImport` in one of three modes, selected by the value inputs:
//   * default (both flags false): create a new GenomicsDB workspace named `${prefix}`
//     from the supplied VCFs (or from a sample-name map when `input_map` is true).
//   * run_intlist:      write `${prefix}.interval_list` from the existing workspace `wspace`.
//   * run_updatewspace: add the supplied VCFs to the existing workspace `wspace`.
// If both flags are true, the run_updatewspace settings override the run_intlist
// ones for the workspace and interval arguments (the input arguments stay empty).
process GATK4_GENOMICSDBIMPORT {
    tag "$meta.id"
    label 'process_low'

    conda (params.enable_conda ? "bioconda::gatk4=4.2.5.0" : null)
    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
        'https://depot.galaxyproject.org/singularity/gatk4:4.2.5.0--hdfd78af_0' :
        'quay.io/biocontainers/gatk4:4.2.5.0--hdfd78af_0' }"

    input:
    // meta         : map; meta.id is used as the tag and the default prefix
    // vcf          : list of VCFs, or (when input_map is true) a list whose first element is the sample-name map
    // tbi          : index files staged alongside the VCFs (not referenced in the command)
    // intervalfile : interval file passed to -L; takes precedence over intervalval when set
    // intervalval  : interval string passed to -L when no intervalfile is given
    // wspace       : existing workspace, used only by run_intlist / run_updatewspace
    tuple val(meta), path(vcf), path(tbi), path(intervalfile), val(intervalval), path(wspace)
    val run_intlist
    val run_updatewspace
    val input_map

    output:
    tuple val(meta), path("${prefix}")      , optional:true, emit: genomicsdb
    tuple val(meta), path("$updated_db")    , optional:true, emit: updatedb
    tuple val(meta), path("*.interval_list"), optional:true, emit: intervallist
    path "versions.yml"                     , emit: versions

    when:
    task.ext.when == null || task.ext.when

    script:
    def args = task.ext.args ?: ''
    // `prefix` and `updated_db` are deliberately declared without `def` so that
    // they remain visible to the output declarations above.
    prefix = task.ext.prefix ?: "${meta.id}"

    // Always define updated_db: the `updatedb` output references it in every mode,
    // but only update mode has a workspace to emit. An empty value lets the optional
    // output resolve to nothing instead of hitting an undefined variable.
    updated_db = ''

    // settings for running default create gendb mode
    inputs_command = input_map ? "--sample-name-map ${vcf[0]}" : "${'-V ' + vcf.join(' -V ')}"
    dir_command = "--genomicsdb-workspace-path ${prefix}"
    intervals_command = intervalfile ? " -L ${intervalfile} " : " -L ${intervalval} "

    // settings changed for running get intervals list mode if run_intlist is true
    if (run_intlist) {
        inputs_command = ''
        dir_command = "--genomicsdb-update-workspace-path ${wspace}"
        intervals_command = "--output-interval-list-to-file ${prefix}.interval_list"
    }

    // settings changed for running update gendb mode. inputs_command same as default, update_db forces module to emit the updated gendb
    if (run_updatewspace) {
        dir_command = "--genomicsdb-update-workspace-path ${wspace}"
        intervals_command = ''
        updated_db = wspace.toString()
    }

    // Java heap size in GB: use the task's memory request when one is set, otherwise fall back to 3.
    def avail_mem = 3
    if (!task.memory) {
        log.info '[GATK GenomicsDBImport] Available memory not known - defaulting to 3GB. Specify process memory requirements to change this.'
    } else {
        avail_mem = task.memory.giga
    }
    """
    gatk --java-options "-Xmx${avail_mem}g" GenomicsDBImport \\
        $inputs_command \\
        $dir_command \\
        $intervals_command \\
        $args

    cat <<-END_VERSIONS > versions.yml
    "${task.process}":
        gatk4: \$(echo \$(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*\$//')
    END_VERSIONS
    """
}
|