nf-core_modules/modules/gatk4/genomicsdbimport/main.nf
Maxime U. Garcia 409af2f27c
Improve syntax/logic coherence in all gatk4 plugins (#1459)
* feat: code polishing

* Apply suggestions from code review

Co-authored-by: FriederikeHanssen <Friederike.hanssen@qbic.uni-tuebingen.de>

* code polishing

* more code polishing

* code polishing

* tests for applybqsrspark

* fix typo

* no need to check md5sum for versions.yml

* fix: use correct syntax

* code polishing again

* add tests for markduplicatesspark

* simplify mergevcfs tests

* add tests for baserecalibratorspark

* fix: path to entry

* code polishing

* fix linting

* simplify module

* update meta.yml

* fix pair mode

* fix: MITO mode

* more tests

* fix command

* bad copy paste

* fix typos

* fix tests

* fix test

* update meta.yml

* correct versions.yml in all test.yml

* code polishing

* code polishing

* more code polishing

* fix args

* add tmpdir for all

Co-authored-by: FriederikeHanssen <Friederike.hanssen@qbic.uni-tuebingen.de>
2022-04-12 17:15:39 +02:00

67 lines
2.5 KiB
Text

process GATK4_GENOMICSDBIMPORT {
tag "$meta.id"
label 'process_low'
conda (params.enable_conda ? "bioconda::gatk4=4.2.5.0" : null)
container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
'https://depot.galaxyproject.org/singularity/gatk4:4.2.5.0--hdfd78af_0' :
'quay.io/biocontainers/gatk4:4.2.5.0--hdfd78af_0' }"
input:
tuple val(meta), path(vcf), path(tbi), path(interval_file), val(interval_value), path(wspace)
val run_intlist
val run_updatewspace
val input_map
output:
tuple val(meta), path("$prefix") , optional:true, emit: genomicsdb
tuple val(meta), path("$updated_db") , optional:true, emit: updatedb
tuple val(meta), path("*.interval_list"), optional:true, emit: intervallist
path "versions.yml" , emit: versions
when:
task.ext.when == null || task.ext.when
script:
def args = task.ext.args ?: ''
prefix = task.ext.prefix ?: "${meta.id}"
// settings for running default create gendb mode
input_command = input_map ? "--sample-name-map ${vcf[0]}" : vcf.collect(){"--variant $it"}.join(' ')
genomicsdb_command = "--genomicsdb-workspace-path ${prefix}"
interval_command = interval_file ? "--intervals ${interval_file}" : "--intervals ${interval_value}"
// settings changed for running get intervals list mode if run_intlist is true
if (run_intlist) {
genomicsdb_command = "--genomicsdb-update-workspace-path ${wspace}"
interval_command = "--output-interval-list-to-file ${prefix}.interval_list"
}
// settings changed for running update gendb mode. input_command same as default, update_db forces module to emit the updated gendb
if (run_updatewspace) {
genomicsdb_command = "--genomicsdb-update-workspace-path ${wspace}"
interval_command = ''
updated_db = "${wspace}"
}
def avail_mem = 3
if (!task.memory) {
log.info '[GATK GenomicsDBImport] Available memory not known - defaulting to 3GB. Specify process memory requirements to change this.'
} else {
avail_mem = task.memory.giga
}
"""
gatk --java-options "-Xmx${avail_mem}g" GenomicsDBImport \\
$input_command \\
$genomicsdb_command \\
$interval_command \\
--tmp-dir . \\
$args
cat <<-END_VERSIONS > versions.yml
"${task.process}":
gatk4: \$(echo \$(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*\$//')
END_VERSIONS
"""
}