nf-core_modules/modules/csvtk/split/main.nf
SusiJo ad46010385
Added new module csvtk/split (#1014)
* added module csvtk/split

* removed todo statement

* adjusted meta map names

* changed tests to use generic input files

* added module in pytest

* updated test-data paths

* Apply suggestions from code review

Co-authored-by: Harshil Patel <drpatelh@users.noreply.github.com>
2021-11-15 18:29:55 +00:00

50 lines
1.8 KiB
Text

// Import generic module functions
include { initOptions; saveFiles; getSoftwareName; getProcessName } from './functions'
params.options = [:]
options = initOptions(params.options)
process CSVTK_SPLIT {
tag "$meta.id"
label 'process_low'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:params.options, publish_dir:getSoftwareName(task.process), meta:meta, publish_by_meta:['id']) }
conda (params.enable_conda ? "bioconda::csvtk=0.23.0" : null)
if (workflow.containerEngine == 'singularity' && !params.singularity_pull_docker_container) {
container "https://depot.galaxyproject.org/singularity/csvtk:0.23.0--h9ee0642_0"
} else {
container "quay.io/biocontainers/csvtk:0.23.0--h9ee0642_0"
}
input:
tuple val(meta), path(csv)
val in_format
val out_format
output:
tuple val(meta), path("*.${out_extension}"), emit: split_csv
path "versions.yml" , emit: versions
script:
def prefix = options.suffix ? "${meta.id}${options.suffix}" : "${meta.id}"
def delimiter = in_format == "tsv" ? "--tabs" : (in_format == "csv" ? "--delimiter ',' " : in_format)
def out_delimiter = out_format == "tsv" ? "--out-tabs" : (out_format == "csv" ? "--out-delimiter ',' " : out_format)
out_extension = out_format == "tsv" ? 'tsv' : 'csv'
"""
sed -i.bak '/^##/d' $csv
csvtk \\
split \\
$options.args \\
--num-cpus $task.cpus \\
$delimiter \\
$out_delimiter \\
$csv
cat <<-END_VERSIONS > versions.yml
${getProcessName(task.process)}:
${getSoftwareName(task.process)}: \$(echo \$( csvtk version | sed -e 's/csvtk v//g' ))
END_VERSIONS
"""
}