/*
 * SCRAMBLE_CLUSTERIDENTIFIER
 *
 * Runs scramble's `cluster_identifier` on one alignment file and captures its
 * standard output in `<prefix>.clusters.txt`.
 *
 * Inputs:
 *   meta        - sample metadata map; `meta.id` is used for the task tag and
 *                 as the default output prefix.
 *   input       - alignment file handed to `cluster_identifier`.
 *   input_index - index for `input`; it is only staged next to the input and
 *                 is never named on the command line.
 *   fasta       - optional reference FASTA. When supplied, an md5-keyed
 *                 reference cache is built from it and exposed via REF_PATH
 *                 (see the note in the script section). Pass `[]` to skip.
 *
 * Outputs:
 *   clusters - tuple of meta and the `*.clusters.txt` file.
 *   versions - `versions.yml` recording the (hard-coded) scramble version.
 */
process SCRAMBLE_CLUSTERIDENTIFIER {
    tag "$meta.id"
    label 'process_single'

    conda (params.enable_conda ? "bioconda::scramble=1.0.1" : null)
    // NOTE(review): image tags follow the biocontainers naming for the
    // bioconda scramble 1.0.1 package; confirm the build hash against the
    // registry before releasing.
    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
        'https://depot.galaxyproject.org/singularity/scramble:1.0.1--h779adbc_1':
        'quay.io/biocontainers/scramble:1.0.1--h779adbc_1' }"

    input:
    tuple val(meta), path(input), path(input_index)
    path fasta

    output:
    tuple val(meta), path("*.clusters.txt") , emit: clusters
    path "versions.yml"                     , emit: versions

    when:
    task.ext.when == null || task.ext.when

    script:
    def args = task.ext.args ?: ''
    def prefix = task.ext.prefix ?: "${meta.id}"
    def VERSION = '1.0.1' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.

    // The tool offers no way to specify the reference file when given CRAM input.
    // It only looks in the CRAM header for the location of the reference, and that
    // location often cannot be fetched because most test data was created on
    // another machine. As a workaround, an md5 cache of the supplied fasta is built
    // and exposed through the REF_PATH environment variable, so the tool resolves
    // the correct reference.
    // This limitation has been reported on the upstream scramble issue tracker.
    // The reference code below is a placeholder until that issue is fixed.
    //
    // The commands are chained with `&&`, so a failed download leaves REF_PATH
    // unset instead of exporting a path to an empty cache.
    def reference = fasta ? "wget https://raw.githubusercontent.com/samtools/samtools/master/misc/seq_cache_populate.pl && perl seq_cache_populate.pl -root ./md5_ref ${fasta} && export REF_PATH=`pwd`/md5_ref/%2s/%2s/%s" : ""
    """
    ${reference}

    cluster_identifier \\
        ${args} \\
        ${input} \\
        > ${prefix}.clusters.txt

    cat <<-END_VERSIONS > versions.yml
    "${task.process}":
        scramble: ${VERSION}
    END_VERSIONS
    """
}