* -----------------------------------------------------
* Utility functions used in nf-core DSL2 module files
* -----------------------------------------------------
// Extract name of software tool from process name using $task.process.
//
// The process name is split on ':' and the last component is kept (this drops
// any enclosing workflow scopes); that component is split on '_' and its first
// token is returned in lower case, e.g. 'WF:HISAT2_ALIGN' -> 'hisat2'.
def getSoftwareName(task_process) {
    def process_name = task_process.tokenize(':')[-1]
    return process_name.tokenize('_')[0].toLowerCase()
}
// Function to initialise default values and to generate a Groovy Map of
// available options for nf-core modules.
//
// Every key except `publish_files` falls back to a default when it is missing
// or falsy. `publish_files` is copied through unchanged (possibly null) because
// the caller needs to tell "not set" apart from an explicit value.
// A null `args` is treated like an empty map.
def initOptions(Map args) {
    Map given = args ?: [:]
    return [
        args          : given.args ?: '',
        args2         : given.args2 ?: '',
        publish_by_id : given.publish_by_id ?: false,
        publish_dir   : given.publish_dir ?: '',
        publish_files : given.publish_files,
        suffix        : given.suffix ?: ''
    ]
}
// Tidy up and join elements of a list to return a path string.
//
// Null, empty and whitespace-only entries are dropped. Every remaining entry is
// trimmed of surrounding whitespace and of leading AND trailing slashes, then
// the entries are joined with '/'. A leading '/' on the first entry is removed
// as well, so the result never starts with a slash.
def getPathFromList(path_list) {
    // Groovy truth treats both null and '' as false, so null entries are skipped
    // here instead of raising a NullPointerException on a chained `.isEmpty()`.
    def paths = path_list.findAll { item -> item?.trim() }
    paths = paths.collect { it.trim().replaceAll('^/+|/+$', '') }
    return paths.join('/')
}
// Function to save/publish module results.
//
// Called from the `saveAs` closure of a `publishDir` directive with the named
// arguments `filename`, `options`, `publish_dir` and (optionally) `publish_id`.
// Returns the relative path the file should be published under, or null when
// the file should not be published:
//   - files ending in '.version.txt' are never published;
//   - the base directory is `options.publish_dir` if set, else `args.publish_dir`;
//   - when `options.publish_by_id` is set, `args.publish_id` is appended as a
//     sub-directory (skipped when no id was passed);
//   - when `options.publish_files` is a Map of suffix -> sub-directory, only files
//     ending in one of the suffixes are published, under that sub-directory;
//   - when `options.publish_files` is null every file is published;
//   - any other `publish_files` value publishes nothing.
def saveFiles(Map args) {
    if (args.filename.endsWith('.version.txt')) {
        return null
    }
    def ioptions  = initOptions(args.options)
    def path_list = [ ioptions.publish_dir ?: args.publish_dir ]
    if (ioptions.publish_by_id && args.publish_id) {
        path_list.add(args.publish_id)
    }
    if (ioptions.publish_files instanceof Map) {
        for (ext in ioptions.publish_files) {
            if (args.filename.endsWith(ext.key)) {
                // Work on a copy so the shared base path is left untouched
                def ext_list = path_list.collect()
                if (ext.value) {
                    ext_list.add(ext.value)
                }
                return "${getPathFromList(ext_list)}/$args.filename"
            }
        }
    } else if (ioptions.publish_files == null) {
        return "${getPathFromList(path_list)}/$args.filename"
    }
    // No rule matched: returning null tells publishDir to skip this file
    return null
}

@ -0,0 +1,30 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// GFFREAD: runs `gffread` on the staged `gff` file with any extra `ioptions.args`
// and writes the result to `<gff.baseName>.gtf`. The tool's `--version` output is
// captured in `<software>.version.txt`.
process GFFREAD {
tag "$gff"
// Publish under params.outdir; saveFiles() computes the destination of each file.
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
container ""
conda (params.conda ? "bioconda::gffread=0.11.7" : null)
path gff
val options
path "*.gtf" , emit: gtf
path "*.version.txt", emit: version
// Tool name derived from the process name; used to name the version file.
def software = getSoftwareName(task.process)
// Fill in defaults for any module options the caller did not supply.
def ioptions = initOptions(options)
gffread $gff $ioptions.args -o ${gff.baseName}.gtf
echo \$(gffread --version 2>&1) > ${software}.version.txt

@ -0,0 +1,90 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Version written to the version file; hard-coded here rather than queried from the tool.
def VERSION = '2.2.0'
// HISAT2_ALIGN: aligns reads with `hisat2` (single-end via -U, paired-end via -1/-2)
// and pipes the output through `samtools view` into `${prefix}.bam`. The alignment
// summary is written to `${prefix}.hisat2.summary.log`.
process HISAT2_ALIGN {
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label 'process_high'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::hisat2=2.2.0 bioconda::samtools=1.10" : null)
tuple val(meta), path(reads)
path index
path splicesites
val options
tuple val(meta), path("*.bam"), emit: bam
tuple val(meta), path("*.log"), emit: summary
path "*.version.txt" , emit: version
tuple val(meta), path("*fastq.gz"), optional:true, emit: fastq
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// NOTE(review): the `${}` placeholders are empty - presumably a sample identifier
// belongs in them; confirm.
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// Translate meta.strandedness (and single/paired-end) into hisat2's --rna-strandness
// value; the flag stays empty for any other strandedness setting.
def strandedness = ''
if (meta.strandedness == 'forward') {
strandedness = meta.single_end ? '--rna-strandness F' : '--rna-strandness FR'
} else if (meta.strandedness == 'reverse') {
strandedness = meta.single_end ? '--rna-strandness R' : '--rna-strandness RF'
// Read-group arguments: ID and SM are always set to the prefix; CN is added (with
// whitespace replaced by '_') only when params.seq_center is given.
def seq_center = params.seq_center ? "--rg-id ${prefix} --rg CN:${params.seq_center.replaceAll('\\s','_')} SM:$prefix" : "--rg-id ${prefix} --rg SM:$prefix"
if (meta.single_end) {
// Unaligned reads are only written out when params.save_unaligned is set.
def unaligned = params.save_unaligned ? "--un-gz ${prefix}.unmapped.fastq.gz" : ''
INDEX=`find -L ./ -name "*.1.ht2" | sed 's/.1.ht2//'`
hisat2 \\
-x \$INDEX \\
-U $reads \\
$strandedness \\
--known-splicesite-infile $splicesites \\
--summary-file ${prefix}.hisat2.summary.log \\
--threads $task.cpus \\
$seq_center \\
$unaligned \\
$ioptions.args \\
| samtools view -bS -F 4 -F 256 - > ${prefix}.bam
echo $VERSION > ${software}.version.txt
} else {
// Paired-end variant of the flag above (--un-conc-gz instead of --un-gz).
def unaligned = params.save_unaligned ? "--un-conc-gz ${prefix}.unmapped.fastq.gz" : ''
INDEX=`find -L ./ -name "*.1.ht2" | sed 's/.1.ht2//'`
hisat2 \\
-x \$INDEX \\
-1 ${reads[0]} \\
-2 ${reads[1]} \\
$strandedness \\
--known-splicesite-infile $splicesites \\
--summary-file ${prefix}.hisat2.summary.log \\
--threads $task.cpus \\
$seq_center \\
$unaligned \\
--no-mixed \\
--no-discordant \\
$ioptions.args \\
| samtools view -bS -F 4 -F 8 -F 256 - > ${prefix}.bam
if [ -f ${prefix}.unmapped.fastq.1.gz ]; then
mv ${prefix}.unmapped.fastq.1.gz ${prefix}.unmapped_1.fastq.gz
if [ -f ${prefix}.unmapped.fastq.2.gz ]; then
mv ${prefix}.unmapped.fastq.2.gz ${prefix}.unmapped_2.fastq.gz
echo $VERSION > ${software}.version.txt

// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Version written to the version file; hard-coded here rather than queried from the tool.
def VERSION = '2.2.0'
// HISAT2_BUILD: creates a `hisat2` directory and runs `hisat2-build` on `fasta`.
// The splice-site and exon arguments are only passed when the task memory (in GB)
// exceeds params.hisat_build_memory.
process HISAT2_BUILD {
tag "$fasta"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
container ""
//container ""
conda (params.conda ? "bioconda::hisat2=2.2.0" : null)
path fasta
path gtf
path splicesites
val options
path "hisat2", emit: index
path "*.version.txt", emit: version
// Task memory in whole gigabytes; stays 0 when task.memory is not set.
// NOTE(review): the bracketed "[HISAT2 index build]" strings below are bare
// expressions with no visible logging call - confirm how they are meant to be emitted.
def avail_mem = 0
if (!task.memory) { "[HISAT2 index build] Available memory not known - defaulting to 0. Specify process memory requirements to change this."
} else { "[HISAT2 index build] Available memory: ${task.memory}"
avail_mem = task.memory.toGiga()
// These stay empty unless the memory check below passes.
def extract_exons = ''
def ss = ''
def exon = ''
if (avail_mem > params.hisat_build_memory) { "[HISAT2 index build] Over ${params.hisat_build_memory} GB available, so using splice sites and exons in HISAT2 index"
extract_exons = " $gtf > ${gtf.baseName}.exons.txt"
ss = "--ss $splicesites"
exon = "--exon ${gtf.baseName}.exons.txt"
} else { "[HISAT2 index build] Less than ${params.hisat_build_memory} GB available, so NOT using splice sites and exons in HISAT2 index." "[HISAT2 index build] Use --hisat_build_memory [small number] to skip this check."
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
mkdir hisat2
hisat2-build \\
-p $task.cpus \\
$ss \\
$exon \\
$ioptions.args \\
$fasta \\
echo $VERSION > ${software}.version.txt

@ -0,0 +1,31 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Version written to the version file; hard-coded here rather than queried from the tool.
def VERSION = '2.2.0'
// Process body (its `process` header is not visible here): takes a `gtf` file and
// redirects a command's output to `<gtf.baseName>.splice_sites.txt`, then records
// VERSION in `<software>.version.txt`.
// NOTE(review): the command name in front of `$gtf` in the script string is not
// visible - confirm which tool is invoked.
tag "$gtf"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
container ""
//container ""
conda (params.conda ? "bioconda::hisat2=2.2.0" : null)
path gtf
val options
path "*.splice_sites.txt", emit: txt
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
""" $gtf > ${gtf.baseName}.splice_sites.txt
echo $VERSION > ${software}.version.txt

@ -0,0 +1,54 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): runs `qualimap rnaseq`
// on `bam` with annotation `gtf`, writing into the directory `$prefix`, which is
// also what the `results` output emits. The QualiMap version is parsed from the
// tool's own output into `<software>.version.txt`.
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::qualimap=2.2.2d" : null)
tuple val(meta), path(bam)
path gtf
val options
tuple val(meta), path("${prefix}"), emit: results
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// `prefix` is assigned without `def`; the `results` output declaration above also
// refers to `${prefix}` (presumably the reason it is not a local - confirm).
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// Value for qualimap's -p option; defaults to non-strand-specific.
def strandedness = 'non-strand-specific'
if (meta.strandedness == 'forward') {
strandedness = 'strand-specific-forward'
} else if (meta.strandedness == 'reverse') {
strandedness = 'strand-specific-reverse'
// -pe is only passed for paired-end samples.
def paired_end = meta.single_end ? '' : '-pe'
// Task memory in whole gigabytes with a "G" suffix, passed to --java-mem-size.
def memory = task.memory.toGiga() + "G"
mkdir tmp
qualimap \\
--java-mem-size=$memory \\
rnaseq \\
$ioptions.args \\
-bam $bam \\
-gtf $gtf \\
-p $strandedness \\
$paired_end \\
-outdir $prefix
echo \$(qualimap 2>&1) | sed 's/^.*QualiMap v.//; s/Built.*\$//' > ${software}.version.txt

@ -0,0 +1,49 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): runs
// `rsem-calculate-expression` on `reads` against the RSEM index found by searching
// the work directory for a `*.grp` file, and records the RSEM version in
// `<software>.version.txt`.
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rsem=1.3.3" : null)
tuple val(meta), path(reads)
path index
val options
tuple val(meta), path("*.genes.results") , emit: counts_gene
tuple val(meta), path("*.isoforms.results"), emit: counts_transcript
tuple val(meta), path("*.stat") , emit: stat
path "*.version.txt" , emit: version
tuple val(meta), path("*.STAR.genome.bam") , optional:true, emit: bam_star
tuple val(meta), path("${prefix}.genome.bam") , optional:true, emit: bam_genome
tuple val(meta), path("${prefix}.transcript.bam"), optional:true, emit: bam_transcript
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// `prefix` is assigned without `def`; two of the output declarations above also
// refer to `${prefix}` (presumably the reason it is not a local - confirm).
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// --paired-end is only passed for paired-end samples.
def paired_end = meta.single_end ? "" : "--paired-end"
INDEX=`find -L ./ -name "*.grp" | sed 's/.grp//'`
rsem-calculate-expression \\
--num-threads $task.cpus \\
--temporary-folder ./tmp/ \\
$paired_end \\
$ioptions.args \\
$reads \\
\$INDEX \\
rsem-calculate-expression --version | sed -e "s/Current version: RSEM v//g" > ${software}.version.txt

@ -0,0 +1,39 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): creates an `rsem`
// directory and runs `rsem-prepare-reference` with `gtf` and `fasta`; the `rsem`
// directory is emitted as `index`. The RSEM version is recorded in
// `<software>.version.txt`.
tag "$fasta"
label 'process_high'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
container ""
//container ""
conda (params.conda ? "bioconda::rsem=1.3.3" : null)
path fasta
path gtf
val options
path "rsem" , emit: index
path "*.version.txt", emit: version
// Tool name derived from the process name; used to name the version file.
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
mkdir rsem
rsem-prepare-reference \\
--gtf $gtf \\
--num-threads $task.cpus \\
$ioptions.args \\
$fasta \\
rsem-calculate-expression --version | sed -e "s/Current version: RSEM v//g" > ${software}.version.txt

@ -0,0 +1,36 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` via -i and redirects the command's output to
// `${prefix}.bam_stat.txt`; a version string is written to `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
val options
tuple val(meta), path("*.bam_stat.txt"), emit: txt
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
$ioptions.args \\
> ${prefix}.bam_stat.txt --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,38 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` via -i and `bed` via -r and redirects the
// command's output to `${prefix}.infer_experiment.txt`; a version string is written
// to `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
path bed
val options
tuple val(meta), path("*.infer_experiment.txt"), emit: txt
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
-r $bed \\
$ioptions.args \\
> ${prefix}.infer_experiment.txt --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,50 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package). For paired-end samples it runs a command with `bam` (-i), `bed`
// (-r) and output prefix (-o), saves stdout to stdout.txt and copies its first two
// lines to `${prefix}.inner_distance_mean.txt`. In the single-end branch the visible
// script only writes the version file, which is why all data outputs are optional.
// NOTE(review): the command names are not visible in the script strings, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
path bed
val options
tuple val(meta), path("*distance.txt"), optional:true, emit: distance
tuple val(meta), path("*freq.txt") , optional:true, emit: freq
tuple val(meta), path("*mean.txt") , optional:true, emit: mean
tuple val(meta), path("*.pdf") , optional:true, emit: pdf
tuple val(meta), path("*.r") , optional:true, emit: rscript
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
if (!meta.single_end) {
""" \\
-i $bam \\
-r $bed \\
-o $prefix \\
$ioptions.args \\
> stdout.txt
head -n 2 stdout.txt > ${prefix}.inner_distance_mean.txt --version | sed -e "s/ //g" > ${software}.version.txt
} else {
""" --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,45 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` (-i), `bed` (-r) and an output prefix (-o) and
// redirects stderr to `${prefix}.junction_annotation.log`; a version string is
// written to `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
path bed
val options
tuple val(meta), path("*.junction.bed"), emit: bed
tuple val(meta), path("*.Interact.bed"), emit: interact_bed
tuple val(meta), path("*.xls") , emit: xls
tuple val(meta), path("*junction.pdf") , emit: pdf
tuple val(meta), path("*events.pdf") , emit: events_pdf
tuple val(meta), path("*.r") , emit: rscript
tuple val(meta), path("*.log") , emit: log
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
-r $bed \\
-o $prefix \\
$ioptions.args \\
2> ${prefix}.junction_annotation.log --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,39 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` (-i), `bed` (-r) and an output prefix (-o) and
// emits the resulting `*.pdf` and `*.r` files; a version string is written to
// `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, so the
// specific RSeQC tool cannot be identified from here. The tag is a bare `$`, the
// saveAs call ends in a dangling comma and the `${}` placeholders are empty - all
// look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
path bed
val options
tuple val(meta), path("*.pdf"), emit: pdf
tuple val(meta), path("*.r") , emit: rscript
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
-r $bed \\
-o $prefix \\
$ioptions.args --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,37 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` via -i and `bed` via -r and redirects the
// command's output to `${prefix}.read_distribution.txt`; a version string is
// written to `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
path bed
val options
tuple val(meta), path("*.read_distribution.txt"), emit: txt
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
// NOTE(review): `ioptions.args` is not passed to the visible command - confirm
// whether that is intentional.
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
-r $bed \\
> ${prefix}.read_distribution.txt --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,39 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): an RSeQC step (per the
// conda package) that takes `bam` (-i) and an output prefix (-o) and emits the
// `*seq.DupRate.xls`, `*pos.DupRate.xls`, `*.pdf` and `*.r` files; a version string
// is written to `<software>.version.txt`.
// NOTE(review): the command names are not visible in the script string, the tag is
// a bare `$`, the saveAs call ends in a dangling comma and the `${}` placeholders
// are empty - all look truncated; confirm the intended expressions.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::rseqc=3.0.1" : null)
tuple val(meta), path(bam)
val options
tuple val(meta), path("*seq.DupRate.xls"), emit: seq_xls
tuple val(meta), path("*pos.DupRate.xls"), emit: pos_xls
tuple val(meta), path("*.pdf") , emit: pdf
tuple val(meta), path("*.r") , emit: rscript
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
""" \\
-i $bam \\
-o $prefix \\
$ioptions.args --version | sed -e "s/ //g" > ${software}.version.txt

@ -0,0 +1,36 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// SALMON_INDEX: runs `salmon index` on `fasta`, writing the index into the `salmon`
// directory (emitted as `index`), and records the salmon version in
// `<software>.version.txt`.
process SALMON_INDEX {
tag "$fasta"
label "process_medium"
// Publish under params.outdir; saveFiles() computes the destination of each file.
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
container ""
//container ""
conda (params.conda ? "bioconda::salmon=1.3.0" : null)
path fasta
val options
path "salmon" , emit: index
path "*.version.txt", emit: version
// Tool name derived from the process name; used to name the version file.
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
salmon \\
index \\
--threads $task.cpus \\
-t $fasta \\
$ioptions.args \\
-i salmon
salmon --version | sed -e "s/salmon //g" > ${software}.version.txt

@ -0,0 +1,50 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// SALMON_QUANT: runs `salmon quant` on `reads` against `index`, using `gtf` as the
// gene map, and writes into the directory `$prefix`, which is also what the
// `results` output emits. The salmon version is recorded in `<software>.version.txt`.
process SALMON_QUANT {
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label "process_medium"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::salmon=1.3.0" : null)
tuple val(meta), path(reads)
path index
path gtf
val options
tuple val(meta), path("${prefix}"), emit: results
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// `prefix` is assigned without `def`; the `results` output declaration above also
// refers to `${prefix}` (presumably the reason it is not a local - confirm).
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// Value for --libType: U/IU by default, SF/ISF for forward and SR/ISR for reverse
// strandedness (single-end / paired-end respectively).
def strandedness = meta.single_end ? 'U' : 'IU'
if (meta.strandedness == 'forward') {
strandedness = meta.single_end ? 'SF' : 'ISF'
} else if (meta.strandedness == 'reverse') {
strandedness = meta.single_end ? 'SR' : 'ISR'
// Read arguments: -r for single-end, -1/-2 for paired-end.
def endedness = meta.single_end ? "-r $reads" : "-1 ${reads[0]} -2 ${reads[1]}"
salmon quant \\
--geneMap $gtf \\
--threads $task.cpus \\
--libType=$strandedness \\
--index $index \\
$endedness \\
$ioptions.args \\
-o $prefix
salmon --version | sed -e "s/salmon //g" > ${software}.version.txt

@ -0,0 +1,70 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// SORTMERNA: runs `sortmerna` on `reads` against every reference in `fasta`.
// The reads written via --other (non_rRNA_reads*) are gzip-compressed into
// `${prefix}*.fastq.gz`, and rRNA_reads.log is renamed to `${prefix}.sortmerna.log`.
// The SortMeRNA version is parsed from the tool's output into `<software>.version.txt`.
process SORTMERNA {
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label "process_high"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::sortmerna=4.2.0" : null)
tuple val(meta), path(reads)
path fasta
val options
tuple val(meta), path("*.fastq.gz"), emit: reads
tuple val(meta), path("*.log") , emit: log
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// Build one " --ref <file>" argument per entry of `fasta`.
def Refs = ""
for (i=0; i<fasta.size(); i++) { Refs+= " --ref ${fasta[i]}" }
if (meta.single_end) {
sortmerna \\
$Refs \\
--reads $reads \\
--threads $task.cpus \\
--workdir . \\
--aligned rRNA_reads \\
--other non_rRNA_reads \\
gzip -f < non_rRNA_reads.fq > ${prefix}.fastq.gz
mv rRNA_reads.log ${prefix}.sortmerna.log
echo \$(sortmerna --version 2>&1) | sed 's/^.*SortMeRNA version //; s/ Build Date.*\$//' > ${software}.version.txt
} else {
sortmerna \\
$Refs \\
--reads ${reads[0]} \\
--reads ${reads[1]} \\
--threads $task.cpus \\
--workdir . \\
--aligned rRNA_reads \\
--other non_rRNA_reads \\
--paired_in \\
--out2 \\
gzip -f < non_rRNA_reads_fwd.fq > ${prefix}_1.fastq.gz
gzip -f < non_rRNA_reads_rev.fq > ${prefix}_2.fastq.gz
mv rRNA_reads.log ${prefix}.sortmerna.log
echo \$(sortmerna --version 2>&1) | sed 's/^.*SortMeRNA version //; s/ Build Date.*\$//' > ${software}.version.txt

@ -0,0 +1,62 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// STAR_ALIGN: aligns `reads` against the STAR genome directory `index`, writing
// outputs with the file-name prefix `${prefix}.`. Any `Unmapped.out.mate1/2` files
// are renamed to `${prefix}.unmapped_{1,2}.fastq` and gzip-compressed. The STAR
// version is recorded in `<software>.version.txt`.
// NOTE(review): the line invoking the aligner itself is not visible in the script
// (the arguments start at --genomeDir) - confirm.
process STAR_ALIGN {
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label 'process_high'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
// Don't upgrade me - 2.7X indices incompatible with iGenomes.
container ""
//container ""
conda (params.conda ? "bioconda::star=2.6.1d" : null)
tuple val(meta), path(reads)
path index
path gtf
val options
// NOTE(review): the `log_final` glob below is just `*`, which matches every file
// in the work directory - confirm the intended pattern.
tuple val(meta), path("*Aligned.out.bam") , emit: bam
tuple val(meta), path("*") , emit: log_final
tuple val(meta), path("*Log.out") , emit: log_out
tuple val(meta), path("*Log.progress.out"), emit: log_progress
path "*.version.txt" , emit: version
tuple val(meta), path("*sortedByCoord.out.bam") , optional:true, emit: bam_sorted
tuple val(meta), path("*toTranscriptome.out.bam"), optional:true, emit: bam_transcript
tuple val(meta), path("*fastq.gz") , optional:true, emit: fastq
tuple val(meta), path("*.tab") , optional:true, emit: tab
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// The GTF is only passed via --sjdbGTFfile when params.star_ignore_sjdbgtf is not set.
def ignore_gtf = params.star_ignore_sjdbgtf ? '' : "--sjdbGTFfile $gtf"
// Read-group line: ID and SM are always set to the prefix; CN is added only when
// params.seq_center is given.
def seq_center = params.seq_center ? "--outSAMattrRGline ID:$prefix 'CN:$params.seq_center' 'SM:$prefix'" : "--outSAMattrRGline ID:$prefix 'SM:$prefix'"
--genomeDir $index \\
--readFilesIn $reads \\
--runThreadN $task.cpus \\
--outFileNamePrefix $prefix. \\
$ignore_gtf \\
$seq_center \\
if [ -f ${prefix}.Unmapped.out.mate1 ]; then
mv ${prefix}.Unmapped.out.mate1 ${prefix}.unmapped_1.fastq
gzip ${prefix}.unmapped_1.fastq
if [ -f ${prefix}.Unmapped.out.mate2 ]; then
mv ${prefix}.Unmapped.out.mate2 ${prefix}.unmapped_2.fastq
gzip ${prefix}.unmapped_2.fastq
STAR --version | sed -e "s/STAR_//g" > ${software}.version.txt

@ -0,0 +1,43 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): creates a `star`
// directory and runs a command in `--runMode genomeGenerate` with `fasta` and
// `gtf`, writing the genome into `star/` (emitted as `index`). The STAR version
// is recorded in `<software>.version.txt`.
// NOTE(review): the line invoking the tool itself is not visible in the script
// (the arguments start at --runMode) - confirm.
tag "$fasta"
label 'process_high'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), publish_id:'') }
// Don't upgrade me - 2.7X indices incompatible with iGenomes.
container ""
//container ""
conda (params.conda ? "bioconda::star=2.6.1d" : null)
path fasta
path gtf
val options
path "star" , emit: index
path "*.version.txt", emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// RAM limit argument: task memory in bytes minus 100000000; omitted entirely when
// task.memory is not set.
def avail_mem = task.memory ? "--limitGenomeGenerateRAM ${task.memory.toBytes() - 100000000}" : ''
mkdir star
--runMode genomeGenerate \\
--genomeDir star/ \\
--genomeFastaFiles $fasta \\
--sjdbGTFfile $gtf \\
--runThreadN $task.cpus \\
$avail_mem \\
STAR --version | sed -e "s/STAR_//g" > ${software}.version.txt

@ -0,0 +1,52 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// STRINGTIE: runs `stringtie` on `bam` with reference annotation `gtf` (-G) and
// writes `${prefix}.transcripts.gtf`, `${prefix}.gene_abundance.txt`,
// `${prefix}.coverage.gtf` and the `${prefix}.ballgown` output. The output of
// `stringtie --version` is recorded in `<software>.version.txt`.
process STRINGTIE {
// NOTE(review): the tag below is a bare `$` and the saveAs call ends in a dangling
// comma - both expressions look truncated; confirm the intended sample identifier.
tag "$"
label 'process_medium'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::stringtie=2.1.2" : null)
tuple val(meta), path(bam)
path gtf
val options
tuple val(meta), path("*.coverage.gtf") , emit: coverage_gtf
tuple val(meta), path("*.transcripts.gtf"), emit: transcript_gtf
tuple val(meta), path("*.txt") , emit: abundance
tuple val(meta), path("*.ballgown") , emit: ballgown
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
// NOTE(review): the `${}` placeholders are empty; confirm the intended identifier.
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
// Strand flag: --fr for forward, --rf for reverse; left empty for any other
// strandedness value.
def strandedness = ''
if (meta.strandedness == 'forward') {
strandedness = '--fr'
} else if (meta.strandedness == 'reverse') {
strandedness = '--rf'
stringtie \\
$bam \\
$strandedness \\
-G $gtf \\
-o ${prefix}.transcripts.gtf \\
-A ${prefix}.gene_abundance.txt \\
-C ${prefix}.coverage.gtf \\
-b ${prefix}.ballgown \\
stringtie --version > ${software}.version.txt

@ -0,0 +1,38 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): runs `umi_tools dedup`
// on `bam` (staged together with its index `bai`), writing `${prefix}.bam` and
// statistics files prefixed with `$prefix`. The UMI-tools version is recorded in
// `<software>.version.txt`.
// NOTE(review): the tag below is a bare `$`, the saveAs call ends in a dangling
// comma and the `${}` placeholders are empty - all look truncated; confirm the
// intended sample identifier.
tag "$"
label "process_medium"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::umi_tools=1.0.1" : null)
tuple val(meta), path(bam), path(bai)
val options
tuple val(meta), path("*.bam"), emit: bam
tuple val(meta), path("*.tsv"), emit: tsv
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
umi_tools dedup \\
-I $bam \\
-S ${prefix}.bam \\
--output-stats=$prefix \\
$ioptions.args \\
umi_tools --version | sed -e "s/UMI-tools version: //g" > ${software}.version.txt

@ -0,0 +1,54 @@
// Import generic module functions
include { initOptions; saveFiles; getSoftwareName } from './functions'
// Process body (its `process` header is not visible here): runs `umi_tools extract`
// on `reads`. Single-end input produces `${prefix}.umi_extract.fastq.gz`; paired-end
// input produces `${prefix}.umi_extract_1.fastq.gz` and `..._2.fastq.gz`. In both
// cases stdout goes to `${prefix}.umi_extract.log` and the UMI-tools version is
// recorded in `<software>.version.txt`.
// NOTE(review): the tag below is a bare `$`, the saveAs call ends in a dangling
// comma and the `${}` placeholders are empty - all look truncated; confirm the
// intended sample identifier.
tag "$"
label "process_low"
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:options, publish_dir:getSoftwareName(task.process), }
container ""
//container ""
conda (params.conda ? "bioconda::umi_tools=1.0.1" : null)
tuple val(meta), path(reads)
val options
tuple val(meta), path("*.fastq.gz"), emit: reads
tuple val(meta), path("*.log") , emit: log
path "*.version.txt" , emit: version
def software = getSoftwareName(task.process)
def ioptions = initOptions(options)
def prefix = ioptions.suffix ? "${}${ioptions.suffix}" : "${}"
if (meta.single_end) {
umi_tools \\
extract \\
-I $reads \\
-S ${prefix}.umi_extract.fastq.gz \\
$ioptions.args \\
> ${prefix}.umi_extract.log
umi_tools --version | sed -e "s/UMI-tools version: //g" > ${software}.version.txt
} else {
umi_tools \\
extract \\
-I ${reads[0]} \\
--read2-in=${reads[1]} \\
-S ${prefix}.umi_extract_1.fastq.gz \\
--read2-out=${prefix}.umi_extract_2.fastq.gz \\
$ioptions.args \\
> ${prefix}.umi_extract.log
umi_tools --version | sed -e "s/UMI-tools version: //g" > ${software}.version.txt