2020-12-17 18:50:24 -05:00
|
|
|
// STAR_ALIGN: run the STAR aligner on the reads of one sample against a
// pre-built genome index and collect the resulting alignment files, logs and
// tool versions.
//
// Inputs
//   meta                 sample metadata map; `meta.id` is used for the task tag
//                        and as the default output prefix
//   reads                read file(s), passed verbatim to `--readFilesIn`
//   index                STAR genome directory, passed to `--genomeDir`
//   gtf                  annotation file, passed to `--sjdbGTFfile` unless
//                        `star_ignore_sjdbgtf` is truthy
//   star_ignore_sjdbgtf  when truthy, `--sjdbGTFfile` is omitted
//   seq_platform         optional value written as the `PL:` read-group field
//   seq_center           optional value written as the `CN:` read-group field
//
// Configuration (task.ext)
//   args    extra STAR command-line options (default: '')
//   prefix  output file prefix (default: meta.id)
//   when    optional guard; the task runs when it is null or truthy
process STAR_ALIGN {
    tag "$meta.id"
    label 'process_high'

    conda (params.enable_conda ? "bioconda::star=2.7.10a bioconda::samtools=1.15.1 conda-forge::gawk=5.1.0" : null)
    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
        'https://depot.galaxyproject.org/singularity/mulled-v2-1fa26d1ce03c295fe2fdcf85831a92fbcbd7e8c2:afaaa4c6f5b308b4b6aa2dd8e99e1466b2a6b0cd-0' :
        'quay.io/biocontainers/mulled-v2-1fa26d1ce03c295fe2fdcf85831a92fbcbd7e8c2:afaaa4c6f5b308b4b6aa2dd8e99e1466b2a6b0cd-0' }"

    input:
    tuple val(meta), path(reads)
    path index
    path gtf
    val star_ignore_sjdbgtf
    val seq_platform
    val seq_center

    output:
    // Mandatory outputs: the task fails if any of these globs matches nothing.
    tuple val(meta), path('*d.out.bam')       , emit: bam
    tuple val(meta), path('*Log.final.out')   , emit: log_final
    tuple val(meta), path('*Log.out')         , emit: log_out
    tuple val(meta), path('*Log.progress.out'), emit: log_progress
    path  "versions.yml"                      , emit: versions

    // Optional outputs: only present for particular STAR option combinations.
    tuple val(meta), path('*sortedByCoord.out.bam')  , optional:true, emit: bam_sorted
    tuple val(meta), path('*toTranscriptome.out.bam'), optional:true, emit: bam_transcript
    tuple val(meta), path('*Aligned.unsort.out.bam') , optional:true, emit: bam_unsorted
    tuple val(meta), path('*fastq.gz')               , optional:true, emit: fastq
    tuple val(meta), path('*.tab')                   , optional:true, emit: tab
    tuple val(meta), path('*.out.junction')          , optional:true, emit: junction
    tuple val(meta), path('*.out.sam')               , optional:true, emit: sam

    when:
    task.ext.when == null || task.ext.when

    script:
    def args   = task.ext.args ?: ''
    def prefix = task.ext.prefix ?: "${meta.id}"

    // Omit the annotation flag entirely when the caller asks to ignore the GTF.
    def ignore_gtf = star_ignore_sjdbgtf ? '' : "--sjdbGTFfile $gtf"

    // Read-group pieces. The locals carry an `_arg` suffix so that they do not
    // shadow the `seq_platform` / `seq_center` process inputs.
    def seq_platform_arg = seq_platform ? "'PL:$seq_platform'" : ""
    def seq_center_arg   = seq_center ? "'CN:$seq_center' " : ""

    // Only add a default read-group line when the user has not supplied one via
    // task.ext.args; otherwise the flag would be passed to STAR twice. This
    // mirrors the handling of --outSAMtype below.
    def attr_rg = args.contains('--outSAMattrRGline')
        ? ''
        : "--outSAMattrRGline ID:$prefix ${seq_center_arg}'SM:$prefix' $seq_platform_arg "

    // Default to unsorted BAM output unless the user chose an output type.
    def out_sam_type = (args.contains('--outSAMtype')) ? '' : '--outSAMtype BAM Unsorted'

    // When both unsorted and coordinate-sorted BAMs are requested, rename the
    // unsorted file so it is picked up by the `bam_unsorted` output glob.
    // NOTE: this is an exact substring match on task.ext.args.
    def mv_unsorted_bam = (args.contains('--outSAMtype BAM Unsorted SortedByCoordinate')) ? "mv ${prefix}.Aligned.out.bam ${prefix}.Aligned.unsort.out.bam" : ''
    """
    STAR \\
        --genomeDir $index \\
        --readFilesIn $reads \\
        --runThreadN $task.cpus \\
        --outFileNamePrefix $prefix. \\
        $out_sam_type \\
        $ignore_gtf \\
        $attr_rg \\
        $args

    $mv_unsorted_bam

    if [ -f ${prefix}.Unmapped.out.mate1 ]; then
        mv ${prefix}.Unmapped.out.mate1 ${prefix}.unmapped_1.fastq
        gzip ${prefix}.unmapped_1.fastq
    fi
    if [ -f ${prefix}.Unmapped.out.mate2 ]; then
        mv ${prefix}.Unmapped.out.mate2 ${prefix}.unmapped_2.fastq
        gzip ${prefix}.unmapped_2.fastq
    fi

    cat <<-END_VERSIONS > versions.yml
    "${task.process}":
        star: \$(STAR --version | sed -e "s/STAR_//g")
        samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//')
        gawk: \$(echo \$(gawk --version 2>&1) | sed 's/^.*GNU Awk //; s/, .*\$//')
    END_VERSIONS
    """

    stub:
    // Creates one empty placeholder per declared output so that `-stub-run`
    // satisfies every output glob without running STAR.
    def prefix = task.ext.prefix ?: "${meta.id}"
    """
    touch ${prefix}Xd.out.bam
    touch ${prefix}.Log.final.out
    touch ${prefix}.Log.out
    touch ${prefix}.Log.progress.out
    touch ${prefix}.sortedByCoord.out.bam
    touch ${prefix}.toTranscriptome.out.bam
    touch ${prefix}.Aligned.unsort.out.bam
    touch ${prefix}.unmapped_1.fastq.gz
    touch ${prefix}.unmapped_2.fastq.gz
    touch ${prefix}.tab
    touch ${prefix}.Chimeric.out.junction
    touch ${prefix}.out.sam

    cat <<-END_VERSIONS > versions.yml
    "${task.process}":
        star: \$(STAR --version | sed -e "s/STAR_//g")
        samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//')
        gawk: \$(echo \$(gawk --version 2>&1) | sed 's/^.*GNU Awk //; s/, .*\$//')
    END_VERSIONS
    """
}
|