2022-03-15 06:18:43 -04:00
|
|
|
process ASCAT {
|
|
|
|
tag "$meta.id"
|
|
|
|
label 'process_medium'
|
|
|
|
|
2022-06-23 11:06:00 -04:00
|
|
|
conda (params.enable_conda ? "bioconda::ascat=3.0.0 bioconda::cancerit-allelecount=4.3.0" : null)
|
2022-03-15 06:18:43 -04:00
|
|
|
container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
|
|
|
|
'https://depot.galaxyproject.org/singularity/mulled-v2-c278c7398beb73294d78639a864352abef2931ce:dfe5aaa885de434adb2b490b68972c5840c6d761-0':
|
|
|
|
'quay.io/biocontainers/mulled-v2-c278c7398beb73294d78639a864352abef2931ce:dfe5aaa885de434adb2b490b68972c5840c6d761-0' }"
|
|
|
|
|
|
|
|
input:
|
|
|
|
tuple val(meta), path(input_normal), path(index_normal), path(input_tumor), path(index_tumor)
|
|
|
|
path(allele_files)
|
|
|
|
path(loci_files)
|
2022-06-23 11:06:00 -04:00
|
|
|
path(bed_file) // optional
|
|
|
|
path(fasta) // optional
|
|
|
|
path(gc_file) // optional
|
|
|
|
path(rt_file) // optional
|
2022-03-15 06:18:43 -04:00
|
|
|
|
|
|
|
output:
|
2022-06-23 11:06:00 -04:00
|
|
|
tuple val(meta), path("*png"), emit: png
|
|
|
|
tuple val(meta), path("*cnvs.txt"), emit: cnvs
|
|
|
|
tuple val(meta), path("*metrics.txt"), emit: metrics
|
|
|
|
tuple val(meta), path("*purityploidy.txt"), emit: purityploidy
|
|
|
|
tuple val(meta), path("*segments.txt"), emit: segments
|
|
|
|
tuple val(meta), path("*alleleFrequencies_chr*.txt"), emit: allelefreqs
|
|
|
|
path "versions.yml", emit: versions
|
2022-03-15 06:18:43 -04:00
|
|
|
|
|
|
|
when:
|
|
|
|
task.ext.when == null || task.ext.when
|
|
|
|
|
|
|
|
script:
|
|
|
|
def args = task.ext.args ?: ''
|
|
|
|
def prefix = task.ext.prefix ?: "${meta.id}"
|
|
|
|
def gender = args.gender ? "$args.gender" : "NULL"
|
|
|
|
def genomeVersion = args.genomeVersion ? "$args.genomeVersion" : "NULL"
|
|
|
|
def purity = args.purity ? "$args.purity" : "NULL"
|
|
|
|
def ploidy = args.ploidy ? "$args.ploidy" : "NULL"
|
2022-06-23 11:06:00 -04:00
|
|
|
def gc_input = gc_file ? "$gc_file" : "NULL"
|
|
|
|
def rt_input = rt_file ? "$rt_file" : "NULL"
|
2022-03-15 06:18:43 -04:00
|
|
|
|
|
|
|
def minCounts_arg = args.minCounts ? ",minCounts = $args.minCounts" : ""
|
2022-06-23 11:06:00 -04:00
|
|
|
def bed_file_arg = bed_file ? ",BED_file = '$bed_file'": ""
|
2022-03-15 06:18:43 -04:00
|
|
|
def chrom_names_arg = args.chrom_names ? ",chrom_names = $args.chrom_names" : ""
|
|
|
|
def min_base_qual_arg = args.min_base_qual ? ",min_base_qual = $args.min_base_qual" : ""
|
|
|
|
def min_map_qual_arg = args.min_map_qual ? ",min_map_qual = $args.min_map_qual" : ""
|
2022-06-23 11:06:00 -04:00
|
|
|
def fasta_arg = fasta ? ",ref.fasta = '$fasta'" : ""
|
2022-03-15 06:18:43 -04:00
|
|
|
def skip_allele_counting_tumour_arg = args.skip_allele_counting_tumour ? ",skip_allele_counting_tumour = $args.skip_allele_counting_tumour" : ""
|
|
|
|
def skip_allele_counting_normal_arg = args.skip_allele_counting_normal ? ",skip_allele_counting_normal = $args.skip_allele_counting_normal" : ""
|
|
|
|
|
|
|
|
"""
|
|
|
|
#!/usr/bin/env Rscript
|
|
|
|
library(RColorBrewer)
|
|
|
|
library(ASCAT)
|
|
|
|
options(bitmapType='cairo')
|
|
|
|
|
2022-06-23 11:06:00 -04:00
|
|
|
#build prefixes: <abspath_to_files/prefix_chr>
|
|
|
|
allele_path = normalizePath("$allele_files")
|
|
|
|
allele_prefix = paste0(allele_path, "/", "$allele_files", "_chr")
|
|
|
|
|
|
|
|
loci_path = normalizePath("$loci_files")
|
|
|
|
loci_prefix = paste0(loci_path, "/", "$loci_files", "_chr")
|
2022-03-15 06:18:43 -04:00
|
|
|
|
|
|
|
#prepare from BAM files
|
|
|
|
ascat.prepareHTS(
|
|
|
|
tumourseqfile = "$input_tumor",
|
|
|
|
normalseqfile = "$input_normal",
|
|
|
|
tumourname = "Tumour",
|
|
|
|
normalname = "Normal",
|
|
|
|
allelecounter_exe = "alleleCounter",
|
2022-06-23 11:06:00 -04:00
|
|
|
alleles.prefix = allele_prefix,
|
|
|
|
loci.prefix = loci_prefix,
|
2022-03-15 06:18:43 -04:00
|
|
|
gender = "$gender",
|
|
|
|
genomeVersion = "$genomeVersion",
|
|
|
|
nthreads = $task.cpus
|
|
|
|
$minCounts_arg
|
2022-06-23 11:06:00 -04:00
|
|
|
$bed_file_arg
|
2022-03-15 06:18:43 -04:00
|
|
|
$chrom_names_arg
|
|
|
|
$min_base_qual_arg
|
|
|
|
$min_map_qual_arg
|
2022-06-23 11:06:00 -04:00
|
|
|
$fasta_arg
|
2022-03-15 06:18:43 -04:00
|
|
|
$skip_allele_counting_tumour_arg
|
|
|
|
$skip_allele_counting_normal_arg
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
#Load the data
|
|
|
|
ascat.bc = ascat.loadData(
|
|
|
|
Tumor_LogR_file = "Tumour_tumourLogR.txt",
|
|
|
|
Tumor_BAF_file = "Tumour_normalBAF.txt",
|
|
|
|
Germline_LogR_file = "Tumour_normalLogR.txt",
|
|
|
|
Germline_BAF_file = "Tumour_normalBAF.txt",
|
|
|
|
genomeVersion = "$genomeVersion",
|
|
|
|
gender = "$gender"
|
|
|
|
)
|
|
|
|
|
|
|
|
#Plot the raw data
|
2022-06-23 11:06:00 -04:00
|
|
|
ascat.plotRawData(ascat.bc, img.prefix = "Before_correction_")
|
|
|
|
|
|
|
|
# optional LogRCorrection
|
|
|
|
if("$gc_input" != "NULL") {
|
|
|
|
gc_input = paste0(normalizePath("$gc_input"), "/", "$gc_input", ".txt")
|
|
|
|
|
|
|
|
if("$rt_input" != "NULL"){
|
|
|
|
rt_input = paste0(normalizePath("$rt_input"), "/", "$rt_input", ".txt")
|
|
|
|
ascat.bc = ascat.correctLogR(ascat.bc, GCcontentfile = gc_input, replictimingfile = rt_input)
|
|
|
|
#Plot raw data after correction
|
|
|
|
ascat.plotRawData(ascat.bc, img.prefix = "After_correction_GC_")
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
ascat.bc = ascat.correctLogR(ascat.bc, GCcontentfile = gc_input, replictimingfile = $rt_input)
|
|
|
|
#Plot raw data after correction
|
|
|
|
ascat.plotRawData(ascat.bc, img.prefix = "After_correction_GC_RT_")
|
|
|
|
}
|
|
|
|
}
|
2022-03-15 06:18:43 -04:00
|
|
|
|
|
|
|
#Segment the data
|
|
|
|
ascat.bc = ascat.aspcf(ascat.bc)
|
|
|
|
|
|
|
|
#Plot the segmented data
|
|
|
|
ascat.plotSegmentedData(ascat.bc)
|
|
|
|
|
|
|
|
#Run ASCAT to fit every tumor to a model, inferring ploidy, normal cell contamination, and discrete copy numbers
|
|
|
|
#If psi and rho are manually set:
|
|
|
|
if (!is.null($purity) && !is.null($ploidy)){
|
|
|
|
ascat.output <- ascat.runAscat(ascat.bc, gamma=1, rho_manual=$purity, psi_manual=$ploidy)
|
|
|
|
} else if(!is.null($purity) && is.null($ploidy)){
|
|
|
|
ascat.output <- ascat.runAscat(ascat.bc, gamma=1, rho_manual=$purity)
|
|
|
|
} else if(!is.null($ploidy) && is.null($purity)){
|
|
|
|
ascat.output <- ascat.runAscat(ascat.bc, gamma=1, psi_manual=$ploidy)
|
|
|
|
} else {
|
|
|
|
ascat.output <- ascat.runAscat(ascat.bc, gamma=1)
|
|
|
|
}
|
|
|
|
|
2022-06-23 11:06:00 -04:00
|
|
|
#Extract metrics from ASCAT profiles
|
|
|
|
QC = ascat.metrics(ascat.bc,ascat.output)
|
|
|
|
|
2022-03-15 06:18:43 -04:00
|
|
|
#Write out segmented regions (including regions with one copy of each allele)
|
|
|
|
write.table(ascat.output[["segments"]], file=paste0("$prefix", ".segments.txt"), sep="\t", quote=F, row.names=F)
|
|
|
|
|
|
|
|
#Write out CNVs in bed format
|
|
|
|
cnvs=ascat.output[["segments"]][2:6]
|
|
|
|
write.table(cnvs, file=paste0("$prefix",".cnvs.txt"), sep="\t", quote=F, row.names=F, col.names=T)
|
|
|
|
|
|
|
|
#Write out purity and ploidy info
|
|
|
|
summary <- tryCatch({
|
|
|
|
matrix(c(ascat.output[["aberrantcellfraction"]], ascat.output[["ploidy"]]), ncol=2, byrow=TRUE)}, error = function(err) {
|
|
|
|
# error handler picks up where error was generated
|
|
|
|
print(paste("Could not find optimal solution: ",err))
|
|
|
|
return(matrix(c(0,0),nrow=1,ncol=2,byrow = TRUE))
|
|
|
|
}
|
|
|
|
)
|
|
|
|
colnames(summary) <- c("AberrantCellFraction","Ploidy")
|
|
|
|
write.table(summary, file=paste0("$prefix",".purityploidy.txt"), sep="\t", quote=F, row.names=F, col.names=T)
|
|
|
|
|
2022-06-23 11:06:00 -04:00
|
|
|
write.table(QC, file=paste0("$prefix", ".metrics.txt"), sep="\t", quote=F, row.names=F)
|
|
|
|
|
|
|
|
# version export
|
|
|
|
f <- file("versions.yml","w")
|
|
|
|
alleleCounter_version = system(paste("alleleCounter --version"), intern = T)
|
|
|
|
ascat_version = sessionInfo()\$otherPkgs\$ASCAT\$Version
|
|
|
|
writeLines(paste0('"', "$task.process", '"', ":"), f)
|
|
|
|
writeLines(paste(" alleleCounter:", alleleCounter_version), f)
|
|
|
|
writeLines(paste(" ascat:", ascat_version), f)
|
2022-03-15 06:18:43 -04:00
|
|
|
close(f)
|
2022-06-23 11:06:00 -04:00
|
|
|
|
2022-03-15 06:18:43 -04:00
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
stub:
|
|
|
|
def prefix = task.ext.prefix ?: "${meta.id}"
|
|
|
|
"""
|
2022-03-16 08:29:11 -04:00
|
|
|
echo stub > ${prefix}.cnvs.txt
|
2022-06-23 11:06:00 -04:00
|
|
|
echo stub > ${prefix}.metrics.txt
|
2022-03-16 08:29:11 -04:00
|
|
|
echo stub > ${prefix}.purityploidy.txt
|
|
|
|
echo stub > ${prefix}.segments.txt
|
|
|
|
echo stub > Tumour.ASCATprofile.png
|
|
|
|
echo stub > Tumour.ASPCF.png
|
2022-06-23 11:06:00 -04:00
|
|
|
echo stub > Before_correction_Tumour.germline.png
|
|
|
|
echo stub > After_correction_GC_Tumour.germline.png
|
2022-03-16 08:29:11 -04:00
|
|
|
echo stub > Tumour.rawprofile.png
|
|
|
|
echo stub > Tumour.sunrise.png
|
2022-06-23 11:06:00 -04:00
|
|
|
echo stub > Before_correction_Tumour.tumour.png
|
|
|
|
echo stub > After_correction_GC_Tumour.tumour.png
|
|
|
|
echo stub > Tumour_alleleFrequencies_chr21.txt
|
|
|
|
echo stub > Tumour_alleleFrequencies_chr22.txt
|
|
|
|
echo stub > Normal_alleleFrequencies_chr21.txt
|
|
|
|
echo stub > Normal_alleleFrequencies_chr22.txt
|
|
|
|
|
|
|
|
echo "${task.process}:" > versions.yml
|
|
|
|
echo ' alleleCounter: 4.3.0' >> versions.yml
|
2022-03-15 06:18:43 -04:00
|
|
|
echo ' ascat: 3.0.0' >> versions.yml
|
2022-06-23 11:06:00 -04:00
|
|
|
|
2022-03-15 06:18:43 -04:00
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
}
|