2019-06-24 20:50:36 -04:00
|
|
|
/*
|
|
|
|
* -------------------------------------------------
|
|
|
|
* Nextflow config file for Chan Zuckerberg Biohub
|
|
|
|
* -------------------------------------------------
|
|
|
|
* Defines reference genomes, using iGenome paths
|
|
|
|
* Imported under the default 'standard' Nextflow
|
|
|
|
* profile in nextflow.config
|
|
|
|
*/
|
|
|
|
|
|
|
|
//Profile config names for nf-core/configs
|
|
|
|
params {
|
|
|
|
config_profile_description = 'Chan Zuckerberg Biohub AWS Batch profile provided by nf-core/configs.'
|
|
|
|
config_profile_contact = 'Olga Botvinnik (@olgabot)'
|
|
|
|
config_profile_url = 'https://www.czbiohub.org/'
|
|
|
|
}
|
|
|
|
|
|
|
|
docker {
|
|
|
|
enabled = true
|
|
|
|
}
|
|
|
|
|
|
|
|
process {
|
|
|
|
executor = 'awsbatch'
|
2019-07-01 12:25:46 -04:00
|
|
|
queue = 'default-971039e0-830c-11e9-9e0b-02c5b84a8036'
|
2019-06-24 20:50:36 -04:00
|
|
|
errorStrategy = 'ignore'
|
|
|
|
}
|
|
|
|
|
|
|
|
workDir = "s3://czb-nextflow/intermediates/"
|
|
|
|
|
|
|
|
aws.region = 'us-west-2'
|
|
|
|
executor.awscli = '/home/ec2-user/miniconda/bin/aws'
|
|
|
|
params.tracedir = './'
|
|
|
|
|
|
|
|
params {
|
|
|
|
saveReference = true
|
|
|
|
|
|
|
|
// Largest SPOT instances available on AWS: https://ec2instances.info/
|
|
|
|
max_memory = 1952.GB
|
|
|
|
max_cpus = 96
|
|
|
|
max_time = 240.h
|
|
|
|
|
2019-06-24 20:52:10 -04:00
|
|
|
// Compatible with multiple versions of rnaseq pipeline
|
2019-06-24 20:50:36 -04:00
|
|
|
seq_center = "czbiohub"
|
2019-06-24 20:52:10 -04:00
|
|
|
seqCenter = "czbiohub"
|
2019-06-24 20:50:36 -04:00
|
|
|
|
|
|
|
// illumina iGenomes reference file paths on CZ Biohub reference s3 bucket
|
|
|
|
// No final slash because it's added later
|
|
|
|
igenomes_base = "s3://czbiohub-reference/igenomes"
|
|
|
|
|
|
|
|
// GENCODE (human + mouse) reference file paths on CZ Biohub reference s3 bucket
|
|
|
|
// No final slash because it's added later
|
|
|
|
gencode_base = "s3://czbiohub-reference/gencode"
|
|
|
|
transgenes_base = "s3://czbiohub-reference/transgenes"
|
|
|
|
|
|
|
|
// AWS configurations
|
|
|
|
awsregion = "us-west-2"
|
|
|
|
awsqueue = "nextflow"
|
|
|
|
|
2019-10-28 06:38:24 -04:00
|
|
|
igenomes_ignore = true
|
|
|
|
igenomesIgnore = true //deprecated
|
2019-06-24 20:50:36 -04:00
|
|
|
|
|
|
|
fc_extra_attributes = 'gene_name'
|
|
|
|
fc_group_features = 'gene_id'
|
|
|
|
fc_group_features_type = 'gene_type'
|
|
|
|
|
2019-07-03 19:01:03 -04:00
|
|
|
trim_pattern = '_+S\\d+'
|
|
|
|
|
2019-06-24 20:50:36 -04:00
|
|
|
// GENCODE GTF and fasta files
|
|
|
|
genomes {
|
|
|
|
'GRCh38' {
|
|
|
|
fasta = "${params.gencode_base}/human/v30/GRCh38.p12.genome.ERCC92.fa"
|
2019-06-26 20:56:26 -04:00
|
|
|
gtf = "${params.gencode_base}/human/v30/gencode.v30.annotation.ERCC92.gtf"
|
2019-06-24 20:50:36 -04:00
|
|
|
transcript_fasta = "${params.gencode_base}/human/v30/gencode.v30.transcripts.ERCC92.fa"
|
|
|
|
star = "${params.gencode_base}/human/v30/STARIndex/"
|
2019-06-27 18:02:47 -04:00
|
|
|
salmon_index = "${params.gencode_base}/human/v30/salmon_index/"
|
2019-06-24 20:50:36 -04:00
|
|
|
}
|
|
|
|
'GRCm38' {
|
|
|
|
fasta = "${params.gencode_base}/mouse/vM21/GRCm38.p6.genome.ERCC92.fa"
|
2019-06-26 20:56:26 -04:00
|
|
|
gtf = "${params.gencode_base}/mouse/vM21/gencode.vM21.annotation.ERCC92.gtf"
|
2019-06-24 20:50:36 -04:00
|
|
|
transcript_fasta = "${params.gencode_base}/mouse/vM21/gencode.vM21.transcripts.ERCC92.fa"
|
2019-07-09 19:02:25 -04:00
|
|
|
star = "${params.gencode_base}/mouse/vM21/STARIndex/"
|
2019-06-24 20:50:36 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
transgenes {
|
|
|
|
'ChR2' {
|
|
|
|
fasta = "${params.transgenes_base}/ChR2/ChR2.fa"
|
|
|
|
gtf = "${params.transgenes_base}/ChR2/ChR2.gtf"
|
|
|
|
}
|
|
|
|
'Cre' {
|
|
|
|
fasta = "${params.transgenes_base}/Cre/Cre.fa"
|
|
|
|
gtf = "${params.transgenes_base}/Cre/Cre.gtf"
|
|
|
|
}
|
|
|
|
'ERCC' {
|
|
|
|
fasta = "${params.transgenes_base}/ERCC92/ERCC92.fa"
|
|
|
|
gtf = "${params.transgenes_base}/ERCC92/ERCC92.gtf"
|
|
|
|
}
|
|
|
|
'GCaMP6m' {
|
|
|
|
fasta = "${params.transgenes_base}/GCaMP6m/GCaMP6m.fa"
|
|
|
|
gtf = "${params.transgenes_base}/GCaMP6m/GCaMP6m.gtf"
|
|
|
|
}
|
|
|
|
'GFP' {
|
|
|
|
fasta = "${params.transgenes_base}/Gfp/Gfp.fa"
|
|
|
|
gtf = "${params.transgenes_base}/Gfp/Gfp.gtf"
|
|
|
|
}
|
|
|
|
'NpHR' {
|
|
|
|
fasta = "${params.transgenes_base}/NpHR/NpHR.fa"
|
|
|
|
gtf = "${params.transgenes_base}/NpHR/NpHR.gtf"
|
|
|
|
}
|
|
|
|
'RCaMP' {
|
|
|
|
fasta = "${params.transgenes_base}/RCaMP/RCaMP.fa"
|
|
|
|
gtf = "${params.transgenes_base}/RCaMP/RCaMP.gtf"
|
|
|
|
}
|
|
|
|
'RGECO' {
|
|
|
|
fasta = "${params.transgenes_base}/RGECO/RGECO.fa"
|
|
|
|
gtf = "${params.transgenes_base}/RGECO/RGECO.gtf"
|
|
|
|
}
|
|
|
|
'Tdtom' {
|
|
|
|
fasta = "${params.transgenes_base}/Tdtom/Tdtom.fa"
|
|
|
|
gtf = "${params.transgenes_base}/Tdtom/Tdtom.gtf"
|
|
|
|
}
|
|
|
|
'Car-T' {
|
|
|
|
fasta = "${params.transgenes_base}/car-t/car-t.fa"
|
|
|
|
gtf = "${params.transgenes_base}/car-t/car-t.gtf"
|
|
|
|
}
|
|
|
|
'zsGreen' {
|
|
|
|
fasta = "${params.transgenes_base}/zsGreen/zsGreen.fa"
|
|
|
|
gtf = "${params.transgenes_base}/zsGreen/zsGreen.gtf"
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|