mirror of
https://github.com/MillironX/taxprofiler.git
synced 2024-11-22 16:49:56 +00:00
Merge pull request #130 from nf-core/krakentools/combinekreports
Adds KRAKEN_COMBINEKREPORTS for 'native' multi-sample OTU
This commit is contained in:
commit
d9795a4fdc
7 changed files with 163 additions and 13 deletions
|
@ -294,6 +294,15 @@ process {
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
|
|
||||||
|
withName: KRAKENTOOLS_COMBINEKREPORTS {
|
||||||
|
ext.prefix = { "kraken2_${meta.id}_combined_reports" }
|
||||||
|
publishDir = [
|
||||||
|
path: { "${params.outdir}/kraken2/" },
|
||||||
|
mode: params.publish_dir_mode,
|
||||||
|
pattern: '*.{txt}'
|
||||||
|
]
|
||||||
|
}
|
||||||
|
|
||||||
withName: KRONA_CLEANUP {
|
withName: KRONA_CLEANUP {
|
||||||
ext.prefix = params.perform_runmerging ? { "${meta.id}-${meta.db_name}" } : { "${meta.id}-${meta.run_accession}-${meta.db_name}" }
|
ext.prefix = params.perform_runmerging ? { "${meta.id}-${meta.db_name}" } : { "${meta.id}-${meta.run_accession}-${meta.db_name}" }
|
||||||
publishDir = [
|
publishDir = [
|
||||||
|
@ -358,6 +367,15 @@ process {
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
|
|
||||||
|
withName: KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE {
|
||||||
|
ext.prefix = { "centrifuge_${meta.id}_combined_reports" }
|
||||||
|
publishDir = [
|
||||||
|
path: { "${params.outdir}/centrifuge/" },
|
||||||
|
mode: params.publish_dir_mode,
|
||||||
|
pattern: '*.{txt}'
|
||||||
|
]
|
||||||
|
}
|
||||||
|
|
||||||
withName: KAIJU_KAIJU {
|
withName: KAIJU_KAIJU {
|
||||||
ext.prefix = params.perform_runmerging ? { "${meta.id}-${meta.db_name}" } : { "${meta.id}-${meta.run_accession}-${meta.db_name}" }
|
ext.prefix = params.perform_runmerging ? { "${meta.id}-${meta.db_name}" } : { "${meta.id}-${meta.run_accession}-${meta.db_name}" }
|
||||||
publishDir = [
|
publishDir = [
|
||||||
|
@ -369,7 +387,7 @@ process {
|
||||||
}
|
}
|
||||||
|
|
||||||
withName: KAIJU_KAIJU2TABLE {
|
withName: KAIJU_KAIJU2TABLE {
|
||||||
ext.prefix = { "${meta.id}_combined_reports" }
|
ext.prefix = { "kaiju_${meta.id}_combined_reports" }
|
||||||
publishDir = [
|
publishDir = [
|
||||||
path: { "${params.outdir}/kaiju/" },
|
path: { "${params.outdir}/kaiju/" },
|
||||||
mode: params.publish_dir_mode,
|
mode: params.publish_dir_mode,
|
||||||
|
|
|
@ -73,6 +73,10 @@
|
||||||
"branch": "master",
|
"branch": "master",
|
||||||
"git_sha": "409a308ba46284d8ebb48c2c1befd6f6433db3f7"
|
"git_sha": "409a308ba46284d8ebb48c2c1befd6f6433db3f7"
|
||||||
},
|
},
|
||||||
|
"krakentools/combinekreports": {
|
||||||
|
"branch": "master",
|
||||||
|
"git_sha": "ee0346b4d14ffdc15ce7e093ca1363cd07c9bd78"
|
||||||
|
},
|
||||||
"krakentools/kreport2krona": {
|
"krakentools/kreport2krona": {
|
||||||
"branch": "master",
|
"branch": "master",
|
||||||
"git_sha": "233fa70811a03a4cecb2ece483b5c8396e2cee1d"
|
"git_sha": "233fa70811a03a4cecb2ece483b5c8396e2cee1d"
|
||||||
|
@ -135,7 +139,7 @@
|
||||||
},
|
},
|
||||||
"untar": {
|
"untar": {
|
||||||
"branch": "master",
|
"branch": "master",
|
||||||
"git_sha": "5e7b1ef9a5a2d9258635bcbf70fcf37dacd1b247"
|
"git_sha": "393dbd6ddafe3f18eac02893dd4a21e4d45de679"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
34
modules/nf-core/modules/krakentools/combinekreports/main.nf
generated
Normal file
34
modules/nf-core/modules/krakentools/combinekreports/main.nf
generated
Normal file
|
@ -0,0 +1,34 @@
|
||||||
|
process KRAKENTOOLS_COMBINEKREPORTS {
|
||||||
|
label 'process_low'
|
||||||
|
|
||||||
|
conda (params.enable_conda ? "bioconda::krakentools=1.2" : null)
|
||||||
|
container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
|
||||||
|
'https://depot.galaxyproject.org/singularity/krakentools:1.2--pyh5e36f6f_0':
|
||||||
|
'quay.io/biocontainers/krakentools:1.2--pyh5e36f6f_0' }"
|
||||||
|
|
||||||
|
input:
|
||||||
|
tuple val(meta), path(kreports)
|
||||||
|
|
||||||
|
output:
|
||||||
|
tuple val(meta), path("*.txt"), emit: txt
|
||||||
|
path "versions.yml", emit: versions
|
||||||
|
|
||||||
|
when:
|
||||||
|
task.ext.when == null || task.ext.when
|
||||||
|
|
||||||
|
script:
|
||||||
|
def args = task.ext.args ?: ''
|
||||||
|
prefix = task.ext.prefix ?: "${meta.id}"
|
||||||
|
def VERSION = '1.2' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.
|
||||||
|
"""
|
||||||
|
combine_kreports.py \\
|
||||||
|
-r ${kreports} \\
|
||||||
|
-o ${prefix}.txt \\
|
||||||
|
${args}
|
||||||
|
|
||||||
|
cat <<-END_VERSIONS > versions.yml
|
||||||
|
"${task.process}":
|
||||||
|
combine_kreports.py: ${VERSION}
|
||||||
|
END_VERSIONS
|
||||||
|
"""
|
||||||
|
}
|
43
modules/nf-core/modules/krakentools/combinekreports/meta.yml
generated
Normal file
43
modules/nf-core/modules/krakentools/combinekreports/meta.yml
generated
Normal file
|
@ -0,0 +1,43 @@
|
||||||
|
name: krakentools_combinekreports
|
||||||
|
description: Takes a Kraken report file and prints out a krona-compatible TEXT file
|
||||||
|
keywords:
|
||||||
|
- kraken
|
||||||
|
- krakentools
|
||||||
|
- metagenomics
|
||||||
|
- table
|
||||||
|
- combining
|
||||||
|
- merging
|
||||||
|
tools:
|
||||||
|
- krakentools:
|
||||||
|
description: KrakenTools is a suite of scripts to be used for post-analysis of Kraken/KrakenUniq/Kraken2/Bracken results. Please cite the relevant paper if using KrakenTools with any of the listed programs.
|
||||||
|
homepage: https://github.com/jenniferlu717/KrakenTools
|
||||||
|
licence: ["GPL v3"]
|
||||||
|
|
||||||
|
input:
|
||||||
|
- meta:
|
||||||
|
type: map
|
||||||
|
description: |
|
||||||
|
Groovy Map containing sample information
|
||||||
|
e.g. [ id:'test', single_end:false ]
|
||||||
|
- kreports:
|
||||||
|
type: file
|
||||||
|
description: List of kraken-style report files
|
||||||
|
pattern: "*.{txt,kreport}"
|
||||||
|
|
||||||
|
output:
|
||||||
|
- meta:
|
||||||
|
type: map
|
||||||
|
description: |
|
||||||
|
Groovy Map containing sample information
|
||||||
|
e.g. [ id:'test', single_end:false ]
|
||||||
|
- versions:
|
||||||
|
type: file
|
||||||
|
description: File containing software versions
|
||||||
|
pattern: "versions.yml"
|
||||||
|
- txt:
|
||||||
|
type: file
|
||||||
|
description: Combined kreport file of all input files
|
||||||
|
pattern: "*.txt"
|
||||||
|
|
||||||
|
authors:
|
||||||
|
- "@jfy133"
|
23
modules/nf-core/modules/untar/main.nf
generated
23
modules/nf-core/modules/untar/main.nf
generated
|
@ -25,12 +25,23 @@ process UNTAR {
|
||||||
"""
|
"""
|
||||||
mkdir output
|
mkdir output
|
||||||
|
|
||||||
tar \\
|
## Ensures --strip-components only applied when top level of tar contents is a directory
|
||||||
-C output --strip-components 1 \\
|
## If just files or multiple directories, place all in output
|
||||||
-xzvf \\
|
if [[ \$(tar -tzf ${archive} | grep "/\$" | wc -l) -eq 1 ]]; then
|
||||||
$args \\
|
tar \\
|
||||||
$archive \\
|
-C output --strip-components 1 \\
|
||||||
$args2
|
-xzvf \\
|
||||||
|
$args \\
|
||||||
|
$archive \\
|
||||||
|
$args2
|
||||||
|
else
|
||||||
|
tar \\
|
||||||
|
-C output \\
|
||||||
|
-xzvf \\
|
||||||
|
$args \\
|
||||||
|
$archive \\
|
||||||
|
$args2
|
||||||
|
fi
|
||||||
|
|
||||||
mv output ${untar}
|
mv output ${untar}
|
||||||
|
|
||||||
|
|
8
modules/nf-core/modules/untar/meta.yml
generated
8
modules/nf-core/modules/untar/meta.yml
generated
|
@ -26,9 +26,9 @@ output:
|
||||||
Groovy Map containing sample information
|
Groovy Map containing sample information
|
||||||
e.g. [ id:'test', single_end:false ]
|
e.g. [ id:'test', single_end:false ]
|
||||||
- untar:
|
- untar:
|
||||||
type: file
|
type: directory
|
||||||
description:
|
description: Directory containing contents of archive
|
||||||
pattern: "*.*"
|
pattern: "*/"
|
||||||
- versions:
|
- versions:
|
||||||
type: file
|
type: file
|
||||||
description: File containing software versions
|
description: File containing software versions
|
||||||
|
@ -36,3 +36,5 @@ output:
|
||||||
authors:
|
authors:
|
||||||
- "@joseespinosa"
|
- "@joseespinosa"
|
||||||
- "@drpatelh"
|
- "@drpatelh"
|
||||||
|
- "@matthdsm"
|
||||||
|
- "@jfy133"
|
||||||
|
|
|
@ -2,8 +2,10 @@
|
||||||
// Standardise output files e.g. aggregation
|
// Standardise output files e.g. aggregation
|
||||||
//
|
//
|
||||||
|
|
||||||
include { KAIJU_KAIJU2TABLE } from '../../modules/nf-core/modules/kaiju/kaiju2table/main'
|
include { KRAKENTOOLS_COMBINEKREPORTS as KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE } from '../../modules/nf-core/modules/krakentools/combinekreports/main'
|
||||||
include { MOTUS_MERGE } from '../../modules/nf-core/modules/motus/merge/main'
|
include { KAIJU_KAIJU2TABLE } from '../../modules/nf-core/modules/kaiju/kaiju2table/main'
|
||||||
|
include { KRAKENTOOLS_COMBINEKREPORTS } from '../../modules/nf-core/modules/krakentools/combinekreports/main'
|
||||||
|
include { MOTUS_MERGE } from '../../modules/nf-core/modules/motus/merge/main'
|
||||||
|
|
||||||
workflow STANDARDISATION_PROFILES {
|
workflow STANDARDISATION_PROFILES {
|
||||||
take:
|
take:
|
||||||
|
@ -23,6 +25,8 @@ workflow STANDARDISATION_PROFILES {
|
||||||
ch_input_profiles = profiles
|
ch_input_profiles = profiles
|
||||||
.branch {
|
.branch {
|
||||||
motus: it[0]['tool'] == 'motus'
|
motus: it[0]['tool'] == 'motus'
|
||||||
|
kraken2: it[0]['tool'] == 'kraken2'
|
||||||
|
centrifuge: it[0]['tool'] == 'centrifuge'
|
||||||
unknown: true
|
unknown: true
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -43,6 +47,23 @@ workflow STANDARDISATION_PROFILES {
|
||||||
Standardise and aggregate
|
Standardise and aggregate
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
// CENTRIFUGE
|
||||||
|
|
||||||
|
// Collect and replace id for db_name for prefix
|
||||||
|
// Have to sort by size to ensure first file actually has hits otherwise
|
||||||
|
// the script fails
|
||||||
|
ch_profiles_for_centrifuge = ch_input_profiles.centrifuge
|
||||||
|
.map { [it[0]['db_name'], it[1]] }
|
||||||
|
.groupTuple(sort: {-it.size()} )
|
||||||
|
.map {
|
||||||
|
[[id:it[0]], it[1]]
|
||||||
|
}
|
||||||
|
|
||||||
|
KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE ( ch_profiles_for_centrifuge )
|
||||||
|
ch_standardised_tables = ch_standardised_tables.mix( KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE.out.txt )
|
||||||
|
ch_multiqc_files = ch_multiqc_files.mix( KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE.out.txt )
|
||||||
|
ch_versions = ch_versions.mix( KRAKENTOOLS_COMBINEKREPORTS_CENTRIFUGE.out.versions )
|
||||||
|
|
||||||
// Kaiju
|
// Kaiju
|
||||||
|
|
||||||
// Collect and replace id for db_name for prefix
|
// Collect and replace id for db_name for prefix
|
||||||
|
@ -58,6 +79,23 @@ workflow STANDARDISATION_PROFILES {
|
||||||
ch_multiqc_files = ch_multiqc_files.mix( KAIJU_KAIJU2TABLE.out.summary )
|
ch_multiqc_files = ch_multiqc_files.mix( KAIJU_KAIJU2TABLE.out.summary )
|
||||||
ch_versions = ch_versions.mix( KAIJU_KAIJU2TABLE.out.versions )
|
ch_versions = ch_versions.mix( KAIJU_KAIJU2TABLE.out.versions )
|
||||||
|
|
||||||
|
// Kraken2
|
||||||
|
|
||||||
|
// Collect and replace id for db_name for prefix
|
||||||
|
// Have to sort by size to ensure first file actually has hits otherwise
|
||||||
|
// the script fails
|
||||||
|
ch_profiles_for_kraken2 = ch_input_profiles.kraken2
|
||||||
|
.map { [it[0]['db_name'], it[1]] }
|
||||||
|
.groupTuple(sort: {-it.size()} )
|
||||||
|
.map {
|
||||||
|
[[id:it[0]], it[1]]
|
||||||
|
}
|
||||||
|
|
||||||
|
KRAKENTOOLS_COMBINEKREPORTS ( ch_profiles_for_kraken2 )
|
||||||
|
ch_standardised_tables = ch_standardised_tables.mix( KRAKENTOOLS_COMBINEKREPORTS.out.txt )
|
||||||
|
ch_multiqc_files = ch_multiqc_files.mix( KRAKENTOOLS_COMBINEKREPORTS.out.txt )
|
||||||
|
ch_versions = ch_versions.mix( KRAKENTOOLS_COMBINEKREPORTS.out.versions )
|
||||||
|
|
||||||
// mOTUs has a 'single' database, and cannot create custom ones.
|
// mOTUs has a 'single' database, and cannot create custom ones.
|
||||||
// Therefore removing db info here, and publish merged at root mOTUs results
|
// Therefore removing db info here, and publish merged at root mOTUs results
|
||||||
// directory
|
// directory
|
||||||
|
|
Loading…
Reference in a new issue