mirror of
https://github.com/MillironX/nf-core_modules.git
synced 2024-11-13 05:13:09 +00:00
Add blast/tblastn module (#2092)
* cherry pick the module files from sanger-tol branch and update the test data from official nf-core test datasets * Update modules/blast/tblastn/main.nf, align the emit Co-authored-by: nvnieuwk <101190534+nvnieuwk@users.noreply.github.com> Co-authored-by: nvnieuwk <101190534+nvnieuwk@users.noreply.github.com>
This commit is contained in:
parent
d1c8bddaaa
commit
8e21005d53
6 changed files with 134 additions and 0 deletions
37
modules/blast/tblastn/main.nf
Normal file
37
modules/blast/tblastn/main.nf
Normal file
|
@ -0,0 +1,37 @@
|
|||
process BLAST_TBLASTN {
|
||||
tag "$meta.id"
|
||||
label 'process_medium'
|
||||
|
||||
conda (params.enable_conda ? 'bioconda::blast=2.12.0' : null)
|
||||
container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
|
||||
'https://depot.galaxyproject.org/singularity/blast:2.12.0--pl5262h3289130_0' :
|
||||
'quay.io/biocontainers/blast:2.12.0--pl5262h3289130_0' }"
|
||||
|
||||
input:
|
||||
tuple val(meta), path(fasta)
|
||||
path db
|
||||
|
||||
output:
|
||||
tuple val(meta), path('*.tblastn.txt') , emit: txt
|
||||
path "versions.yml" , emit: versions
|
||||
|
||||
when:
|
||||
task.ext.when == null || task.ext.when
|
||||
|
||||
script:
|
||||
def args = task.ext.args ?: ''
|
||||
def prefix = task.ext.prefix ?: "${meta.id}"
|
||||
"""
|
||||
DB=`find -L ./ -name "*.nsq" | sed 's/.nsq//'`
|
||||
tblastn \\
|
||||
-num_threads $task.cpus \\
|
||||
-db \$DB \\
|
||||
-query $fasta \\
|
||||
$args \\
|
||||
-out ${prefix}.tblastn.txt
|
||||
cat <<-END_VERSIONS > versions.yml
|
||||
"${task.process}":
|
||||
blast: \$(tblastn -version 2>&1 | sed 's/^.*tblastn: //; s/ .*\$//')
|
||||
END_VERSIONS
|
||||
"""
|
||||
}
|
41
modules/blast/tblastn/meta.yml
Normal file
41
modules/blast/tblastn/meta.yml
Normal file
|
@ -0,0 +1,41 @@
|
|||
name: blast_tblastn
|
||||
description: Queries a BLAST DNA database
|
||||
keywords:
|
||||
- fasta
|
||||
- blast
|
||||
- tblastn
|
||||
- DNA sequence
|
||||
tools:
|
||||
- blast:
|
||||
description: |
|
||||
Protein to Translated Nucleotide BLAST.
|
||||
homepage: https://blast.ncbi.nlm.nih.gov/Blast.cgi
|
||||
documentation: https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&PAGE_TYPE=Blastdocs
|
||||
doi: 10.1016/S0022-2836(05)80360-2
|
||||
licence: ["US-Government-Work"]
|
||||
input:
|
||||
- meta:
|
||||
type: map
|
||||
description: |
|
||||
Groovy Map containing sample information
|
||||
e.g. [ id:'test', single_end:false ]
|
||||
- fasta:
|
||||
type: file
|
||||
description: Input fasta file containing queries sequences
|
||||
pattern: "*.{fa,fasta}"
|
||||
- db:
|
||||
type: directory
|
||||
description: Directory containing blast database
|
||||
pattern: "*"
|
||||
output:
|
||||
- txt:
|
||||
type: file
|
||||
description: File containing blastn hits
|
||||
pattern: "*.{tblastn.txt}"
|
||||
- versions:
|
||||
type: file
|
||||
description: File containing software versions
|
||||
pattern: "versions.yml"
|
||||
authors:
|
||||
- "@yumisims"
|
||||
- "@gq2"
|
|
@ -379,6 +379,10 @@ blast/makeblastdb:
|
|||
- modules/blast/makeblastdb/**
|
||||
- tests/modules/blast/makeblastdb/**
|
||||
|
||||
blast/tblastn:
|
||||
- modules/blast/tblastn/**
|
||||
- tests/modules/blast/tblastn/**
|
||||
|
||||
bowtie/align:
|
||||
- modules/bowtie/align/**
|
||||
- modules/bowtie/build/**
|
||||
|
|
15
tests/modules/blast/tblastn/main.nf
Normal file
15
tests/modules/blast/tblastn/main.nf
Normal file
|
@ -0,0 +1,15 @@
|
|||
#!/usr/bin/env nextflow
|
||||
|
||||
nextflow.enable.dsl = 2
|
||||
|
||||
include { BLAST_TBLASTN } from '../../../../modules/blast/tblastn/main.nf'
|
||||
include { BLAST_MAKEBLASTDB } from '../../../../modules/blast/makeblastdb/main.nf'
|
||||
|
||||
workflow test_blast_tblastn {
|
||||
|
||||
input = [ file(params.test_data['sarscov2']['genome']['genome_fasta'], checkIfExists: true) ]
|
||||
input_pep = [ file(params.test_data['sarscov2']['genome']['proteome_fasta'], checkIfExists: true) ]
|
||||
|
||||
BLAST_MAKEBLASTDB ( input )
|
||||
BLAST_TBLASTN ( [ [id:'test'], input_pep ], BLAST_MAKEBLASTDB.out.db )
|
||||
}
|
12
tests/modules/blast/tblastn/nextflow.config
Normal file
12
tests/modules/blast/tblastn/nextflow.config
Normal file
|
@ -0,0 +1,12 @@
|
|||
process {
|
||||
|
||||
withName: BLAST_MAKEBLASTDB {
|
||||
publishDir = { "${params.outdir}/${task.process.tokenize(':')[-1].tokenize('_')[0].toLowerCase()}" }
|
||||
ext.args = '-dbtype nucl'
|
||||
}
|
||||
|
||||
withName: BLAST_TBLASTN {
|
||||
publishDir = { "${params.outdir}/${task.process.tokenize(':')[-1].tokenize('_')[0].toLowerCase()}" }
|
||||
ext.args = '-outfmt 6 -task tblastn -evalue 0.001 -qcov_hsp_perc 60 -max_target_seqs 1'
|
||||
}
|
||||
}
|
25
tests/modules/blast/tblastn/test.yml
Normal file
25
tests/modules/blast/tblastn/test.yml
Normal file
|
@ -0,0 +1,25 @@
|
|||
- name: blast tblastn
|
||||
command: nextflow run ./tests/modules/blast/tblastn -entry test_blast_tblastn -c ./tests/config/nextflow.config -c ./tests/modules/blast/tblastn/nextflow.config
|
||||
tags:
|
||||
- blast
|
||||
- blast/tblastn
|
||||
files:
|
||||
- path: ./output/blast/test.tblastn.txt
|
||||
md5sum: c26ccfa5ceae82fc6affdc77f5505b62
|
||||
- path: ./output/blast/versions.yml
|
||||
md5sum: 6d23563b8d75e2fe1e03d3fbe10098a9
|
||||
- path: ./output/blast/blast_db/genome.fasta.nsq
|
||||
md5sum: 982cbc7d9e38743b9b1037588862b9da
|
||||
- path: ./output/blast/blast_db/genome.fasta.nin
|
||||
- path: ./output/blast/blast_db/genome.fasta
|
||||
md5sum: 6e9fe4042a72f2345f644f239272b7e6
|
||||
- path: ./output/blast/blast_db/genome.fasta.nhr
|
||||
md5sum: f4b4ddb034fd3dd7b25c89e9d50c004e
|
||||
- path: ./output/blast/blast_db/genome.fasta.ndb
|
||||
md5sum: 0d553c830656469211de113c5022f06d
|
||||
- path: ./output/blast/blast_db/genome.fasta.not
|
||||
md5sum: 1e53e9d08f1d23af0299cfa87478a7bb
|
||||
- path: ./output/blast/blast_db/genome.fasta.nto
|
||||
md5sum: 33cdeccccebe80329f1fdbee7f5874cb
|
||||
- path: ./output/blast/blast_db/genome.fasta.ntf
|
||||
md5sum: de1250813f0c7affc6d12dac9d0fb6bb
|
Loading…
Reference in a new issue