update ensemblvep and snpeff modules

2024-12-22 02:58:17 +00:00 · 2022-05-05 12:57:14 +02:00 · 2022-05-05 12:57:14 +02:00 · 40dd662fd2
commit 40dd662fd2
parent 6bb9be38c5
21 changed files with 149 additions and 125 deletions
--- a/modules/ensemblvep/Dockerfile
+++ b/modules/ensemblvep/Dockerfile
@ -8,13 +8,14 @@ LABEL \
 COPY environment.yml /
 RUN conda env create -f /environment.yml && conda clean -a
 # Add conda installation dir to PATH (instead of doing 'conda activate')
 ENV PATH /opt/conda/envs/nf-core-vep-104.3/bin:$PATH
 # Setup default ARG variables
 ARG GENOME=GRCh38
 ARG SPECIES=homo_sapiens
-ARG VEP_VERSION=99
+ARG VEP_VERSION=104
 ARG VEP_TAG=104.3
 # Add conda installation dir to PATH (instead of doing 'conda activate')
 ENV PATH /opt/conda/envs/nf-core-vep-${VEP_TAG}/bin:$PATH
 # Download Genome
 RUN vep_install \
@ -27,4 +28,4 @@ RUN vep_install \
    --NO_BIOPERL --NO_HTSLIB --NO_TEST --NO_UPDATE
 # Dump the details of the installed packages to a file for posterity
-RUN conda env export --name nf-core-vep-104.3 > nf-core-vep-104.3.yml
+RUN conda env export --name nf-core-vep-${VEP_TAG} > nf-core-vep-${VEP_TAG}.yml
--- a/modules/ensemblvep/build.sh
+++ b/modules/ensemblvep/build.sh
@ -10,11 +10,12 @@ build_push() {
    VEP_TAG=$4
    docker build \
        . \
        -t nfcore/vep:${VEP_TAG}.${GENOME} \
        software/vep/. \
        --build-arg GENOME=${GENOME} \
        --build-arg SPECIES=${SPECIES} \
-        --build-arg VEP_VERSION=${VEP_VERSION}
+        --build-arg VEP_VERSION=${VEP_VERSION} \
        --build-arg VEP_TAG=${VEP_TAG}
    docker push nfcore/vep:${VEP_TAG}.${GENOME}
 }
--- a/modules/ensemblvep/main.nf
+++ b/modules/ensemblvep/main.nf
@ -13,6 +13,7 @@ process ENSEMBLVEP {
    val   species
    val   cache_version
    path  cache
    path  extra_files
    output:
    tuple val(meta), path("*.ann.vcf"), emit: vcf
--- a/modules/ensemblvep/meta.yml
+++ b/modules/ensemblvep/meta.yml
@ -10,17 +10,6 @@ tools:
      homepage: https://www.ensembl.org/info/docs/tools/vep/index.html
      documentation: https://www.ensembl.org/info/docs/tools/vep/script/index.html
      licence: ["Apache-2.0"]
 params:
  - use_cache:
      type: boolean
      description: |
        Enable the usage of containers with cache
        Does not work with conda
  - vep_tag:
      type: value
      description: |
        Specify the tag for the container
        https://hub.docker.com/r/nfcore/vep/tags
 input:
  - meta:
      type: map
@ -47,6 +36,10 @@ input:
      type: file
      description: |
        path to VEP cache (optional)
  - extra_files:
      type: tuple
      description: |
        path to file(s) needed for plugins  (optional)
 output:
  - vcf:
      type: file
--- a/modules/snpeff/Dockerfile
+++ b/modules/snpeff/Dockerfile
@ -8,15 +8,16 @@ LABEL \
 COPY environment.yml /
 RUN conda env create -f /environment.yml && conda clean -a
 # Add conda installation dir to PATH (instead of doing 'conda activate')
 ENV PATH /opt/conda/envs/nf-core-snpeff-5.0/bin:$PATH
 # Setup default ARG variables
 ARG GENOME=GRCh38
 ARG SNPEFF_CACHE_VERSION=99
 ARG SNPEFF_TAG=99
 # Add conda installation dir to PATH (instead of doing 'conda activate')
 ENV PATH /opt/conda/envs/nf-core-snpeff-${SNPEFF_TAG}/bin:$PATH
 # Download Genome
 RUN snpEff download -v ${GENOME}.${SNPEFF_CACHE_VERSION}
 # Dump the details of the installed packages to a file for posterity
-RUN conda env export --name nf-core-snpeff-5.0 > nf-core-snpeff-5.0.yml
+RUN conda env export --name nf-core-snpeff-${SNPEFF_TAG} > nf-core-snpeff-${SNPEFF_TAG}.yml
--- a/modules/snpeff/build.sh
+++ b/modules/snpeff/build.sh
@ -9,10 +9,11 @@ build_push() {
    SNPEFF_TAG=$3
    docker build \
        . \
        -t nfcore/snpeff:${SNPEFF_TAG}.${GENOME} \
        software/snpeff/. \
        --build-arg GENOME=${GENOME} \
-        --build-arg SNPEFF_CACHE_VERSION=${SNPEFF_CACHE_VERSION}
+        --build-arg SNPEFF_CACHE_VERSION=${SNPEFF_CACHE_VERSION} \
        --build-arg SNPEFF_TAG=${SNPEFF_TAG}
    docker push nfcore/snpeff:${SNPEFF_TAG}.${GENOME}
 }
--- a/modules/snpeff/meta.yml
+++ b/modules/snpeff/meta.yml
@ -10,18 +10,6 @@ tools:
      homepage: https://pcingola.github.io/SnpEff/
      documentation: https://pcingola.github.io/SnpEff/se_introduction/
      licence: ["MIT"]
 params:
  - use_cache:
      type: boolean
      description: |
        boolean to enable the usage of containers with cache
        Enable the usage of containers with cache
        Does not work with conda
  - snpeff_tag:
      type: value
      description: |
        Specify the tag for the container
        https://hub.docker.com/r/nfcore/snpeff/tags
 input:
  - meta:
      type: map
--- a/subworkflows/nf-core/annotation/ensemblvep/main.nf
+++ b/subworkflows/nf-core/annotation/ensemblvep/main.nf
@ -0,0 +1,31 @@
 //
 // Run VEP to annotate VCF files
 //
 include { ENSEMBLVEP       } from '../../../../modules/ensemblvep/main'
 include { TABIX_BGZIPTABIX } from '../../../../modules/tabix/bgziptabix/main'
 workflow ANNOTATION_ENSEMBLVEP {
    take:
    vcf               // channel: [ val(meta), vcf ]
    vep_genome        //   value: genome to use
    vep_species       //   value: species to use
    vep_cache_version //   value: cache version to use
    vep_cache         //    path: /path/to/vep/cache (optionnal)
    vep_extra_files   // channel: [ file1, file2...] (optionnal)
    main:
    ch_versions = Channel.empty()
    ENSEMBLVEP(vcf, vep_genome, vep_species, vep_cache_version, vep_cache, vep_extra_files)
    TABIX_BGZIPTABIX(ENSEMBLVEP.out.vcf)
    // Gather versions of all tools used
    ch_versions = ch_versions.mix(ENSEMBLVEP.out.versions.first())
    ch_versions = ch_versions.mix(TABIX_BGZIPTABIX.out.versions.first())
    emit:
    vcf_tbi  = TABIX_BGZIPTABIX.out.gz_tbi // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
    reports  = ENSEMBLVEP.out.report       //    path: *.html
    versions = ch_versions                 //    path: versions.yml
 }
--- a/subworkflows/nf-core/annotation/ensemblvep/meta.yml
+++ b/subworkflows/nf-core/annotation/ensemblvep/meta.yml
@ -0,0 +1,49 @@
 name: annotation_ensemblvep
 description: |
  Perform annotation with ensemblvep and bgzip + tabix index the resulting VCF file
 keywords:
  - ensemblvep
 modules:
  - ensemblvep
  - tabix/bgziptabix
 input:
  - meta:
      type: map
      description: |
        Groovy Map containing sample information
        e.g. [ id:'test', single_end:false ]
  - vcf:
      type: file
      description: |
        vcf to annotate
  - genome:
      type: value
      description: |
        which genome to annotate with
  - species:
      type: value
      description: |
        which species to annotate with
  - cache_version:
      type: value
      description: |
        which version of the cache to annotate with
  - cache:
      type: file
      description: |
        path to VEP cache (optional)
  - extra_files:
      type: tuple
      description: |
        path to file(s) needed for plugins  (optional)
 output:
  - versions:
      type: file
      description: File containing software versions
      pattern: "versions.yml"
  - vcf_tbi:
      type: file
      description: Compressed vcf file + tabix index
      pattern: "[ *{.vcf.gz,vcf.gz.tbi} ]"
 authors:
  - "@maxulysse"
--- a/subworkflows/nf-core/annotation/snpeff/main.nf
+++ b/subworkflows/nf-core/annotation/snpeff/main.nf
@ -0,0 +1,28 @@
 //
 // Run SNPEFF to annotate VCF files
 //
 include { SNPEFF           } from '../../../../modules/snpeff/main'
 include { TABIX_BGZIPTABIX } from '../../../../modules/tabix/bgziptabix/main'
 workflow ANNOTATION_SNPEFF {
    take:
    vcf          // channel: [ val(meta), vcf ]
    snpeff_db    //   value: db version to use
    snpeff_cache //    path: /path/to/snpeff/cache (optionnal)
    main:
    ch_versions = Channel.empty()
    SNPEFF(vcf, snpeff_db, snpeff_cache)
    TABIX_BGZIPTABIX(SNPEFF.out.vcf)
    // Gather versions of all tools used
    ch_versions = ch_versions.mix(SNPEFF.out.versions.first())
    ch_versions = ch_versions.mix(TABIX_BGZIPTABIX.out.versions.first())
    emit:
    vcf_tbi  = TABIX_BGZIPTABIX.out.gz_tbi // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
    reports  = SNPEFF.out.report           //    path: *.html
    versions = ch_versions                 //    path: versions.yml
 }
--- a/subworkflows/nf-core/annotation/snpeff/meta.yml
+++ b/subworkflows/nf-core/annotation/snpeff/meta.yml
@ -11,11 +11,19 @@ input:
      type: map
      description: |
        Groovy Map containing sample information
-        e.g. [ id:'test' ]
+        e.g. [ id:'test', single_end:false ]
-  - input:
+  - vcf:
-      type: vcf
+      type: file
-      description: list containing one vcf file
+      description: |
-      pattern: "[ *.{vcf,vcf.gz} ]"
+        vcf to annotate
  - db:
      type: value
      description: |
        which db to annotate with
  - cache:
      type: file
      description: |
        path to snpEff cache (optional)
 output:
  - versions:
      type: file
--- a/subworkflows/nf-core/annotation_ensemblvep/main.nf
+++ b/subworkflows/nf-core/annotation_ensemblvep/main.nf
@ -1,26 +0,0 @@
 //
 // Run VEP to annotate VCF files
 //
 include { ENSEMBLVEP                                } from '../../../modules/ensemblvep/main'
 include { TABIX_BGZIPTABIX as ANNOTATION_BGZIPTABIX } from '../../../modules/tabix/bgziptabix/main'
 workflow ANNOTATION_ENSEMBLVEP {
    take:
    vcf               // channel: [ val(meta), vcf ]
    vep_genome        //   value: which genome
    vep_species       //   value: which species
    vep_cache_version //   value: which cache version
    vep_cache         //    path: path_to_vep_cache (optionnal)
    main:
    ENSEMBLVEP(vcf, vep_genome, vep_species, vep_cache_version, vep_cache)
    ANNOTATION_BGZIPTABIX(ENSEMBLVEP.out.vcf)
    ch_versions = ENSEMBLVEP.out.versions.first().mix(ANNOTATION_BGZIPTABIX.out.versions.first())
    emit:
    vcf_tbi  = ANNOTATION_BGZIPTABIX.out.gz_tbi // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
    reports  = ENSEMBLVEP.out.report            //    path: *.html
    versions = ch_versions                      //    path: versions.yml
 }
--- a/subworkflows/nf-core/annotation_ensemblvep/meta.yml
+++ b/subworkflows/nf-core/annotation_ensemblvep/meta.yml
@ -1,29 +0,0 @@
 name: annotation_ensemblvep
 description: |
  Perform annotation with ensemblvep and bgzip + tabix index the resulting VCF file
 keywords:
  - ensemblvep
 modules:
  - ensemblvep
  - tabix/bgziptabix
 input:
  - meta:
      type: map
      description: |
        Groovy Map containing sample information
        e.g. [ id:'test' ]
  - input:
      type: vcf
      description: list containing one vcf file
      pattern: "[ *.{vcf,vcf.gz} ]"
 output:
  - versions:
      type: file
      description: File containing software versions
      pattern: "versions.yml"
  - vcf_tbi:
      type: file
      description: Compressed vcf file + tabix index
      pattern: "[ *{.vcf.gz,vcf.gz.tbi} ]"
 authors:
  - "@maxulysse"
--- a/subworkflows/nf-core/annotation_snpeff/main.nf
+++ b/subworkflows/nf-core/annotation_snpeff/main.nf
@ -1,23 +0,0 @@
 //
 // Run SNPEFF to annotate VCF files
 //
 include { SNPEFF                                    } from '../../../modules/snpeff/main'
 include { TABIX_BGZIPTABIX as ANNOTATION_BGZIPTABIX } from '../../../modules/tabix/bgziptabix/main'
 workflow ANNOTATION_SNPEFF {
    take:
    vcf            // channel: [ val(meta), vcf ]
    snpeff_db      //   value: version of db to use
    snpeff_cache   //    path: path_to_snpeff_cache (optionnal)
    main:
    SNPEFF(vcf, snpeff_db, snpeff_cache)
    ANNOTATION_BGZIPTABIX(SNPEFF.out.vcf)
    ch_versions = SNPEFF.out.versions.first().mix(ANNOTATION_BGZIPTABIX.out.versions.first())
    emit:
    vcf_tbi  = ANNOTATION_BGZIPTABIX.out.gz_tbi // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
    reports  = SNPEFF.out.report                //    path: *.html
    versions = ch_versions                      //    path: versions.yml
 }
--- a/tests/modules/ensemblvep/main.nf
+++ b/tests/modules/ensemblvep/main.nf
@ -10,5 +10,5 @@ workflow test_ensemblvep {
        file(params.test_data['sarscov2']['illumina']['test_vcf'], checkIfExists: true)
    ]
-    ENSEMBLVEP ( input, "WBcel235", "caenorhabditis_elegans", "104", [] )
+    ENSEMBLVEP ( input, "WBcel235", "caenorhabditis_elegans", "104", [], [] )
 }
--- a/tests/subworkflows/nf-core/annotation/ensemblvep/main.nf
+++ b/tests/subworkflows/nf-core/annotation/ensemblvep/main.nf
@ -2,7 +2,7 @@
 nextflow.enable.dsl = 2
-include { ANNOTATION_ENSEMBLVEP } from '../../../../subworkflows/nf-core/annotation_ensemblvep/main'
+include { ANNOTATION_ENSEMBLVEP } from '../../../../../subworkflows/nf-core/annotation/ensemblvep/main'
 workflow annotation_ensemblvep {
    input = [
@ -10,5 +10,5 @@ workflow annotation_ensemblvep {
        file(params.test_data['sarscov2']['illumina']['test_vcf'], checkIfExists: true)
    ]
-    ANNOTATION_ENSEMBLVEP ( input, "WBcel235", "caenorhabditis_elegans", "104", [] )
+    ANNOTATION_ENSEMBLVEP ( input, "WBcel235", "caenorhabditis_elegans", "104", [], [] )
 }
--- a/tests/subworkflows/nf-core/annotation/ensemblvep/nextflow.config
+++ b/tests/subworkflows/nf-core/annotation/ensemblvep/nextflow.config
@ -7,7 +7,7 @@ process {
        publishDir = [ enabled: false ]
    }
-    withName: ANNOTATION_BGZIPTABIX {
+    withName: TABIX_BGZIPTABIX {
        ext.prefix = { "${meta.id}_VEP.ann.vcf" }
    }
--- a/tests/subworkflows/nf-core/annotation/ensemblvep/test.yml
+++ b/tests/subworkflows/nf-core/annotation/ensemblvep/test.yml
--- a/tests/subworkflows/nf-core/annotation/snpeff/main.nf
+++ b/tests/subworkflows/nf-core/annotation/snpeff/main.nf
@ -2,7 +2,7 @@
 nextflow.enable.dsl = 2
-include { ANNOTATION_SNPEFF } from '../../../../subworkflows/nf-core/annotation_snpeff/main'
+include { ANNOTATION_SNPEFF } from '../../../../../subworkflows/nf-core/annotation_snpeff/main'
 workflow annotation_snpeff {
    input = [
--- a/tests/subworkflows/nf-core/annotation/snpeff/nextflow.config
+++ b/tests/subworkflows/nf-core/annotation/snpeff/nextflow.config
@ -7,7 +7,7 @@ process {
        publishDir = [ enabled: false ]
    }
-    withName: ANNOTATION_BGZIPTABIX {
+    withName: TABIX_BGZIPTABIX {
        ext.prefix = { "${meta.id}_snpEff.ann.vcf" }
    }
--- a/tests/subworkflows/nf-core/annotation/snpeff/test.yml
+++ b/tests/subworkflows/nf-core/annotation/snpeff/test.yml