nf-core · maxulysse · Jun 16, 2022 · Jun 8, 2022 · Jun 10, 2022 · Jun 10, 2022
@@ -29,6 +29,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - [#540](https://github.com/nf-core/sarek/pull/540) - Add modules and subworkflows for `cnvkit` somatic mode
 - [#557](https://github.com/nf-core/sarek/pull/557) - Add `Haplotypecaller` single sample mode together with `CNNScoreVariants` and `FilterVariantTranches`
 - [#576](https://github.com/nf-core/sarek/pull/576) - Add modules and subworkflows for `cnvkit` germline mode
+- [#582](https://github.com/nf-core/sarek/pull/582) - Added option `--vep_out_format` for setting the format of the output-file from VEP to `json`, `tab` or `vcf` (default)
 
 ### Changed
 

@@ -1044,18 +1044,30 @@ process{
             (params.vep_dbnsfp && params.dbnsfp)                                  ? '--plugin dbNSFP,dbNSFP.gz,rs_dbSNP,HGVSc_VEP,HGVSp_VEP,1000Gp3_EAS_AF,1000Gp3_AMR_AF,LRT_score,GERP++_RS,gnomAD_exomes_AF' : '',
             (params.vep_loftee)                                                   ? '--plugin LoF,loftee_path:/opt/conda/envs/nf-core-vep-104.3/share/ensembl-vep-104.3-0'                                      : '',
             (params.vep_spliceai && params.spliceai_snv && params.spliceai_indel) ? '--plugin SpliceAI,snv=spliceai_scores.raw.snv.hg38.vcf.gz,indel=spliceai_scores.raw.indel.hg38.vcf.gz'                     : '',
-            (params.vep_spliceregion)                                             ? '--plugin SpliceRegion'                                                                                                     : ''
+            (params.vep_spliceregion)                                             ? '--plugin SpliceRegion'                                                                                                     : '',
+            (params.vep_out_format)                                               ? "--${params.vep_out_format}"                                                                                                : '--vcf'
         ].join(' ').trim()
         if (!params.vep_cache)    container = { params.vep_genome ? "nfcore/vep:104.3.${params.vep_genome}" : "nfcore/vep:104.3.${params.genome}" }
         publishDir       = [
-            mode: params.publish_dir_mode,
-            path: { "${params.outdir}/reports/EnsemblVEP/${meta.id}/${meta.variantcaller}" },
-            pattern: "*html"
+            [
+                mode: params.publish_dir_mode,
+                path: { "${params.outdir}/reports/EnsemblVEP/${meta.id}/${meta.variantcaller}" },
+                pattern: "*html"
+            ],
+            [
+                mode: params.publish_dir_mode,
+                path: { "${params.outdir}/annotation/${meta.id}/${meta.variantcaller}" },
+                pattern: "*{json,tab}"
+            ]
         ]
     }
 
+    withName: 'NFCORE_SAREK:SAREK:ANNOTATE:ANNOTATION_ENSEMBLVEP:ENSEMBLVEP' {
+        ext.prefix      = {"${meta.id}_VEP"}
+    }
+
     withName: ".*:ANNOTATION_MERGE:ENSEMBLVEP" {
-        // Output file will have format *_snpEff_VEP.ann.vcf
+        // Output file will have format *_snpEff_VEP.ann.vcf, *_snpEff_VEP.ann.json or *_snpEff_VEP.ann.tab
         ext.prefix       = { "${vcf.baseName.minus(".ann.vcf")}_VEP" }
     }
 

@@ -67,7 +67,7 @@
                 "git_sha": "e745e167c1020928ef20ea1397b6b4d230681b4d"
             },
             "ensemblvep": {
-                "git_sha": "40dd662fd26c3eb3160b7c8cbbe9bff80bbe2c30"
+                "git_sha": "30f72e24822576c6f90a0bf9db678b403c70eccf"
             },
             "fastqc": {
                 "git_sha": "49b18b1639f4f7104187058866a8fab33332bdfe"

@@ -67,6 +67,7 @@ params {
 
 
     // Annotation
+    vep_out_format = 'vcf'
     vep_dbnsfp = null // dbnsfp plugin disabled within VEP
     dbnsfp = null // No dbnsfp processed file
     dbnsfp_tbi = null // No dbnsfp processed file index

@@ -538,6 +538,14 @@
                     "description": "VEP cache version.",
                     "help_text": "If you use AWS iGenomes, this has already been set for you appropriately."
                 },
+                "vep_out_format": {
+                    "type": "string",
+                    "default": "vcf",
+                    "description": "VEP output-file format.",
+                    "enum": ["json", "tab", "vcf"],
+                    "help_text": "Sets the format of the output-file from VEP. Available formats: json, tab and vcf.",
+                    "fa_icon": "fas fa-table"
+                },
                 "save_reference": {
                     "type": "boolean",
                     "fa_icon": "fas fa-download",

@@ -8,20 +8,23 @@ include { ANNOTATION_ENSEMBLVEP                     } from '../nf-core/annotatio
 
 workflow ANNOTATE {
     take:
-        vcf                           // channel: [ val(meta), vcf ]
-        tools                         // Mandatory, list of tools to apply
-        snpeff_db
-        snpeff_cache
-        vep_genome
-        vep_species
-        vep_cache_version
-        vep_cache
-        vep_extra_files
-
+    vcf          // channel: [ val(meta), vcf ]
+    fasta
+    tools        // Mandatory, list of tools to apply
+    snpeff_db
+    snpeff_cache
+    vep_genome
+    vep_species
+    vep_cache_version
+    vep_cache
+    vep_extra_files
+
     main:
-    ch_reports  = Channel.empty()
-    ch_vcf_ann  = Channel.empty()
-    ch_versions = Channel.empty()
+    ch_reports   = Channel.empty()
+    ch_vcf_ann   = Channel.empty()
+    ch_tab_ann   = Channel.empty()
+    ch_json_ann  = Channel.empty()
+    ch_versions  = Channel.empty()
 
     if (tools.contains('merge') || tools.contains('snpeff')) {
         ANNOTATION_SNPEFF(vcf, snpeff_db, snpeff_cache)
@@ -33,23 +36,27 @@ workflow ANNOTATE {
 
     if (tools.contains('merge')) {
         vcf_ann_for_merge = ANNOTATION_SNPEFF.out.vcf_tbi.map{ meta, vcf, tbi -> [meta, vcf] }
-        ANNOTATION_MERGE(vcf_ann_for_merge, vep_genome, vep_species, vep_cache_version, vep_cache, vep_extra_files)
+        ANNOTATION_MERGE(vcf_ann_for_merge, fasta, vep_genome, vep_species, vep_cache_version, vep_cache, vep_extra_files)
 
         ch_reports  = ch_reports.mix(ANNOTATION_MERGE.out.reports)
         ch_vcf_ann  = ch_vcf_ann.mix(ANNOTATION_MERGE.out.vcf_tbi)
         ch_versions = ch_versions.mix(ANNOTATION_MERGE.out.versions.first())
     }
 
     if (tools.contains('vep')) {
-        ANNOTATION_ENSEMBLVEP(vcf, vep_genome, vep_species, vep_cache_version, vep_cache, vep_extra_files)
+        ANNOTATION_ENSEMBLVEP(vcf, fasta, vep_genome, vep_species, vep_cache_version, vep_cache, vep_extra_files)
 
-        ch_reports  = ch_reports.mix(ANNOTATION_ENSEMBLVEP.out.reports)
-        ch_vcf_ann  = ch_vcf_ann.mix(ANNOTATION_ENSEMBLVEP.out.vcf_tbi)
-        ch_versions = ch_versions.mix(ANNOTATION_ENSEMBLVEP.out.versions.first())
+        ch_reports   = ch_reports.mix(ANNOTATION_ENSEMBLVEP.out.reports)
+        ch_vcf_ann   = ch_vcf_ann.mix(ANNOTATION_ENSEMBLVEP.out.vcf_tbi)
+        ch_tab_ann   = ch_vcf_ann.mix(ANNOTATION_ENSEMBLVEP.out.tab)
+        ch_json_ann  = ch_vcf_ann.mix(ANNOTATION_ENSEMBLVEP.out.json)
+        ch_versions  = ch_versions.mix(ANNOTATION_ENSEMBLVEP.out.versions.first())
     }
 
     emit:
-    vcf_ann  = ch_vcf_ann      // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
-    reports  = ch_reports      //    path: *.html
-    versions = ch_versions     //    path: versions.yml
+    vcf_ann   = ch_vcf_ann      // channel: [ val(meta), vcf.gz, vcf.gz.tbi ]
+    tab_ann   = ch_tab_ann
+    json_ann  = ch_json_ann
+    reports   = ch_reports      //    path: *.html
+    versions  = ch_versions     //    path: versions.yml
 }
@@ -848,6 +848,7 @@ workflow SAREK {
         if (params.tools.contains('merge') || params.tools.contains('snpeff') || params.tools.contains('vep')) {
 
             ANNOTATE(vcf_to_annotate,
+                fasta,
                 params.tools,
                 snpeff_db,
                 snpeff_cache,