nuoxuxu
diff --git a/‎.nf-core.yml
Lines changed: 1 addition & 0 deletions b/‎.nf-core.yml
Lines changed: 1 addition & 0 deletions
diff --git a/‎00_illumina.nf
Lines changed: 57 additions & 0 deletions b/‎00_illumina.nf
Lines changed: 57 additions & 0 deletions
diff --git a/‎05_proteomic.nf
Lines changed: 0 additions & 72 deletions b/‎05_proteomic.nf
Lines changed: 0 additions & 72 deletions
diff --git a/‎main.nf
Lines changed: 15 additions & 0 deletions b/‎main.nf
Lines changed: 15 additions & 0 deletions
diff --git a/‎modules.json
Lines changed: 22 additions & 0 deletions b/‎modules.json
Lines changed: 22 additions & 0 deletions
diff --git a/‎modules/nf-core/salmon/index/environment.yml
Lines changed: 7 additions & 0 deletions b/‎modules/nf-core/salmon/index/environment.yml
Lines changed: 7 additions & 0 deletions
diff --git a/‎modules/nf-core/salmon/index/main.nf
Lines changed: 79 additions & 0 deletions b/‎modules/nf-core/salmon/index/main.nf
Lines changed: 79 additions & 0 deletions
diff --git a/‎modules/nf-core/salmon/index/meta.yml
Lines changed: 40 additions & 0 deletions b/‎modules/nf-core/salmon/index/meta.yml
Lines changed: 40 additions & 0 deletions
diff --git a/‎modules/nf-core/salmon/index/tests/main.nf.test
Lines changed: 92 additions & 0 deletions b/‎modules/nf-core/salmon/index/tests/main.nf.test
Lines changed: 92 additions & 0 deletions
@@ -0,0 +1 @@
+repository_type: pipeline
@@ -0,0 +1,57 @@
+// Builds a Salmon index directory named `salmon_index` from the given
+// transcript FASTA, passing the task's CPU count to `salmon index -p`.
+process generateSalmonIndex {
+    label 'short_slurm_job'
+
+    input:
+    path final_sample_fasta
+
+    output:
+    path 'salmon_index'
+
+    script:
+    """
+    salmon index -p $task.cpus -t $final_sample_fasta -i salmon_index
+    """
+}
+
+// Runs `generateDecoyTranscriptome.sh` on a genome FASTA, a transcript FASTA
+// and its GTF annotation, and publishes the `decoy_transcriptome/` directory
+// the script is told to write to (`-o`).
+process generateDecoyTranscriptome {
+    label 'short_slurm_job'
+
+    input:
+    path genome_fasta
+    path final_sample_gtf
+    path final_sample_fasta
+
+    output:
+    path 'decoy_transcriptome/'
+
+    script:
+    """
+    generateDecoyTranscriptome.sh \\
+        -j $task.cpus \\
+        -g $genome_fasta \\
+        -t $final_sample_fasta \\
+        -a $final_sample_gtf \\
+        -o decoy_transcriptome
+    """
+}
+// Quantifies one sample with `salmon quant`.
+//
+// Inputs:
+//   salmon_index - index directory to quantify against (`-i`)
+//   fastq_gz     - one FASTQ file (single-end, passed with `-r`) or a pair
+//                  [R1, R2] (paired-end, passed with `-1`/`-2`)
+// Output:
+//   salmon_quants/<baseName of the first FASTQ>_quant
+//
+// The command uses only the files Nextflow stages into the task directory and
+// writes inside it, so the declared output always matches what salmon
+// produces. The thread count follows `task.cpus`; set the `cpus` directive (or
+// a label that sets it) to control it.
+process runSalmon {
+    input:
+    path salmon_index
+    path fastq_gz
+
+    output:
+    path "salmon_quants/${(fastq_gz instanceof Path ? fastq_gz : fastq_gz[0]).baseName}_quant"
+
+    script:
+    // A `path` input is a single file object for one file and a list for several.
+    def reads = fastq_gz instanceof Path ? [fastq_gz] : fastq_gz
+    def quant_dir = "salmon_quants/${reads[0].baseName}_quant"
+    def read_args = reads.size() > 1 ? "-1 ${reads[0]} -2 ${reads[1]}" : "-r ${reads[0]}"
+    """
+    mkdir -p salmon_quants
+    salmon quant -i $salmon_index -l A $read_args -p $task.cpus --validateMappings -o $quant_dir
+    """
+}
+
+// Builds a Salmon index from the transcriptome FASTA named by
+// `params.transcriptome_fasta`. The workflow takes no channel inputs, so it
+// has no `take:` section.
+workflow salmon {
+    main:
+    // Resolve the parameter to a file object up front: a relative path string
+    // is not accepted by a `path` input, and `checkIfExists` reports a missing
+    // file before any task is submitted.
+    generateSalmonIndex(file(params.transcriptome_fasta, checkIfExists: true))
+}
@@ -0,0 +1,15 @@
+// Local sub-workflows. Relative module paths must start with `./` (or `../`);
+// a bare `subworkflows/...` path is rejected by Nextflow.
+include {merge_and_collapse} from './subworkflows/local/merge_and_collapse'
+include {classify_and_count} from './subworkflows/local/classify_and_count'
+include {ORFanage} from './subworkflows/local/ORFanage'
+include {proteoform_classification} from './subworkflows/local/proteoform_classification'
+include {proteomic} from './subworkflows/local/proteomic'
+include {peptide} from './subworkflows/local/peptide'
+
+// Entry workflow: chains the sub-workflows, feeding each step the named
+// outputs (`.out.<name>`) of the steps before it.
+workflow {
+    merge_and_collapse(params.flnc_bam, params.mapped_bam)
+    classify_and_count(merge_and_collapse.out.isoform_gff, merge_and_collapse.out.id_to_sample, merge_and_collapse.out.read_stat)
+    ORFanage(classify_and_count.out.final_sample_gtf, classify_and_count.out.final_sample_classification, classify_and_count.out.final_sample_fasta)
+    proteoform_classification(ORFanage.out.predicted_cds_gtf, ORFanage.out.peptide_fasta, ORFanage.out.best_orf)
+    proteomic(proteoform_classification.out.protein_database, params.mzXMLfiles)
+    peptide(classify_and_count.out.final_sample_classification, ORFanage.out.predicted_cds_gtf, proteoform_classification.out.protein_database, proteomic.out.peptides)
+}
@@ -0,0 +1,22 @@
+{
+  "name": "",
+  "homePage": "",
+  "repos": {
+    "https://github.com/nf-core/modules.git": {
+      "modules": {
+        "nf-core": {
+          "salmon/index": {
+            "branch": "master",
+            "git_sha": "81880787133db07d9b4c1febd152c090eb8325dc",
+            "installed_by": ["modules"]
+          },
+          "salmon/quant": {
+            "branch": "master",
+            "git_sha": "81880787133db07d9b4c1febd152c090eb8325dc",
+            "installed_by": ["modules"]
+          }
+        }
+      }
+    }
+  }
+}
@@ -0,0 +1,7 @@
+---
+# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/environment-schema.json
+channels:
+  - conda-forge
+  - bioconda
+dependencies:
+  - bioconda::salmon=1.10.3
@@ -0,0 +1,79 @@
+// Builds a Salmon index in a directory named `salmon` and records the salmon
+// version in `versions.yml`. When `genome_fasta` is non-empty, the genome
+// sequence names are written to `decoys.txt` and transcripts + genome are
+// concatenated into `gentrome.fa`, which is indexed with `-d decoys.txt`;
+// otherwise the transcript FASTA is indexed directly.
+process SALMON_INDEX {
+    tag "$transcript_fasta"
+    label "process_medium"
+
+    conda "${moduleDir}/environment.yml"
+    // Singularity image unless `ext.singularity_pull_docker_container` is set;
+    // otherwise the biocontainers image.
+    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
+        'https://depot.galaxyproject.org/singularity/salmon:1.10.3--h6dccd9a_2' :
+        'biocontainers/salmon:1.10.3--h6dccd9a_2' }"
+
+    input:
+    path genome_fasta
+    path transcript_fasta
+
+    output:
+    path "salmon"      , emit: index
+    path "versions.yml", emit: versions
+
+    when:
+    task.ext.when == null || task.ext.when
+
+    script:
+    // Extra command-line options for `salmon index`, taken from `ext.args`.
+    def args = task.ext.args ?: ''
+    def decoys = ''
+    def fasta = transcript_fasta
+    // NOTE(review): `endsWith('.gz')` is called on the staged input objects,
+    // not on strings. If that resolves to java.nio `Path.endsWith(String)` it
+    // compares whole path elements rather than the file-name suffix, so the
+    // gunzip substitutions below would never trigger — confirm with a .gz input.
+    if (genome_fasta){
+        if (genome_fasta.endsWith('.gz')) {
+            genome_fasta = "<(gunzip -c $genome_fasta)"
+        }
+        decoys='-d decoys.txt'
+        fasta='gentrome.fa'
+    }
+    if (transcript_fasta.endsWith('.gz')) {
+        transcript_fasta = "<(gunzip -c $transcript_fasta)"
+    }
+    """
+    if [ -n '$genome_fasta' ]; then
+        grep '^>' $genome_fasta | cut -d ' ' -f 1 | cut -d \$'\\t' -f 1 | sed 's/>//g' > decoys.txt
+        cat $transcript_fasta $genome_fasta > $fasta
+    fi
+
+    salmon \\
+        index \\
+        --threads $task.cpus \\
+        -t $fasta \\
+        $decoys \\
+        $args \\
+        -i salmon
+
+    cat <<-END_VERSIONS > versions.yml
+    "${task.process}":
+        salmon: \$(echo \$(salmon --version) | sed -e "s/salmon //g")
+    END_VERSIONS
+    """
+
+    // Stub run: creates empty placeholder files in `salmon/` instead of
+    // building an index; `versions.yml` is still written by calling salmon.
+    stub:
+    """
+    mkdir salmon
+    touch salmon/complete_ref_lens.bin
+    touch salmon/ctable.bin
+    touch salmon/ctg_offsets.bin
+    touch salmon/duplicate_clusters.tsv
+    touch salmon/info.json
+    touch salmon/mphf.bin
+    touch salmon/pos.bin
+    touch salmon/pre_indexing.log
+    touch salmon/rank.bin
+    touch salmon/refAccumLengths.bin
+    touch salmon/ref_indexing.log
+    touch salmon/reflengths.bin
+    touch salmon/refseq.bin
+    touch salmon/seq.bin
+    touch salmon/versionInfo.json
+
+    cat <<-END_VERSIONS > versions.yml
+    "${task.process}":
+        salmon: \$(echo \$(salmon --version) | sed -e "s/salmon //g")
+    END_VERSIONS
+    """
+}
@@ -0,0 +1,40 @@
+name: salmon_index
+description: Create index for salmon
+keywords:
+  - index
+  - fasta
+  - genome
+  - reference
+tools:
+  - salmon:
+      description: |
+        Salmon is a tool for wicked-fast transcript quantification from RNA-seq data
+      homepage: https://salmon.readthedocs.io/en/latest/salmon.html
+      manual: https://salmon.readthedocs.io/en/latest/salmon.html
+      doi: 10.1038/nmeth.4197
+      licence: ["GPL-3.0-or-later"]
+      identifier: biotools:salmon
+input:
+  - - genome_fasta:
+        type: file
+        description: Fasta file of the reference genome
+  - - transcript_fasta:
+        type: file
+        description: Fasta file of the reference transcriptome
+output:
+  - index:
+      - salmon:
+          type: directory
+          description: Folder containing the salmon index files
+          pattern: "salmon"
+  - versions:
+      - versions.yml:
+          type: file
+          description: File containing software versions
+          pattern: "versions.yml"
+authors:
+  - "@kevinmenden"
+  - "@drpatelh"
+maintainers:
+  - "@kevinmenden"
+  - "@drpatelh"
@@ -0,0 +1,92 @@
+// nf-test suite for the SALMON_INDEX process defined in ../main.nf.
+// Every test asserts that the process succeeds, that the emitted index path
+// exists, and that the sorted list of file names in the index plus the
+// `versions` output match the stored snapshot.
+nextflow_process {
+
+    name "Test Process SALMON_INDEX"
+    script "../main.nf"
+    process "SALMON_INDEX"
+    tag "modules"
+    tag "modules_nfcore"
+    tag "salmon"
+    tag "salmon/index"
+
+    // Genome FASTA and transcriptome FASTA both supplied.
+    test("sarscov2") {
+
+        when {
+            params {
+                outdir = "$outputDir"
+            }
+            process {
+                """
+                input[0] = Channel.of([file(params.modules_testdata_base_path + "genomics/homo_sapiens/genome/genome.fasta", checkIfExists: true)])
+                input[1] = Channel.of([file(params.modules_testdata_base_path + "genomics/sarscov2/genome/transcriptome.fasta", checkIfExists: true)])
+                """
+            }
+        }
+
+        then {
+            assertAll(
+                { assert process.success },
+                { assert path(process.out.index.get(0)).exists() },
+                { assert snapshot(
+                    file(process.out.index[0]).listFiles().collect { it.getName() }.sort().toString(),
+                    process.out.versions
+                ).match()}
+            )
+        }
+
+    }
+
+    // Empty list as the genome input; only the transcriptome FASTA is supplied.
+    test("sarscov2 transcriptome only") {
+
+        when {
+            params {
+                outdir = "$outputDir"
+            }
+            process {
+                """
+                input[0] = Channel.of([])
+                input[1] = Channel.of([file(params.modules_testdata_base_path + "genomics/sarscov2/genome/transcriptome.fasta", checkIfExists: true)])
+                """
+            }
+        }
+
+        then {
+            assertAll(
+                { assert process.success },
+                { assert path(process.out.index.get(0)).exists() },
+                { assert snapshot(
+                    file(process.out.index[0]).listFiles().collect { it.getName() }.sort().toString(),
+                    process.out.versions
+                ).match()}
+            )
+        }
+
+    }
+
+    // Same inputs as the first test, run with the `-stub` option.
+    test("sarscov2 stub") {
+        options "-stub"
+        when {
+            params {
+                outdir = "$outputDir"
+            }
+            process {
+                """
+                input[0] = Channel.of([file(params.modules_testdata_base_path + "genomics/homo_sapiens/genome/genome.fasta", checkIfExists: true)])
+                input[1] = Channel.of([file(params.modules_testdata_base_path + "genomics/sarscov2/genome/transcriptome.fasta", checkIfExists: true)])
+                """
+            }
+        }
+
+        then {
+            assertAll(
+                { assert process.success },
+                { assert path(process.out.index.get(0)).exists() },
+                { assert snapshot(
+                    file(process.out.index[0]).listFiles().collect { it.getName() }.sort().toString(),
+                    process.out.versions
+                ).match()}
+            )
+        }
+
+    }
+
+}