Skip to content

Commit

Permalink
Initialized changes
Browse files Browse the repository at this point in the history
  • Loading branch information
nschcolnicov committed Aug 26, 2024
1 parent 0a39d56 commit 4adf3d5
Show file tree
Hide file tree
Showing 8 changed files with 51 additions and 36 deletions.
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
- [[#382]](https://github.com/nf-core/smrnaseq/pull/382) - Add [collapse_mirtop.R](https://github.com/nf-core/smrnaseq/issues/174) - Add nf-tests for local modules using custom R scripts.
- [[#383]](https://github.com/nf-core/smrnaseq/pull/383) - Fix [parameter `--skip_fastp` throws an error](https://github.com/nf-core/smrnaseq/issues/263) - Fix parameter --skip_fastp.
- [[#384]](https://github.com/nf-core/smrnaseq/pull/384) - Fix [filter status bug fix](https://github.com/nf-core/smrnaseq/issues/360) - Fix filter stats module and add filter contaminants test profile.
- [[#388]](https://github.com/nf-core/smrnaseq/pull/388) - Fix [igenomes fix](https://github.com/nf-core/smrnaseq/issues/360) - Fix workflow scripts so that they can use igenome parameters.

## v2.3.1 - 2024-04-18 - Gray Zinc Dalmation Patch

Expand Down
3 changes: 3 additions & 0 deletions main.nf
Original file line number Diff line number Diff line change
Expand Up @@ -61,6 +61,9 @@ workflow {
NFCORE_SMRNASEQ (
Channel.of(file(params.input, checkIfExists: true)),
PIPELINE_INITIALISATION.out.samplesheet,
params.fasta,
params.mirtrace_species,
params.bowtie_index,
ch_versions
)

Expand Down
3 changes: 2 additions & 1 deletion modules/local/mirtop_quant.nf
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@ process MIRTOP_QUANT {
path ("bams/*")
path hairpin
path gtf
val mirtrace_species

output:
path "mirtop/mirtop.gff" , emit: mirtop_gff
Expand All @@ -22,7 +23,7 @@ process MIRTOP_QUANT {
task.ext.when == null || task.ext.when

script:
def filter_species = params.mirgenedb ? params.mirgenedb_species : params.mirtrace_species
def filter_species = params.mirgenedb ? params.mirgenedb_species : mirtrace_species
"""
#Cleanup the GTF if mirbase html form is broken
GTF="$gtf"
Expand Down
3 changes: 2 additions & 1 deletion modules/local/mirtrace.nf
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@ process MIRTRACE_RUN {
input:
tuple val(adapter), val(ids), path(reads)
path(mirtrace_config)
val mirtrace_species

output:
path "mirtrace/*" , emit: mirtrace
Expand All @@ -30,7 +31,7 @@ process MIRTRACE_RUN {
export mirtracejar=\$(dirname \$(which mirtrace))
java $java_mem -jar \$mirtracejar/mirtrace.jar --mirtrace-wrapper-name mirtrace qc \\
--species $params.mirtrace_species \\
--species $mirtrace_species \\
$protocol \\
--config $mirtrace_config \\
--write-fasta \\
Expand Down
3 changes: 2 additions & 1 deletion modules/local/parse_fasta_mirna.nf
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ process PARSE_FASTA_MIRNA {

input:
tuple val(meta2), path(fasta)
val mirtrace_species

output:
tuple val(meta2), path('*_igenome.fa'), emit: parsed_fasta
Expand All @@ -17,7 +18,7 @@ process PARSE_FASTA_MIRNA {
task.ext.when == null || task.ext.when

script:
def filter_species = params.mirgenedb ? params.mirgenedb_species : params.mirtrace_species
filter_species = params.mirgenedb ? params.mirgenedb_species : mirtrace_species
"""
# Uncompress FASTA reference files if necessary
FASTA="$fasta"
Expand Down
17 changes: 9 additions & 8 deletions subworkflows/local/mirna_quant.nf
Original file line number Diff line number Diff line change
Expand Up @@ -25,15 +25,16 @@ include { EDGER_QC } from '../../modules/local/edger_qc/edger_qc.nf'

workflow MIRNA_QUANT {
take:
mature // channel: [ val(meta), fasta file]
hairpin // channel: [ val(meta), fasta file]
gtf // channle: GTF file
reads // channel: [ val(meta), [ reads ] ]
mature // channel: [ val(meta), fasta file]
hairpin // channel: [ val(meta), fasta file]
gtf // channel: GTF file
reads // channel: [ val(meta), [ reads ] ]
mirtrace_species // value : params.mirtrace_species

main:
ch_versions = Channel.empty()

PARSE_MATURE ( mature ).parsed_fasta.set { mirna_parsed }
PARSE_MATURE ( mature, mirtrace_species ).parsed_fasta.set { mirna_parsed }
ch_versions = ch_versions.mix(PARSE_MATURE.out.versions)

FORMAT_MATURE ( mirna_parsed )
Expand All @@ -58,7 +59,7 @@ workflow MIRNA_QUANT {
BAM_STATS_MATURE ( BOWTIE_MAP_MATURE.out.bam, FORMAT_MATURE.out.formatted_fasta )
ch_versions = ch_versions.mix(BAM_STATS_MATURE.out.versions)

PARSE_HAIRPIN ( hairpin ).parsed_fasta.set { hairpin_parsed }
PARSE_HAIRPIN ( hairpin, mirtrace_species ).parsed_fasta.set { hairpin_parsed }
ch_versions = ch_versions.mix(PARSE_HAIRPIN.out.versions)

FORMAT_HAIRPIN ( hairpin_parsed )
Expand Down Expand Up @@ -95,8 +96,8 @@ workflow MIRNA_QUANT {
ch_versions = ch_versions.mix(BOWTIE_MAP_SEQCLUSTER.out.versions)

ch_mirtop_logs = Channel.empty()
if (params.mirtrace_species){
MIRTOP_QUANT ( BOWTIE_MAP_SEQCLUSTER.out.bam.collect{it[1]}, FORMAT_HAIRPIN.out.formatted_fasta.collect{it[1]}, gtf )
if (mirtrace_species){
MIRTOP_QUANT ( BOWTIE_MAP_SEQCLUSTER.out.bam.collect{it[1]}, FORMAT_HAIRPIN.out.formatted_fasta.collect{it[1]}, gtf, mirtrace_species )
ch_mirtop_logs = MIRTOP_QUANT.out.logs
ch_versions = ch_versions.mix(MIRTOP_QUANT.out.versions)

Expand Down
6 changes: 4 additions & 2 deletions subworkflows/local/mirtrace.nf
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,8 @@ include { MIRTRACE_RUN } from '../../modules/local/mirtrace'

workflow MIRTRACE {
take:
reads // channel: [ val(adapterseq), [ val(ids) ], [ path(reads) ] ]
reads // channel: [ val(adapterseq), [ val(ids) ], [ path(reads) ] ]
mirtrace_species // value : params.mirtrace_species

main:

Expand All @@ -20,7 +21,8 @@ workflow MIRTRACE {

MIRTRACE_RUN (
reads,
ch_mirtrace_config
ch_mirtrace_config,
mirtrace_species
)

emit:
Expand Down
51 changes: 28 additions & 23 deletions workflows/smrnaseq.nf
Original file line number Diff line number Diff line change
Expand Up @@ -43,22 +43,25 @@ workflow NFCORE_SMRNASEQ {
take:
ch_input // channel: samplesheet file as specified to --input
ch_samplesheet // channel: sample fastqs parsed from --input
fasta // params.fasta
mirtrace_species // mirtrace_species
bowtie_index // params.bowtie_index
ch_versions // channel: [ path(versions.yml) ]

main:
//Config checks
// Check optional parameters
if (!params.mirgenedb && !params.mirtrace_species) {
if (!params.mirgenedb && !mirtrace_species) {
exit 1, "Reference species for miRTrace is not defined via the --mirtrace_species parameter."
}

// Genome options
def mirna_gtf_from_species = params.mirtrace_species ? (params.mirtrace_species == 'hsa' ? "https://github.com/nf-core/test-datasets/raw/smrnaseq/miRBase/hsa.gff3" : "https://mirbase.org/download/CURRENT/genomes/${params.mirtrace_species}.gff3") : false
def mirna_gtf = params.mirna_gtf ?: mirna_gtf_from_species
mirna_gtf_from_species = mirtrace_species ? "https://mirbase.org/download/CURRENT/genomes/${mirtrace_species}.gff3" : false
mirna_gtf = params.mirna_gtf ?: mirna_gtf_from_species

if (!params.mirgenedb) {
if (params.mature) { reference_mature = file(params.mature, checkIfExists: true) } else { exit 1, "Mature miRNA fasta file not found: ${params.mature}" }
if (params.hairpin) { reference_hairpin = file(params.hairpin, checkIfExists: true) } else { exit 1, "Hairpin miRNA fasta file not found: ${params.hairpin}" }
if (params.mature) { reference_mature = Channel.fromPath(params.mature, checkIfExists: true).map{ it -> [ [id:it.baseName], it ] }.collect() } else { exit 1, "Mature miRNA fasta file not found: ${params.mature}" }
if (params.hairpin) { reference_hairpin = Channel.fromPath(params.hairpin, checkIfExists: true).map{ it -> [ [id:it.baseName], it ] }.collect() } else { exit 1, "Hairpin miRNA fasta file not found: ${params.hairpin}" }
} else {
if (params.mirgenedb_mature) { reference_mature = file(params.mirgenedb_mature, checkIfExists: true) } else { exit 1, "Mature miRNA fasta file not found via --mirgenedb_mature: ${params.mirgenedb_mature}" }
if (params.mirgenedb_hairpin) { reference_hairpin = file(params.mirgenedb_hairpin, checkIfExists: true) } else { exit 1, "Hairpin miRNA fasta file not found via --mirgenedb_hairpin: ${params.mirgenedb_hairpin}" }
Expand Down Expand Up @@ -108,21 +111,21 @@ workflow NFCORE_SMRNASEQ {
)
ch_versions = ch_versions.mix(FASTQ_FASTQC_UMITOOLS_FASTP.out.versions)

ch_fasta = params.fasta ? file(params.fasta): []
ch_fasta = fasta ? Channel.fromPath(fasta, checkIfExists: true): Channel.empty()
ch_reads_for_mirna = FASTQ_FASTQC_UMITOOLS_FASTP.out.reads

// even if bowtie index is specified, there still needs to be a fasta.
// without fasta, no genome analysis.
if(params.fasta) {
if(fasta) {
//Prepare bowtie index, unless specified
//This needs to be done here as the index is used by GENOME_QUANT
if(params.bowtie_index) {
ch_fasta = Channel.fromPath(params.fasta)
if (params.bowtie_index.endsWith(".tar.gz")) {
UNTAR_BOWTIE_INDEX ( [ [], params.bowtie_index ]).files.map { it[1] }.set {ch_bowtie_index}
if(bowtie_index) {
ch_fasta = Channel.fromPath(fasta)
if (bowtie_index.endsWith(".tar.gz")) {
UNTAR_BOWTIE_INDEX ( [ [], bowtie_index ]).files.map { it[1] }.set {ch_bowtie_index}
ch_versions = ch_versions.mix(UNTAR_BOWTIE_INDEX.out.versions)
} else {
Channel.fromPath("${params.bowtie_index}**ebwt", checkIfExists: true).ifEmpty{ error "Bowtie1 index directory not found: ${params.bowtie_index}" }.filter { it != null }.set { ch_bowtie_index }
Channel.fromPath("${bowtie_index}**ebwt", checkIfExists: true).ifEmpty{ error "Bowtie1 index directory not found: ${bowtie_index}" }.filter { it != null }.set { ch_bowtie_index }
}
} else {
INDEX_GENOME ( [ [:], ch_fasta ] )
Expand Down Expand Up @@ -173,16 +176,16 @@ workflow NFCORE_SMRNASEQ {
// Now join the adapter sequence channel with the reads channel
ch_adapter_seq
.join(ch_reads_for_mirna)
.map { meta, adapter_seq, reads -> [adapter_seq, meta.id, reads] }
.groupTuple()
.map { adapter_seq, ids, reads_list -> [adapter_seq, ids, reads_list.flatten()] }
.set { ch_mirtrace_inputs }
.map { meta, adapter_seq, reads -> [adapter_seq, meta.id, reads] }
.groupTuple()
.map { adapter_seq, ids, reads_list -> [adapter_seq, ids, reads_list.flatten()] }
.set { ch_mirtrace_inputs }

//
// SUBWORKFLOW: MIRTRACE
//
if (params.mirtrace_species) {
MIRTRACE(ch_mirtrace_inputs)
if (mirtrace_species) {
MIRTRACE(ch_mirtrace_inputs, mirtrace_species)
ch_versions = ch_versions.mix(MIRTRACE.out.versions)
} else {
log.warn "The parameter --mirtrace_species is absent. MIRTRACE quantification skipped."
Expand Down Expand Up @@ -211,18 +214,20 @@ workflow NFCORE_SMRNASEQ {
}

MIRNA_QUANT (
[ [:], reference_mature],
[ [:], reference_hairpin],
reference_mature,
reference_hairpin,
mirna_gtf,
ch_reads_for_mirna
ch_reads_for_mirna,
mirtrace_species

)
ch_versions = ch_versions.mix(MIRNA_QUANT.out.versions)

//
// GENOME
//
genome_stats = Channel.empty()
if (params.fasta){
if (fasta){
GENOME_QUANT ( ch_bowtie_index, ch_fasta, MIRNA_QUANT.out.unmapped )
genome_stats = GENOME_QUANT.out.stats
ch_versions = ch_versions.mix(GENOME_QUANT.out.versions)
Expand Down Expand Up @@ -306,7 +311,7 @@ workflow NFCORE_SMRNASEQ {
ch_multiqc_files = ch_multiqc_files.mix(MIRNA_QUANT.out.mature_stats.collect({it[1]}).ifEmpty([]))
ch_multiqc_files = ch_multiqc_files.mix(MIRNA_QUANT.out.hairpin_stats.collect({it[1]}).ifEmpty([]))
ch_multiqc_files = ch_multiqc_files.mix(MIRNA_QUANT.out.mirtop_logs.collect().ifEmpty([]))
if (params.mirtrace_species) {
if (mirtrace_species) {
ch_multiqc_files = ch_multiqc_files.mix(MIRTRACE.out.results.collect().ifEmpty([]))
}

Expand Down

0 comments on commit 4adf3d5

Please sign in to comment.