Skip to content

Commit 411a499

Browse files
authored
Merge pull request #486 from atrigila/csvtk_replace
Replace `CSVTK_JOIN` to improve processing in large amount of files
2 parents c06b188 + eab8687 commit 411a499

19 files changed

+187
-36
lines changed

CHANGELOG.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
77

88
- [[#481]](https://github.com/nf-core/smrnaseq/pull/481) - Fix [MIRTOP_STATS IndexError](https://github.com/nf-core/smrnaseq/issues/477) - Fix mirtop process execution when mirgenedb is used.
99
- [[#482]](https://github.com/nf-core/smrnaseq/pull/482) - Update documentation regarding MirgeneDB input files.
10+
- [[#486]](https://github.com/nf-core/smrnaseq/pull/486) - Replace `CSVTK_JOIN` to improve processing in large amount of files.
1011

1112
## v2.4.0 - 2024-10-14 - Navy Iron Boxer
1213

bin/pivot_longer.R

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
#!/usr/bin/env Rscript
2+
3+
library(optparse)
4+
library(tidyr)
5+
library(vroom)
6+
7+
option_list <- list(
8+
make_option(c("--input"), type = "character", help = "Input TSV file", metavar = "character"),
9+
make_option(c("--output"), type = "character", help = "Output CSV file", metavar = "character")
10+
)
11+
12+
opt_parser <- OptionParser(option_list = option_list)
13+
opt <- parse_args(opt_parser)
14+
15+
# Read CSV with vroom
16+
data <- vroom::vroom(opt$input, delim = "\t", col_types = c(.default = "c"))
17+
18+
last_col <- names(data)[ncol(data)]
19+
20+
# Convert from wide to long format
21+
long_data <- data %>%
22+
pivot_longer(
23+
cols = last_col,
24+
names_to = "Sample_ID",
25+
values_to = "Counts"
26+
)
27+
28+
vroom_write(long_data, opt$output, delim = ",")
29+

bin/pivot_wider.R

Lines changed: 32 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
#!/usr/bin/env Rscript
2+
3+
library(optparse)
4+
library(tidyr)
5+
library(vroom)
6+
library(dplyr)
7+
8+
option_list <- list(
9+
make_option(c("--input"), type = "character", help = "Input CSV file in long format", metavar = "character"),
10+
make_option(c("--output"), type = "character", help = "Output CSV file in wide format", metavar = "character")
11+
)
12+
13+
opt_parser <- OptionParser(option_list = option_list)
14+
opt <- parse_args(opt_parser)
15+
16+
# Read CSV with vroom
17+
long_data <- vroom::vroom(opt$input, delim = ",",
18+
col_types = c(
19+
Counts = "d",
20+
.default = "c"
21+
))
22+
23+
# Transform to wide format
24+
wide_data <- long_data %>%
25+
pivot_wider(
26+
names_from = Sample_ID,
27+
values_from = Counts,
28+
values_fill = 0
29+
)
30+
31+
# Export wide format
32+
vroom_write(wide_data, opt$output, delim = "\t")

conf/modules.config

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -468,9 +468,11 @@ process {
468468
]
469469
}
470470

471-
withName: 'NFCORE_SMRNASEQ:MIRNA_QUANT:CSVTK_JOIN' {
472-
ext.args = "--fields 'UID,Read,miRNA,Variant,iso_5p,iso_3p,iso_add3p,iso_snp,iso_5p_nt,iso_3p_nt,iso_add3p_nt,iso_snp_nt' --tabs --outer-join --na \"0\" --out-delimiter \"\t\""
473-
ext.prefix = "joined_samples_mirtop"
471+
withName: 'NFCORE_SMRNASEQ:MIRNA_QUANT:PIVOT_LONGER' {
472+
publishDir = [ enabled: false ]
473+
}
474+
475+
withName: 'NFCORE_SMRNASEQ:MIRNA_QUANT:PIVOT_WIDER' {
474476
publishDir = [
475477
path: { "${params.outdir}/mirna_quant/mirtop" },
476478
mode: params.publish_dir_mode,
Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
channels:
2+
- conda-forge
3+
dependencies:
4+
- conda-forge::r-optparse
5+
- conda-forge::r-tidyverse

modules/local/pivot/longer/main.nf

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
process PIVOT_LONGER {
2+
tag"$meta.id"
3+
label 'process_single'
4+
5+
conda "${moduleDir}/environment.yml"
6+
container "community.wave.seqera.io/library/r-optparse_r-tidyverse_r-vroom:3cbb224fea84a0e1"
7+
8+
input:
9+
tuple val(meta), path(tsv)
10+
11+
output:
12+
tuple val(meta), path("*_long.csv") , emit: csv
13+
path "versions.yml" , emit: versions
14+
15+
script:
16+
"""
17+
pivot_longer.R \\
18+
--input ${tsv} \\
19+
--output ${meta.id}_long.csv
20+
21+
cat <<-END_VERSIONS > versions.yml
22+
"${task.process}":
23+
r-base: \$(echo \$(R --version 2>&1) | sed 's/^.*R version //; s/ .*\$//')
24+
tidyr: \$(Rscript -e "library(tidyr); cat(as.character(packageVersion('tidyr')))")
25+
optparse: \$(Rscript -e "library(optparse); cat(as.character(packageVersion('optparse')))")
26+
END_VERSIONS
27+
"""
28+
29+
}
Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
channels:
2+
- conda-forge
3+
dependencies:
4+
- conda-forge::r-optparse
5+
- conda-forge::r-tidyverse

modules/local/pivot/wider/main.nf

Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,35 @@
1+
process PIVOT_WIDER {
2+
tag"$meta.id"
3+
label 'process_high'
4+
5+
conda "${moduleDir}/environment.yml"
6+
container "community.wave.seqera.io/library/r-optparse_r-tidyverse_r-vroom:3cbb224fea84a0e1"
7+
8+
input:
9+
tuple val(meta), path(csvs)
10+
11+
output:
12+
tuple val(meta), path("*joined_samples_mirtop.tsv") , emit: csv
13+
path "versions.yml" , emit: versions
14+
15+
script:
16+
"""
17+
awk 'NR == 1 || FNR > 1' ${csvs.join(' ')} > final_long_results_temp.csv
18+
19+
pivot_wider.R \\
20+
--input final_long_results_temp.csv \\
21+
--output ${meta.id}_concatenated_temp.csv
22+
23+
sort -t\$'\t' -k1,1 ${meta.id}_concatenated_temp.csv > joined_samples_mirtop.tsv
24+
25+
cat <<-END_VERSIONS > versions.yml
26+
"${task.process}":
27+
r-base: \$(echo \$(R --version 2>&1) | sed 's/^.*R version //; s/ .*\$//')
28+
tidyr: \$(Rscript -e "library(tidyr); cat(as.character(packageVersion('tidyr')))")
29+
dplyr: \$(Rscript -e "library(dplyr); cat(as.character(packageVersion('dplyr')))")
30+
optparse: \$(Rscript -e "library(optparse); cat(as.character(packageVersion('optparse')))")
31+
vroom: \$(Rscript -e "library(vroom); cat(as.character(packageVersion('vroom')))")
32+
END_VERSIONS
33+
"""
34+
35+
}

subworkflows/local/mirna_quant.nf

Lines changed: 16 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,9 @@ include { EDGER_QC } from '../../modules/local/edger_qc/main'
2424
include { BAM_STATS_MIRNA_MIRTOP } from '../../subworkflows/nf-core/bam_stats_mirna_mirtop/main'
2525
include { CSVTK_JOIN } from '../../modules/nf-core/csvtk/join/main'
2626

27+
include { PIVOT_LONGER } from '../../modules/local/pivot/longer/main'
28+
include { PIVOT_WIDER } from '../../modules/local/pivot/wider/main'
29+
2730
workflow MIRNA_QUANT {
2831
take:
2932
ch_reference_mature // channel: [ val(meta), fasta file]
@@ -105,10 +108,20 @@ workflow MIRNA_QUANT {
105108
.collect{it[1]}
106109
.map{it -> return [[id:"TSVs"], it]}
107110

108-
CSVTK_JOIN ( ch_tsvs )
109-
ch_versions = ch_versions.mix(CSVTK_JOIN.out.versions)
111+
PIVOT_LONGER( BAM_STATS_MIRNA_MIRTOP.out.counts )
112+
ch_versions = ch_versions.mix(PIVOT_LONGER.out.versions)
113+
114+
ch_long_files = PIVOT_LONGER.out.csv
115+
.map { meta, file -> file }
116+
.collect()
117+
.map { files ->
118+
return [[id: "Long_Files"], files]
119+
}
120+
121+
PIVOT_WIDER( ch_long_files )
122+
ch_versions = ch_versions.mix(PIVOT_WIDER.out.versions)
110123

111-
DATATABLE_MERGE ( CSVTK_JOIN.out.csv )
124+
DATATABLE_MERGE ( PIVOT_WIDER.out.csv )
112125
ch_versions = ch_versions.mix(DATATABLE_MERGE.out.versions)
113126

114127
ch_reads_genome = BOWTIE_MAP_HAIRPIN.out.fastq

tests/test_contamination_tech_reps.nf.test

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ nextflow_pipeline {
2020
assertAll(
2121
{ assert workflow.success },
2222
{ assert snapshot(UTILS.removeNextflowVersion("$outputDir")).match("software_versions") },
23-
{ assert workflow.trace.succeeded().size() == 100 },
23+
{ assert workflow.trace.succeeded().size() == 103 },
2424

2525
{ assert snapshot(
2626
path("$outputDir/contaminant_filter/filter/Clone1_N1_trimmed.contamination_mqc.yaml").exists(), //TODO see if we can make these deterministic or why they are non-deterministic

tests/test_contamination_tech_reps.nf.test.snap

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -34,13 +34,13 @@
3434
},
3535
"software_versions": {
3636
"content": [
37-
"{BLAT_CDNA={blat=36}, BLAT_NCRNA={blat=36}, BOWTIE2_ALIGN_CDNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE2_ALIGN_NCRNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE2_ALIGN_TRNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, CAT_FASTQ={cat=8.3}, CSVTK_JOIN={csvtk=0.30.0}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FILTER_STATS={BusyBox=1.32.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, GAWK_CDNA={gawk=5.3.0}, GAWK_NCRNA={gawk=5.3.0}, INDEX_CDNA={bowtie2=2.5.2}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, INDEX_NCRNA={bowtie2=2.5.2}, INDEX_TRNA={bowtie2=2.5.2}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, SEQKIT_GREP_CDNA={seqkit=2.8.0}, SEQKIT_GREP_NCRNA={seqkit=2.8.0}, STATS_GAWK_CDNA={gawk=5.3.0}, STATS_GAWK_NCRNA={gawk=5.3.0}, STATS_GAWK_TRNA={gawk=5.3.0}, Workflow={nf-core/smrnaseq=v2.4.0}}"
37+
"{BLAT_CDNA={blat=36}, BLAT_NCRNA={blat=36}, BOWTIE2_ALIGN_CDNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE2_ALIGN_NCRNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE2_ALIGN_TRNA={bowtie2=2.5.2, samtools=1.18, pigz=2.6}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, CAT_FASTQ={cat=8.3}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FILTER_STATS={BusyBox=1.32.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, GAWK_CDNA={gawk=5.3.0}, GAWK_NCRNA={gawk=5.3.0}, INDEX_CDNA={bowtie2=2.5.2}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, INDEX_NCRNA={bowtie2=2.5.2}, INDEX_TRNA={bowtie2=2.5.2}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, PIVOT_LONGER={r-base=4.4.2, tidyr=1.3.1, optparse=1.7.5}, PIVOT_WIDER={r-base=4.4.2, tidyr=1.3.1, dplyr=1.1.4, optparse=1.7.5, vroom=1.6.5}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, SEQKIT_GREP_CDNA={seqkit=2.8.0}, SEQKIT_GREP_NCRNA={seqkit=2.8.0}, STATS_GAWK_CDNA={gawk=5.3.0}, STATS_GAWK_NCRNA={gawk=5.3.0}, STATS_GAWK_TRNA={gawk=5.3.0}, Workflow={nf-core/smrnaseq=v2.4.0}}"
3838
],
3939
"meta": {
4040
"nf-test": "0.9.0",
41-
"nextflow": "24.04.4"
41+
"nextflow": "24.10.2"
4242
},
43-
"timestamp": "2024-10-08T23:16:26.853242481"
43+
"timestamp": "2024-12-10T00:29:32.052341"
4444
},
4545
"mirna_quant_bam": {
4646
"content": [
@@ -65,9 +65,9 @@
6565
],
6666
"meta": {
6767
"nf-test": "0.9.0",
68-
"nextflow": "24.04.4"
68+
"nextflow": "24.10.2"
6969
},
70-
"timestamp": "2024-10-01T20:06:04.974546479"
70+
"timestamp": "2024-12-10T00:29:32.116301175"
7171
},
7272
"mirna_quant_edger_qc": {
7373
"content": [
@@ -90,9 +90,9 @@
9090
],
9191
"meta": {
9292
"nf-test": "0.9.0",
93-
"nextflow": "24.04.4"
93+
"nextflow": "24.10.2"
9494
},
95-
"timestamp": "2024-10-01T20:06:05.025175321"
95+
"timestamp": "2024-12-10T00:29:32.164075991"
9696
},
9797
"contaminant_filter_filter": {
9898
"content": [
@@ -113,8 +113,8 @@
113113
],
114114
"meta": {
115115
"nf-test": "0.9.0",
116-
"nextflow": "24.04.4"
116+
"nextflow": "24.10.2"
117117
},
118-
"timestamp": "2024-10-01T20:06:05.070939602"
118+
"timestamp": "2024-12-10T00:29:32.208602197"
119119
}
120-
}
120+
}

tests/test_mirgenedb.nf.test

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ nextflow_pipeline {
1919
assertAll(
2020
{ assert workflow.success },
2121
{ assert snapshot(UTILS.removeNextflowVersion("$outputDir")).match("software_versions") },
22-
{ assert workflow.trace.succeeded().size() == 104 },
22+
{ assert workflow.trace.succeeded().size() == 107 },
2323
{ assert workflow.trace.failed().size() == 1 },
2424

2525
{ assert snapshot(

tests/test_mirgenedb.nf.test.snap

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -19,13 +19,13 @@
1919
},
2020
"software_versions": {
2121
"content": [
22-
"{BOWTIE_MAP_GENOME={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, CSVTK_JOIN={csvtk=0.30.0}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FASTQC_RAW={fastqc=0.12.1}, FASTQC_TRIM={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRDEEP2_MAPPER={mirdeep2=2.0.1}, MIRDEEP2_MIRDEEP2={mirdeep2=2.0.1}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, SEQKIT_FQ2FA={seqkit=2.8.0}, SEQKIT_REPLACE={seqkit=2.8.0}, Workflow={nf-core/smrnaseq=v2.4.0}}"
22+
"{BOWTIE_MAP_GENOME={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FASTQC_RAW={fastqc=0.12.1}, FASTQC_TRIM={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRDEEP2_MAPPER={mirdeep2=2.0.1}, MIRDEEP2_MIRDEEP2={mirdeep2=2.0.1}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, PIVOT_LONGER={r-base=4.4.2, tidyr=1.3.1, optparse=1.7.5}, PIVOT_WIDER={r-base=4.4.2, tidyr=1.3.1, dplyr=1.1.4, optparse=1.7.5, vroom=1.6.5}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, SEQKIT_FQ2FA={seqkit=2.8.0}, SEQKIT_REPLACE={seqkit=2.8.0}, Workflow={nf-core/smrnaseq=v2.4.0}}"
2323
],
2424
"meta": {
2525
"nf-test": "0.9.0",
26-
"nextflow": "24.10.0"
26+
"nextflow": "24.10.2"
2727
},
28-
"timestamp": "2024-11-11T13:44:14.583324793"
28+
"timestamp": "2024-12-10T00:35:18.448206326"
2929
},
3030
"mirna_quant_bam": {
3131
"content": [

tests/test_nextflex.nf.test

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ nextflow_pipeline {
1919
assertAll(
2020
{ assert workflow.success },
2121
{ assert snapshot(UTILS.removeNextflowVersion("$outputDir")).match("software_versions") },
22-
{ assert workflow.trace.succeeded().size() == 79 },
22+
{ assert workflow.trace.succeeded().size() == 82 },
2323

2424
{ assert snapshot(
2525
path("$outputDir/mirna_quant/bam/mature/sample2_mature.sorted.idxstats"),

tests/test_nextflex.nf.test.snap

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -34,13 +34,13 @@
3434
},
3535
"software_versions": {
3636
"content": [
37-
"{BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, CSVTK_JOIN={csvtk=0.30.0}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FASTQC_RAW={fastqc=0.12.1}, FASTQC_TRIM={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, Workflow={nf-core/smrnaseq=v2.4.0}}"
37+
"{BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, DATATABLE_MERGE={r-base=3.6.2}, FASTP={fastp=0.23.4}, FASTQC_RAW={fastqc=0.12.1}, FASTQC_TRIM={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, PIVOT_LONGER={r-base=4.4.2, tidyr=1.3.1, optparse=1.7.5}, PIVOT_WIDER={r-base=4.4.2, tidyr=1.3.1, dplyr=1.1.4, optparse=1.7.5, vroom=1.6.5}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, Workflow={nf-core/smrnaseq=v2.4.0}}"
3838
],
3939
"meta": {
4040
"nf-test": "0.9.0",
41-
"nextflow": "24.04.4"
41+
"nextflow": "24.10.2"
4242
},
43-
"timestamp": "2024-10-08T23:25:57.880948228"
43+
"timestamp": "2024-12-10T00:37:47.333537716"
4444
},
4545
"mirna_quant_bam": {
4646
"content": [
@@ -142,4 +142,4 @@
142142
},
143143
"timestamp": "2024-09-20T17:11:24.369706104"
144144
}
145-
}
145+
}

tests/test_skipfastp.nf.test

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ nextflow_pipeline {
1919
assertAll(
2020
{ assert workflow.success },
2121
{ assert snapshot(UTILS.removeNextflowVersion("$outputDir")).match("software_versions") },
22-
{ assert workflow.trace.succeeded().size() == 64 },
22+
{ assert workflow.trace.succeeded().size() == 66 },
2323

2424
{ assert snapshot(
2525
path("$outputDir/mirna_quant/mirtop/joined_samples_mirtop.tsv").exists(),

tests/test_skipfastp.nf.test.snap

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -41,13 +41,13 @@
4141
},
4242
"software_versions": {
4343
"content": [
44-
"{BOWTIE_MAP_GENOME={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, CSVTK_JOIN={csvtk=0.30.0}, DATATABLE_MERGE={r-base=3.6.2}, FASTQC_RAW={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, Workflow={nf-core/smrnaseq=v2.4.0}}"
44+
"{BOWTIE_MAP_GENOME={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_HAIRPIN={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_MATURE={bowtie=1.3.0, samtools=1.16.1}, BOWTIE_MAP_SEQCLUSTER={bowtie=1.3.0, samtools=1.16.1}, DATATABLE_MERGE={r-base=3.6.2}, FASTQC_RAW={fastqc=0.12.1}, FORMAT_HAIRPIN={fastx_toolkit=0.0.14}, FORMAT_MATURE={fastx_toolkit=0.0.14}, INDEX_HAIRPIN={bowtie=1.3.0}, INDEX_MATURE={bowtie=1.3.0}, MIRTOP_COUNTS={mirtop=0.4.28}, MIRTOP_EXPORT={mirtop=0.4.28}, MIRTOP_GFF={mirtop=0.4.28}, MIRTOP_STATS={mirtop=0.4.28}, MIRTRACE_QC={mirtrace=1.0.1}, PARSE_HAIRPIN={seqkit=2.6.1}, PARSE_MATURE={seqkit=2.6.1}, PIVOT_LONGER={r-base=4.4.2, tidyr=1.3.1, optparse=1.7.5}, PIVOT_WIDER={r-base=4.4.2, tidyr=1.3.1, dplyr=1.1.4, optparse=1.7.5, vroom=1.6.5}, SAMTOOLS_FLAGSTAT={samtools=1.21}, SAMTOOLS_IDXSTATS={samtools=1.21}, SAMTOOLS_INDEX={samtools=1.21}, SAMTOOLS_SORT={samtools=1.21}, SAMTOOLS_STATS={samtools=1.21}, SEQCLUSTER_COLLAPSE={seqcluster=1.2.9}, Workflow={nf-core/smrnaseq=v2.4.0}}"
4545
],
4646
"meta": {
4747
"nf-test": "0.9.0",
48-
"nextflow": "24.04.4"
48+
"nextflow": "24.10.2"
4949
},
50-
"timestamp": "2024-10-08T23:28:49.241105443"
50+
"timestamp": "2024-12-10T00:40:10.829696529"
5151
},
5252
"mirna_quant_bam": {
5353
"content": [
@@ -142,4 +142,4 @@
142142
},
143143
"timestamp": "2024-10-01T20:19:25.557700049"
144144
}
145-
}
145+
}

0 commit comments

Comments
 (0)