Skip to content

Commit 43a4f37

Browse files
committed
Merge branch 'dev' into seqtk_sample_size_warning
2 parents e55f0e5 + f1a3b8c commit 43a4f37

8 files changed

Lines changed: 1146 additions & 1122 deletions

File tree

CHANGELOG.md

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,10 +39,11 @@ Initial release of nf-core/seqinspector, created with the [nf-core](https://nf-c
3939
### `Fixed`
4040

4141
- [#71](https://github.com/nf-core/seqinspector/pull/71) FASTQSCREEN does not fail when multiple reads are provided.
42+
- [#94](https://github.com/nf-core/seqinspector/issues/94) Go through and validate test data
4243
- [#99](https://github.com/nf-core/seqinspector/pull/99) Fix group reports for paired reads
4344
- [#107](https://github.com/nf-core/seqinspector/pull/107) Put SeqFU-stats section reports together
4445
- [#112](https://github.com/nf-core/seqinspector/pull/112) Making fastq_screen_references value to use parentDir
45-
- [#94] (https://github.com/nf-core/seqinspector/issues/94) Go through and validate test data
46+
- [#121](https://github.com/nf-core/seqinspector/pull/121) Cleanup sample naming for MultiQC report (#105)
4647
- [#162](https://github.com/nf-core/seqinspector/pull/162) Fix bugs in qc_bam and prepare_genome subworkflows and add tests
4748
- [#163](https://github.com/nf-core/seqinspector/pull/163) Run fastqscreen with subsampled data if available
4849

assets/multiqc_config.yml

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,3 +15,22 @@ report_section_order:
1515
export_plots: true
1616

1717
disable_version_detection: true
18+
19+
fn_clean_trim:
20+
- "_screen" # Added by FastqScreen
21+
22+
# Make sample name with indexes a bit prettier
23+
# for SE: "SampleName_01" -> "SampleName #01"
24+
# for PE: "SampleName_01_1" -> "SampleName #01_1"
25+
# and: "SampleName_01_2" -> "SampleName #01_2"
26+
sample_names_replace_regex: True
27+
sample_names_replace:
28+
"(.+)_(\\d{2,}|\\d{2,}_[12])$": "\\1 #\\2"
29+
30+
table_sample_merge:
31+
"Read1":
32+
- type: regex
33+
pattern: "_1$"
34+
"Read2":
35+
- type: regex
36+
pattern: "_2$"

subworkflows/local/utils_nfcore_seqinspector_pipeline/main.nf

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,8 @@ workflow PIPELINE_INITIALISATION {
100100
//
101101
// Create channel from input file provided through params.input
102102
//
103+
nr_samples = Channel.fromList(samplesheetToList(params.input, "${projectDir}/assets/schema_input.json"))
104+
.toList().size()
103105

104106
channel
105107
.fromList(samplesheetToList(params.input, "${projectDir}/assets/schema_input.json"))
@@ -108,7 +110,9 @@ workflow PIPELINE_INITIALISATION {
108110
.map {
109111
meta, fastq_1, fastq_2, idx ->
110112
def tags = meta.tags ? meta.tags.tokenize(":") : []
111-
def updated_meta = meta + [ id:"${meta.sample}_${idx}", tags:tags ]
113+
def pad_positions = [nr_samples.length(), 2].max()
114+
def zero_padded_idx = idx.padLeft(pad_positions, "0")
115+
def updated_meta = meta + [ id:"${meta.sample}_${zero_padded_idx}", tags:tags ]
112116
if (!fastq_2) {
113117
return [
114118
updated_meta.id,

tests/MiSeq.main.nf.test.snap

Lines changed: 100 additions & 100 deletions
Large diffs are not rendered by default.

tests/MiSeq_PairedEnd.main.nf.test.snap

Lines changed: 127 additions & 127 deletions
Large diffs are not rendered by default.

tests/NovaSeq6000.main.nf.test.snap

Lines changed: 281 additions & 281 deletions
Large diffs are not rendered by default.

tests/NovaSeq6000.main_subsample.nf.test.snap

Lines changed: 581 additions & 581 deletions
Large diffs are not rendered by default.

tests/PromethION.main.nf.test.snap

Lines changed: 31 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -17,12 +17,12 @@
1717
},
1818
[
1919
"fastqc",
20-
"fastqc/hg001_1_fastqc.html",
21-
"fastqc/hg001_1_fastqc.zip",
20+
"fastqc/hg001_01_fastqc.html",
21+
"fastqc/hg001_01_fastqc.zip",
2222
"fastqscreen",
23-
"fastqscreen/hg001_1_screen.html",
24-
"fastqscreen/hg001_1_screen.png",
25-
"fastqscreen/hg001_1_screen.txt",
23+
"fastqscreen/hg001_01_screen.html",
24+
"fastqscreen/hg001_01_screen.png",
25+
"fastqscreen/hg001_01_screen.txt",
2626
"multiqc",
2727
"multiqc/global_report",
2828
"multiqc/global_report/multiqc_data",
@@ -47,7 +47,7 @@
4747
"multiqc/global_report/multiqc_data/multiqc_fastq_screen.txt",
4848
"multiqc/global_report/multiqc_data/multiqc_fastqc.txt",
4949
"multiqc/global_report/multiqc_data/multiqc_general_stats.txt",
50-
"multiqc/global_report/multiqc_data/multiqc_seqfu.txt",
50+
"multiqc/global_report/multiqc_data/multiqc_seqfu_mqc.txt",
5151
"multiqc/global_report/multiqc_data/multiqc_software_versions.txt",
5252
"multiqc/global_report/multiqc_data/multiqc_sources.txt",
5353
"multiqc/global_report/multiqc_plots",
@@ -66,7 +66,7 @@
6666
"multiqc/global_report/multiqc_plots/pdf/fastqc_sequence_duplication_levels_plot.pdf",
6767
"multiqc/global_report/multiqc_plots/pdf/fastqc_sequence_length_distribution_plot.pdf",
6868
"multiqc/global_report/multiqc_plots/pdf/fastqc_top_overrepresented_sequences_table.pdf",
69-
"multiqc/global_report/multiqc_plots/pdf/seqfu.pdf",
69+
"multiqc/global_report/multiqc_plots/pdf/seqfu_mqc.pdf",
7070
"multiqc/global_report/multiqc_plots/png",
7171
"multiqc/global_report/multiqc_plots/png/fastq_screen_plot-cnt.png",
7272
"multiqc/global_report/multiqc_plots/png/fastq_screen_plot-pct.png",
@@ -82,7 +82,7 @@
8282
"multiqc/global_report/multiqc_plots/png/fastqc_sequence_duplication_levels_plot.png",
8383
"multiqc/global_report/multiqc_plots/png/fastqc_sequence_length_distribution_plot.png",
8484
"multiqc/global_report/multiqc_plots/png/fastqc_top_overrepresented_sequences_table.png",
85-
"multiqc/global_report/multiqc_plots/png/seqfu.png",
85+
"multiqc/global_report/multiqc_plots/png/seqfu_mqc.png",
8686
"multiqc/global_report/multiqc_plots/svg",
8787
"multiqc/global_report/multiqc_plots/svg/fastq_screen_plot-cnt.svg",
8888
"multiqc/global_report/multiqc_plots/svg/fastq_screen_plot-pct.svg",
@@ -98,46 +98,46 @@
9898
"multiqc/global_report/multiqc_plots/svg/fastqc_sequence_duplication_levels_plot.svg",
9999
"multiqc/global_report/multiqc_plots/svg/fastqc_sequence_length_distribution_plot.svg",
100100
"multiqc/global_report/multiqc_plots/svg/fastqc_top_overrepresented_sequences_table.svg",
101-
"multiqc/global_report/multiqc_plots/svg/seqfu.svg",
101+
"multiqc/global_report/multiqc_plots/svg/seqfu_mqc.svg",
102102
"multiqc/global_report/multiqc_report.html",
103103
"pipeline_info",
104104
"pipeline_info/nf_core_seqinspector_software_mqc_versions.yml",
105105
"samtools_faidx",
106106
"samtools_faidx/genome.fa.fai",
107107
"samtools_faidx/genome.fa.sizes",
108108
"seqfu_stats",
109-
"seqfu_stats/hg001_1_seqfu.tsv",
110-
"seqfu_stats/hg001_1_seqfu_mqc.txt"
109+
"seqfu_stats/hg001_01_seqfu.tsv",
110+
"seqfu_stats/hg001_01_seqfu_mqc.txt"
111111
],
112112
[
113-
"hg001_1_screen.png:md5,b9c58e388f18ad11f4c2e29e9b573a5e",
114-
"hg001_1_screen.txt:md5,8e53ea043d658a130f4b8ca455e2ba9b",
115-
"fastq_screen_plot.txt:md5,3023b86477fecf6d46d8fc60d82cc53a",
116-
"fastqc-status-check-heatmap.txt:md5,825668e94de27356f0a112beb758e416",
117-
"fastqc_adapter_content_plot.txt:md5,1fa991080c20755e5e729a5eeab960e5",
118-
"fastqc_overrepresented_sequences_plot.txt:md5,e810a3d3eba0ba83b122763505f511a7",
119-
"fastqc_per_base_n_content_plot.txt:md5,cbdb64298ff839665e8c8c8e89896e87",
120-
"fastqc_per_base_sequence_quality_plot.txt:md5,4962950bc3ce77169ac510d64cb769c6",
121-
"fastqc_per_sequence_gc_content_plot_Counts.txt:md5,e62273533304be59dab5f13afef93b3e",
122-
"fastqc_per_sequence_gc_content_plot_Percentages.txt:md5,3d49290a15406cb5dac1460c02729f0f",
123-
"fastqc_per_sequence_quality_scores_plot.txt:md5,7cc10d1bc92ca09431a506c38d911228",
124-
"fastqc_sequence_counts_plot.txt:md5,0425d7298c24df6158d5bf7aca1d4190",
125-
"fastqc_sequence_duplication_levels_plot.txt:md5,9111d942c7eed5af0e9ccb8c42db8505",
126-
"fastqc_sequence_length_distribution_plot.txt:md5,04adfcd0125ebcc3e3bb631f1956c812",
113+
"hg001_01_screen.png:md5,b9c58e388f18ad11f4c2e29e9b573a5e",
114+
"hg001_01_screen.txt:md5,8e53ea043d658a130f4b8ca455e2ba9b",
115+
"fastq_screen_plot.txt:md5,f6883339d43a090e86e02fdf3feacbbd",
116+
"fastqc-status-check-heatmap.txt:md5,0ac9450d210de9ab4548378101877c8e",
117+
"fastqc_adapter_content_plot.txt:md5,6e2a760185573c44180ca43081cc7c99",
118+
"fastqc_overrepresented_sequences_plot.txt:md5,251ad51e27e966476911ff4c77c2a893",
119+
"fastqc_per_base_n_content_plot.txt:md5,230b2a0319f3b7490498e8edb47b17bf",
120+
"fastqc_per_base_sequence_quality_plot.txt:md5,4934bce34aec037e1ea590bd69f74781",
121+
"fastqc_per_sequence_gc_content_plot_Counts.txt:md5,028ada8fc060ce4af7476f339c57c50d",
122+
"fastqc_per_sequence_gc_content_plot_Percentages.txt:md5,6bab830c22525c15a6048d8054f685cf",
123+
"fastqc_per_sequence_quality_scores_plot.txt:md5,fd29224ed588e37e1fc85bf7f717e31e",
124+
"fastqc_sequence_counts_plot.txt:md5,cc83b291e21249f3c4e25d34cc898f0f",
125+
"fastqc_sequence_duplication_levels_plot.txt:md5,7b7665c78ca66d3e13b1850701b198dc",
126+
"fastqc_sequence_length_distribution_plot.txt:md5,d7bac93b11316846778b9d550f323371",
127127
"multiqc_citations.txt:md5,5f52d7a0141e4234c6069df9ef575c9a",
128-
"multiqc_fastq_screen.txt:md5,7c5d711e27c53d13c81644a1f2468dba",
129-
"multiqc_fastqc.txt:md5,1a4b472e13cadc770832b0e20d1de7b0",
130-
"multiqc_seqfu.txt:md5,9595d608ff5709f2bdec8cb1016416c0",
128+
"multiqc_fastq_screen.txt:md5,0ab0d1c4c3e3393afdb50ad0e116e394",
129+
"multiqc_fastqc.txt:md5,b71aaffef9767dfe9d83fde0d31a3a1b",
130+
"multiqc_seqfu_mqc.txt:md5,9595d608ff5709f2bdec8cb1016416c0",
131131
"genome.fa.fai:md5,59557cd3a71ca5e0840285b6088ec1d6",
132132
"genome.fa.sizes:md5,f154a58a25ba9c4d386003eaa1bb731b",
133-
"hg001_1_seqfu.tsv:md5,b133752c897afbb4d8721b911fa117d4",
134-
"hg001_1_seqfu_mqc.txt:md5,42e3506b02ceb72a6f05cb174505e722"
133+
"hg001_01_seqfu.tsv:md5,b133752c897afbb4d8721b911fa117d4",
134+
"hg001_01_seqfu_mqc.txt:md5,42e3506b02ceb72a6f05cb174505e722"
135135
]
136136
],
137137
"meta": {
138138
"nf-test": "0.9.3",
139139
"nextflow": "25.10.2"
140140
},
141-
"timestamp": "2025-12-03T11:01:17.46398"
141+
"timestamp": "2025-12-12T10:05:23.380990836"
142142
}
143143
}

0 commit comments

Comments
 (0)