Skip to content

Commit b0aa23a

Browse files
committed
toying with some nf-schema functionality, making small additions, removing dangling subworkflows
1 parent 9e2a589 commit b0aa23a

28 files changed

+164083
-924
lines changed

CITATIONS.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@
3636
3737
- [alfred](https://www.gear-genomics.com/docs/alfred/)
3838

39-
> Rausch, T., Fritz, M.H., Korbel, J.O. and Benes, V. Alfred: interactive multi-sample BAM alignment statistics, feature counting and feature annotation for long- and short-read sequencing. Bioinformatics. 2019 Jul 15;35(14):2489-2491. https://doi.org/10.1093/bioinformatics/bty1007
39+
> Rausch, T., Fritz, M.H., Korbel, J.O. and Benes, V. Alfred: interactive multi-sample BAM alignment statistics, feature counting and feature annotation for long- and short-read sequencing. Bioinformatics. 2019 Jul 15;35(14):2489-2491. https://doi.org/10.1093/bioinformatics/bty1007
4040
4141
- [ngs-bits](https://github.com/imgag/ngs-bits/tree/master)
4242

README.md

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,8 @@ Nanopore Technologies (ONT) libraries. It is recommended to provide raw FASTQ
2121
files to the pipeline, however, it will also accept already mapped sequencing
2222
reads in BAM format. These are provided to the samplesheet as input.
2323

24+
The general flow of the pipeline is as follows;
25+
2426
<!-- nf-core: Include a figure that guides the user through the major workflow steps. Many nf-core
2527
workflows use the "tube map" design for that. See https://nf-co.re/docs/contributing/design_guidelines#examples for examples. -->
2628

@@ -60,7 +62,7 @@ CONTROL1,2,data/long_reads_2.fastq.gz
6062
```
6163

6264
Each row represents a fastq file. Replicate refers to a technical replicate, biological replicates should be named uniquely. Be sure to pay attention to sample naming, in
63-
order to avoid duplication and file overwriting.
65+
order to avoid duplication and file overwriting. The replicate field is optional, the other two are mandatory.
6466

6567
The basic reference files required to run the pipeline are 1) a genome in fasta format, and 2) a transcriptome annotation in gtf format. It is advised that the files be gzipped, but it is fine if they are not.
6668

assets/email_template.html

Lines changed: 104 additions & 42 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

conf/test.config

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313
params {
1414
config_profile_name = 'Test profile'
1515
config_profile_description = 'Minimal test dataset to check pipeline function'
16+
config_profile_url = "https://github.com/number-25/LongTranscriptomics/blob/dev/conf/test.config"
1617

1718
// Limit resources so that this can run on GitHub Actions
1819
max_cpus = 2
@@ -44,12 +45,12 @@ params {
4445
skip_bam_qc = false
4546
skip_nanoq = false
4647
skip_sequali = false
47-
skip_alredy = false
48+
skip_alfred = false
4849
skip_cramino = false
4950
skip_samtools_flagstat = false
5051
skip_ngs_bits = true
5152
ngs_bits_skip_contamination = true // default: [false]
52-
ngs_bits_build = 'non_human' // options: [hg38, hg19, non_human]
53+
ngs_bits_build = 'hg38' // options: [hg38, hg19, non_human]
5354
cramino_min_length = 0 // minimum re
5455
skip_jaccard = true
5556
skip_flair = true
@@ -67,22 +68,21 @@ params {
6768
// TRANSCRIPT QUANTIFICATION
6869
skip_transcript_quantification = false
6970
skip_oarfish = false
70-
skip_transigner = false
7171
skip_sqanti_all = true
7272
skip_gffcompare = false
7373
extra_gffcompare_options = null
7474
skip_sqanti_qc = true
7575
sqanti_qc_reference = 'human'
7676
sqanti_qc_cage = true
77-
sqanti_qc_cage_path = '/path/to/cage'
77+
sqanti_qc_cage_path = null
7878
sqanti_qc_polyA_sites = true
79-
sqanti_qc_polyA_sites_path = 'path/to/polyA'
79+
sqanti_qc_polyA_sites_path = null
8080
sqanti_qc_polyA_motif = true
81-
sqanti_qc_polyA_motif_path = 'path/to/polyA/path'
81+
sqanti_qc_polyA_motif_path = null
8282
sqanti_qc_intron_junctions = true
83-
sqanti_qc_intron_path = 'path/to/intro/path'
83+
sqanti_qc_intron_path = null
8484
extra_sqanti_qc_options = null
85-
85+
help = false
8686
}
8787

8888
includeConfig "../modules/local/isoquant/isoquant/test_nextflow.config"

conf/test_full.config

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -66,7 +66,6 @@ params {
6666
// TRANSCRIPT QUANTIFICATION
6767
skip_transcript_quantification = false
6868
skip_oarfish = false
69-
skip_transigner = false
7069
// TRANSCRIPTOME ASSESSMENT
7170
skip_gffcompare = false
7271
extra_gffcompare_options = null
@@ -82,4 +81,5 @@ params {
8281
sqanti_qc_intron_junctions = false
8382
sqanti_qc_intron_path = null
8483
extra_sqanti_qc_options = null
84+
help = false
8585
}

docs/usage.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -24,11 +24,11 @@ CONTROL1,1,data/long_reads_1.fastq.gz
2424
CONTROL1,2,data/long_reads_2.fastq.gz
2525
```
2626

27-
| Column | Description |
28-
| ------------------------- | ------------------------------------------------------------------------ |
29-
| `sample` | Sample name. |
30-
| `replicate` | Technical replicate number |
31-
| `read_path` | Full path to fastq reads. |
27+
| Column | Description |
28+
| ----------- | -------------------------- |
29+
| `sample` | Sample name. |
30+
| `replicate` | Technical replicate number |
31+
| `read_path` | Full path to fastq reads. |
3232

3333
An [example samplesheet](../assets/samplesheet.csv) has been provided with the pipeline.
3434

main.nf

Lines changed: 17 additions & 64 deletions
Original file line numberDiff line numberDiff line change
@@ -10,72 +10,37 @@
1010

1111
nextflow.enable.dsl = 2
1212

13-
/*
14-
========================================================================================
15-
VALIDATE & PRINT PARAMETER SUMMARY
16-
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
17-
*/
18-
19-
//WorkflowMain.initialise(workflow, params, log)
20-
21-
/*
22-
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
23-
IMPORT FUNCTIONS / MODULES / SUBWORKFLOWS / WORKFLOWS
24-
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
25-
*/
26-
27-
//include { DIRECTRNA } from './workflows/directrna'
28-
//include { PREPARE_REFERENCE } from './subworkflows/local/prepare_reference'
29-
//include { PIPELINE_INITIALISATION } from 'subworkflows/local/utils_nfcore_directrna_pipeline'
30-
//include { PIPELINE_COMPLETION } from 'subworkflows/local/utils_nfcore_directrna_pipeline'
31-
//include { getGenomeAttribute } from './subworkflows/local/utils_nfcore_directrna_pipeline'
32-
33-
/*
34-
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
35-
GENOME PARAMETER VALUES
36-
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
37-
*/
38-
39-
//nf-core: Remove this line if you don't need a FASTA file
40-
// This is an example of how to use getGenomeAttribute() to fetch parameters
41-
// from igenomes.config using `--genome`
42-
//params.genome_fasta = getGenomeAttribute('fasta')
43-
44-
//
45-
// SUBWORKFLOW: Prepare reference genome files
46-
//
47-
//PREPARE_REFERENCE
48-
49-
5013
/*
5114
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
5215
NAMED WORKFLOWS FOR PIPELINE
5316
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
5417
*/
5518

56-
include { DIRECTRNA } from './workflows/directrna'
19+
include { DIRECTRNA } from './workflows/directrna'
20+
include { validateParameters } from 'plugin/nf-schema'
21+
include { paramsSummaryLog } from 'plugin/nf-schema'
5722

58-
//
59-
// WORKFLOW: Run main analysis pipeline depending on type of input
60-
//
6123
workflow{
62-
DIRECTRNA ()
63-
//samplesheet
64-
}
65-
//take:
66-
//samplesheet // channel: samplesheet read in from --input
67-
68-
//main:
6924

7025
//
71-
// WORKFLOW: Run pipeline
26+
// nf-scheme validations
7227
//
7328

29+
validateParameters()
30+
log.info paramsSummaryLog(workflow)
31+
32+
if (params.help) {
33+
log.info paramsHelp(
34+
beforeText: "Welcome to LongTranscriptomics, I see you are seeking help.",
35+
afterText: "Farewell, hopefully this was helpful.",
36+
command: "nextflow run . -profile <profile> --outdir <outdir>",
37+
)
38+
exit 0
39+
}
7440

75-
//emit:
76-
//multiqc_report = DIRECTRNA.out.multiqc_report // channel: /path/to/multiqc_report.html
7741

78-
//}
42+
DIRECTRNA ()
43+
}
7944
/*
8045
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
8146
RUN MAIN WORKFLOW
@@ -98,18 +63,6 @@ workflow {
9863
params.outdir,
9964
params.input
10065
)
101-
102-
//
103-
// WORKFLOW: Run main workflow
104-
//
105-
//MEDGEN_DIRECTRNA (
106-
// PIPELINE_INITIALISATION.out.samplesheet
107-
)
108-
109-
//
110-
// SUBWORKFLOW: Run completion tasks
111-
//
112-
11366
PIPELINE_COMPLETION (
11467
params.email,
11568
params.email_on_fail,

0 commit comments

Comments
 (0)