forked from nf-core/circrna
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathnextflow_schema.json
668 lines (668 loc) · 41 KB
/
nextflow_schema.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
{
"$schema": "http://json-schema.org/draft-07/schema",
"$id": "https://raw.githubusercontent.com/nf-core/circrna/master/nextflow_schema.json",
"title": "nf-core/circrna pipeline parameters",
"description": "circRNA quantification, differential expression analysis and miRNA target prediction of RNA-Seq data",
"type": "object",
"definitions": {
"input_output_options": {
"title": "Input/output options",
"type": "object",
"fa_icon": "fas fa-terminal",
"description": "Define where the pipeline should find input data and write output data.",
"required": [
"input",
"input_type",
"outdir"
],
"properties": {
"input": {
"type": "string",
"fa_icon": "fas fa-dna",
"description": "Path to directory containing FASTQ/BAM files or a CSV file containing the absolute path to FASTQ/BAM files.",
"help_text": "There are two ways to supply input data to nf-core/circrna:\n\n1. Provide the path to the directory containing FASTQ or BAM files, with the appropriate wildcard glob pattern *e.g:*\n```bash\n--input \"/data/*_r{1,2}.fastq.gz\"\n```\n2. Provide a CSV file containing the absolute paths to FASTQ or BAM files *e.g:*\n\n| Sample_ID | Read1 | Read2 | Bam |\n|------------- |------------------------------- |------------------------------- |----- |\n| control_rep1 | /data/control_rep1_r1.fastq.gz | /data/control_rep1_r2.fastq.gz | NA |\n| control_rep2 | /data/control_rep2_r1.fastq.gz | /data/control_rep2_r2.fastq.gz | NA |\n| control_rep3 | /data/control_rep3_r1.fastq.gz | /data/control_rep3_r2.fastq.gz | NA |\n| lung_rep1 | /data/lung_rep1_r1.fastq.gz | /data/lung_rep1_r2.fastq.gz | NA |\n| lung_rep2 | /data/lung_rep2_r1.fastq.gz | /data/lung_rep2_r2.fastq.gz | NA |\n| lung_rep3 | /data/lung_rep3_r1.fastq.gz | /data/lung_rep3_r2.fastq.gz | NA |\n| melanoma_rep1 | /data/melanoma_rep1_r1.fastq.gz | /data/melanoma_rep1_r2.fastq.gz | NA |\n| melanoma_rep2 | /data/melanoma_rep2_r1.fastq.gz | /data/melanoma_rep2_r2.fastq.gz | NA |\n| melanoma_rep3 | /data/melanoma_rep3_r1.fastq.gz | /data/melanoma_rep3_r2.fastq.gz | NA |\n\n When supplying BAM files to the CSV file, set Read1 & Read2 columns to 'NA'."
},
"input_type": {
"type": "string",
"fa_icon": "fas fa-dna",
"description": "Input data type, 'fastq' or 'bam'.",
"help_text": "If the user wishes to save the converted raw FASTQ files, set `--save_bamtofastq true`",
"enum": [
"fastq",
"bam"
]
},
"outdir": {
"type": "string",
"description": "The output directory where the results will be saved.",
"default": "./results",
"fa_icon": "fas fa-folder-open"
},
"save_bamtofastq": {
"type": "boolean",
"description": "Save outputs from Picard SamToFastq conversion (i.e raw Fastq files).",
"fa_icon": "fas fa-save",
"default": false,
"hidden": true
},
"phenotype": {
"type": "string",
"description": "Phenotype CSV file specifying the experimental design for DESeq2.",
"fa_icon": "far fa-file-alt",
"help_text": "The response variable containing the phenotype of primary interest in the experiment must have the column name condition. An example phenotype file is given below:\n\n| Sample_ID | condition | replicates |\n|---------|-----------|------------|\n| control_rep1 | control | 1 |\n| control_rep2 | control | 2 |\n| control_rep3 | control | 3 |\n| lung_rep1 | lung | 1 |\n| lung_rep2 | lung | 2 |\n| lung_rep3 | lung | 3 |\n| melanoma_rep1 | melanoma | 1 |\n| melanoma_rep2 | melanoma | 2 |\n| melanoma_rep3 | melanoma | 3 |\n\nThis will produce the DESeq2 design formula '~ replicates + condition' i.e all columns not named condition will be controlled for in the linear mixed model.",
"pattern": "\\.csv$"
}
}
},
"pipeline_options": {
"title": "Pipeline Options",
"type": "object",
"fa_icon": "fas fa-terminal",
"description": "Options for circRNA, miRNA predictions",
"help_text": "Documentation for selecting circRNA quantification tools, analysis modules, outputs etc.",
"required": [
"module",
"tool"
],
"properties": {
"tool": {
"type": "string",
"fa_icon": "fas fa-wrench",
"description": "Comma separated list of circRNA quantification tools to use. Supported tools: ciriquant, circexplorer2, find_circ, circrna_finder, mapsplice, dcc, segemehl",
"help_text": "Select one or a combination of circRNA quantification tools for the pipeline e.g:\n```bash\n--tool 'circexplorer2, ciriquant, find_circ'\n```\n\n> N.B: Selecting more than one circRNA quantification tool will trigger the circRNA filtering parameter --tool_filter",
"default": "circexplorer2"
},
"module": {
"type": "string",
"fa_icon": "fas fa-sliders-h",
"description": "Comma separated list of modules to run: 'circrna_discovery', 'mirna_prediction' & 'differential_expression'.",
"mandatory": "circrna_discovery",
"help_text": "The 'circrna_discovery' module is mandatory. After circRNA quantification, the user can select 'mirna_prediction', 'differential_expression' or both to deploy additional analyses e.g:\n\n```bash\n--module 'circrna_discovery, mirna_prediction, differential_expression'\n```",
"default": "circrna_discovery"
},
"bsj_reads": {
"type": "integer",
"fa_icon": "fas fa-circle-notch",
"description": "Minimum number of required reads spanning circRNA back-splice junction for circRNA to be output by workflow.",
"help_text": "Filter low confidence circRNAs by removing circRNAs with read counts below a specified value. To disable, set the value to 0.",
"default": 2,
"minimum": 0
},
"tool_filter": {
"type": "integer",
"fa_icon": "fas fa-intersection",
"description": "Specify the minimum number of tools circRNAs must be called by to be output by the workflow.",
"help_text": "When multiple circRNA quantification tools have been provided to `--tool`, the user can set a filtering method whereby circRNAs are output if they have been called by at least *n* quantification tools.\n\nSetting `--tool_filter` to 0/1 is the same as taking the union, all circRNAs are included in the output.\n\nSetting `--tool_filter` to 2 will output circRNAs that have been called by at least 2 quantification tools and so on.\n\n> The integer provided to the parameter must be less than or equal to the number of quantification tools provided to `--tool`. ",
"default": 2,
"minimum": 0,
"maximum": 6
},
"save_quantification_intermediates" :{
"type": "boolean",
"fa_icon": "fas fa-save",
"description": "Save raw outputs from circRNA quantification?",
"default": true
},
"save_mirna_predictions": {
"type": "boolean",
"fa_icon": "fas fa-save",
"description": "Save raw miRanda, TargetScan prediction outputs?",
"default": true
}
}
},
"reference_genome_options": {
"title": "Reference genome options",
"type": "object",
"fa_icon": "fas fa-dna",
"description": "Reference genome options used in the analysis.",
"help_text": "`nf-core/circrna` will automatically download reference files if none are provided and generate genome index files based on the tools selected by the user.",
"properties": {
"fasta": {
"type": "string",
"fa_icon": "fas fa-font",
"description": "Path to FASTA genome file.",
"help_text": "If set to null, the parameter `--genome` must be supplied and the reference FASTA file will be automatically downloaded.\n\n```bash\n--fasta '/reference/GRCh38.fa'\n```",
"pattern": "\\.(fa|fasta)$"
},
"genome": {
"type": "string",
"fa_icon": "fas fa-clone",
"description": "iGenome version to use.",
"help_text": "Required if `--fasta`, `--gtf`, `--gene` are set to null."
},
"gtf": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to reference GTF file.",
"help_text": "If left empty, the parameter `--genome` must be supplied and the reference GTF file will be automatically downloaded.\n```bash\n--gtf \"/reference/GRCh38.gtf\"\n```\n\n*N.B:* The pipleine has been developed using reference files, UCSC/ENSEMBL files have not been tested.",
"pattern": "\\.gtf$"
},
"gene": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to custom annotation text file.",
"help_text": "If left empty, the parameter --genome must be supplied and the customised annotation text file will be automatically generated.\n\n```bash\n--gene \"/reference/GRCh38.txt\"\n```\n\n> NB: The gene annotation text file is generated using a combination of `gtfToGenePred` and perl commands for CIRCexplorer2 [compatability](https://github.com/YangLab/CIRCexplorer2/issues/43). The file cannot be downloaded and it is recommended to leave the parameter null unless re-running the pipeline.",
"pattern": "\\.txt$"
},
"igenomes_base": {
"type": "string",
"description": "Directory / URL base for iGenomes references.",
"default": "s3://ngi-igenomes/igenomes",
"fa_icon": "fas fa-cloud-download-alt",
"hidden": false
},
"igenomes_ignore": {
"type": "boolean",
"description": "Do not load the iGenomes reference config.",
"fa_icon": "fas fa-ban",
"hidden": false,
"help_text": "Do not load `igenomes.config` when running the pipeline. You may choose this option if you observe clashes between custom parameters and those supplied in `igenomes.config`."
},
"samtools": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to SAMtools index file.",
"help_text": "Automatically generated if left set to null. \n\nWhen re-running the pipeline, provide the absolute path to the SAMtools index file e.g:\n\n```bash\n--fasta_fai '/data/results/circrna_discovery/index/GRCh38.fa.fai'\n```",
"pattern": "/.fai$"
},
"bowtie": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to Bowtie index files.",
"help_text": "Automatically generated if set to null.\n\nWhen re-running the pipeline, provide the absolute path to Bowtie indices directory e.g:\n\n```bash\n--bowtie_index \"/data/results/circrna_discovery/index/bowtie\"\n```"
},
"bowtie2": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to Bowtie2 index files.",
"help_text": "Automatically generated if left empty. \n\nWhen re-running the pipeline, provide the absolute path to the Bowtie2 indices directory e.g:\n\n```bash\n--bowtie2_index \"/data/results/circrna_discovery/index/bowtie2\"\n```"
},
"bwa": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to BWA index directory.",
"help_text": "Automatically generated if left empty.\n\nWhen re-running the pipeline, provide the absolute path to BWA indices directory e.g:\n\n```bash\n--bwa_index \"/data/results/circrna_discovery/index/bwa\"\n```"
},
"hisat2": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to HISAT2 index directory.",
"help_text": "Automatically generated if left empty. \n\nWhen re-running the pipeline, provide the absolute path to HISAT2 indices directory e.g:\n\n```bash\n--hisat2_index \"/data/results/circrna_discovery/index/hisat2\"\n```"
},
"save_reference": {
"type": "boolean",
"default": true,
"description": "Save generated reference genome files to results.",
"help_text": "Saving generated references means that you can use them for future pipeline runs, reducing processing times.",
"fa_icon": "fas fa-save"
},
"segemehl":{
"type": "string",
"fa_icon": "fa-address-book",
"description": "Path to Segemehl Index file"
},
"star": {
"type": "string",
"fa_icon": "fas fa-address-book",
"description": "Path to STAR index directory.",
"help_text": "Automatically generated if left empty.\n\nWhen re-running the pipeline, provide the absolute path to STAR indices directory e.g:\n\n```bash\n--star_index \"/data/results/circrna_discovery/index/STAR\"\n```"
}
}
},
"read_trimming_and_adapter_removal": {
"title": "Read trimming & adapter removal",
"type": "object",
"fa_icon": "fas fa-cut",
"description": "Parameters for BBDUK",
"help_text": "BBDUK read filtering is deployed when `--trim_fastq true`. The user can choose to implement one or a combination of the following 3 operations performed by BBDUK:\n\n1. Adapter removal. Must specify values for `--adapters`, `--k`, `--ktrim` & optionally `--hdist` \n2. Quality trimming. Must specify values for `--trimq` & `--qtrim` \n3. Read length filtering. Must provide value for `--minlen`",
"properties": {
"trim_fastq": {
"type": "boolean",
"fa_icon": "fas fa-fast-forward",
"description": "Trim Fastq?",
"help_text": "If set to true, the BBDUK process is executed. If false, the BBDUK process is skipped and raw reads will be supplied to circRNA quantification tools.",
"default": false
},
"adapters": {
"type": "string",
"fa_icon": "fas fa-file-alt",
"description": "Reference adapter file supplied to BBDUK",
"deafult": "adapters.fa",
"help_text": "BBDUK provides Illumina Truseq and Nextera adapters sequences in FASTA format suitable for most adapter removal situations. The adapters.fa file is located at \"${projectDir}/bin/adapters.fa\" should the user wish to modify the file. \n\nMake sure to specify the absolute path to the 'adapters.fa' file if modified.",
"default": "${projectDir}/bin/adapters.fa",
"pattern": "\\.(fa|fasta)$"
},
"k": {
"type": "integer",
"fa_icon": "fab fa-kickstarter",
"description": "Specifies K-mer size to use for adapter removal",
"default": 12,
"help_text": "'k' specifies the kmer size to use (must be at most the length of the adapters). For example, `--k 32` removes all reads that have a 32 kmer match with the adapter sequences provided."
},
"ktrim": {
"type": "string",
"fa_icon": "fas fa-exchange-alt",
"description": "Which end of reads to perform kmer trimming",
"default": "r",
"help_text": "Specify which end of the reads to perform kmer trimming on. Options are 'r', 'l', and 'f' (right, left, don't trim).",
"enum": [
"r",
"l",
"f"
]
},
"hdist": {
"type": "integer",
"fa_icon": "fas fa-ruler-horizontal",
"description": "Maximum Hamming distance for reference kmers",
"default": 1,
"help_text": "Specify the number of mismatches allowed when aligning kmers to reference adapters. This paramter is optional for adapter trimming.\n\n> Warning: setting `--hdist` to values higher than 1 will result in high memory usage."
},
"trimq": {
"type": "integer",
"fa_icon": "fas fa-award",
"description": "Trimming performed on regions in reads with an average Phred score below specified value",
"default": 20,
"help_text": "> NB: This action is performed after adapter removal if specified."
},
"qtrim": {
"type": "string",
"fa_icon": "fas fa-exchange-alt",
"description": "Which end of reads to perform quality trimming",
"default": "r",
"help_text": "Used in conjunction with `--trimq`, performs quality trimming on the specified end of reads. Options are 'r', 'l' and 'rl' (right, left, both).",
"enum": [
"r",
"l",
"rl"
]
},
"minlen": {
"type": "integer",
"fa_icon": "fas fa-ruler-horizontal",
"description": "Remove reads below length *n*",
"default": 30
},
"save_trimmed":{
"type": "boolean",
"fa_icon": "fas fa-save",
"description": "Save trimmed FASTQ files?",
"default": false
}
}
},
"star_general": {
"title": "STAR",
"type": "object",
"description": "Define parameters for STAR 2 pass mode",
"help_text": "STAR 2 pass mode is performed to identify novel splice sites in *all* samples. STAR takes the novel splice sites into account when performig re-alignment during the second pass. STAR is used for CIRCexplorer2, circRNA_finder & DCC",
"properties": {
"alignIntronMax": {
"type": "integer",
"default": 1000000,
"description": "The maximum intron length is set to 1,000,000",
"fa_icon": "fas fa-sliders-h"
},
"alignIntronMin": {
"type": "integer",
"default": 20,
"description": "The minimum intron length is set to 20. If the genomic gap is smaller than this value, it is considered as a deletion",
"fa_icon": "fas fa-sliders-h"
},
"alignMatesGapMax": {
"type": "integer",
"default": 1000000,
"description": "The maximum genomic distance between mates is 1,000,000",
"fa_icon": "fas fa-sliders-h"
},
"alignSJDBoverhangMin": {
"type": "integer",
"default": 1,
"description": "The number of minimum overhang for annotated junctions",
"fa_icon": "fas fa-sliders-h"
},
"alignSJoverhangMin": {
"type": "integer",
"default": 1,
"description": "The number of minimum overhang for unannotated junctions",
"fa_icon": "fas fa-sliders-h"
},
"alignSoftClipAtReferenceEnds": {
"type": "string",
"default": "No",
"description": "Allow the soft-clipping of the alignments past the end of chromosomes",
"fa_icon": "fas fa-sliders-h"
},
"alignTranscriptsPerReadNmax": {
"type": "integer",
"default": 10000,
"description": "Max number of different alignments per read to consider",
"fa_icon": "fas fa-sliders-h"
},
"chimJunctionOverhangMin": {
"type": "integer",
"default": 15,
"description": "Minimum overhang for a chimeric junction",
"fa_icon": "fas fa-sliders-h"
},
"chimScoreMin": {
"type": "integer",
"default": 15,
"description": "Minimum total (summed) score of the chimeric segments",
"fa_icon": "fas fa-sliders-h"
},
"chimScoreSeparation": {
"type": "integer",
"default": 15,
"description": "Minimum difference (separation) between the best chimeric score and the next one",
"fa_icon": "fas fa-sliders-h"
},
"chimSegmentMin": {
"type": "integer",
"default": 10,
"description": " Minimum length of chimeric segment length, if == 0, no chimeric output",
"fa_icon": "fas fa-sliders-h",
"help_text": "Do not set to 0, this will disable outputs compatible with circRNA quantification."
},
"genomeLoad": {
"type": "string",
"default": "NoSharedMemory",
"description": "Mode of shared memory usage for the genome files",
"fa_icon": "fas fa-sliders-h",
"help_text": "Users can select a variety of options depending on their resource configuration:\n\n1. `LoadAndKeep`: load genome into shared and keep it in memory after run\n2. `LoadAndRemove`: load genome into shared but remove it after run\n3. `LoadAndExit`: load genome into shared memory and exit, keeping the genome in memory for future runs\n4. `Remove`: do not map anything, just remove loaded genome from memory\n5. `NoSharedMemory`: do not use shared memory, each job will have its own private copy of the genome",
"enum": [
"LoadAndKeep",
"LoadAndRemove",
"LoadAndExit",
"Remove",
"NoSharedMemory"
]
},
"limitSjdbInsertNsj": {
"type": "integer",
"default": 1000000,
"description": "Maximum number of junction to be inserted to the genome on the fly at the mapping stage, including those from annotations and those detected in the 1st step of the 2-pass run",
"fa_icon": "fas fa-sliders-h"
},
"outFilterMatchNminOverLread": {
"type": "number",
"default": 0.33,
"description": "Alignment output if ratio of matched bases relative to read length is equal to or higher than this value",
"fa_icon": "fas fa-sliders-h",
"help_text": "Consider 75bp paired end reads with sum matched bases of 120bp. Matched bp is summmed over combined read length (120/150 = 0.8). Simply put, lowering this ratio reduces the number of required matches in reads.\n\n`outFilterMatchNminOverLread` is preferred over `outFilterMatchNmin` as it considers read length, suitable for experiments with varying read length."
},
"outFilterMismatchNoverLmax": {
"type": "number",
"default": 0.05,
"description": "Alignment output if ratio of mismatched bases relative to **mapped** read length is lower than value",
"fa_icon": "fas fa-sliders-h",
"help_text": "For example, for reads <20b no mismatches are allowed (1/19 = 0.0526), 20-39b: 1 mismatch, 40-59b 2 mismatches and so on. Simply put, increasing this value will allow for more mismatches in the mapped reads.\n\n`outFilterMismatchNoverLmax` is preferred over `outFilterMismatchNmax` as it considers the mapped read length, suitable for experiments with varying read length."
},
"outFilterMultimapNmax": {
"type": "integer",
"default": 20,
"description": "Max number of multiple alignments allowed for a read: if exceeded, the read is considered unmapped",
"fa_icon": "fas fa-sliders-h"
},
"outFilterMultimapScoreRange": {
"type": "integer",
"default": 1,
"description": " Score range below the maximum score for multimapping alignments",
"fa_icon": "fas fa-sliders-h"
},
"outFilterScoreMinOverLread": {
"type": "number",
"default": 0.33,
"description": "Alignment will be output only if its score relative to read length is higher than or equal to this value",
"fa_icon": "fas fa-sliders-h"
},
"outSJfilterOverhangMin": {
"type": "string",
"default": "15 15 15 15",
"description": "Minimum overhang length for novel splice junctions",
"fa_icon": "fas fa-sliders-h",
"help_text": "4 integers: minimum overhang length for splice junctions on both sides for:\n1. non-canonical motifs\n2. GT/AG and CT/AC motif\n3. GC/AG and CT/GC motif\n4. AT/AC and GT/AT motif\n\n-1 means no output for that motif"
},
"sjdbOverhang": {
"type": "integer",
"default": 100,
"description": "Option to specify the length of the donor/acceptor sequence on each side of the junctions used in constructing the splice junctions database",
"fa_icon": "fas fa-sliders-h",
"help_text": "By default the option is set to 100. However, we recommend setting a value depending on the read length: read/mate length - 1"
},
"sjdbScore": {
"type": "integer",
"default": 2,
"description": "Alignment score for alignmets that cross database junctions",
"fa_icon": "fas fa-sliders-h"
},
"winAnchorMultimapNmax": {
"type": "integer",
"default": 999,
"description": "The maximum number of loci anchors that are allowed to map. By default, the pipeline uses a large number 999 to switch this filter off.",
"fa_icon": "fas fa-sliders-h"
}
},
"fa_icon": "fas fa-star"
},
"generic_options": {
"title": "Generic options",
"type": "object",
"fa_icon": "fas fa-file-import",
"description": "Less common options for the pipeline, typically set in a config file.",
"help_text": "These options are common to all nf-core pipelines and allow you to customise some of the core preferences for how the pipeline runs.\n\nTypically these options would be set in a Nextflow config file loaded for all pipeline runs, such as `~/.nextflow/config`.",
"properties": {
"help": {
"type": "boolean",
"description": "Display help text.",
"hidden": true,
"fa_icon": "fas fa-question-circle"
},
"publish_dir_mode": {
"type": "string",
"default": "copy",
"hidden": true,
"description": "Method used to save pipeline results to output directory.",
"help_text": "The Nextflow `publishDir` option specifies which intermediate files should be saved to the output directory. This option tells the pipeline what method should be used to move these files. See [Nextflow docs](https://www.nextflow.io/docs/latest/process.html#publishdir) for details.",
"fa_icon": "fas fa-copy",
"enum": [
"symlink",
"rellink",
"link",
"copy",
"copyNoFollow",
"move"
]
},
"validate_params": {
"type": "boolean",
"description": "Boolean whether to validate parameters against the schema at runtime",
"default": true,
"fa_icon": "fas fa-check-square",
"hidden": true
},
"name": {
"type": "string",
"description": "Workflow name.",
"fa_icon": "fas fa-fingerprint",
"hidden": true,
"help_text": "A custom name for the pipeline run. Unlike the core nextflow `-name` option with one hyphen this parameter can be reused multiple times, for example if using `-resume`. Passed through to steps such as MultiQC and used for things like report filenames and titles."
},
"email": {
"type": "string",
"description": "Email address for completion summary.",
"fa_icon": "fas fa-envelope",
"hidden": true,
"help_text": "An email address to send a summary email to when the pipeline is completed.",
"pattern": "^([a-zA-Z0-9_\\-\\.]+)@([a-zA-Z0-9_\\-\\.]+)\\.([a-zA-Z]{2,5})$"
},
"email_on_fail": {
"type": "string",
"description": "Email address for completion summary, only when pipeline fails.",
"fa_icon": "fas fa-exclamation-triangle",
"pattern": "^([a-zA-Z0-9_\\-\\.]+)@([a-zA-Z0-9_\\-\\.]+)\\.([a-zA-Z]{2,5})$",
"hidden": true,
"help_text": "This works exactly as with `--email`, except emails are only sent if the workflow is not successful."
},
"plaintext_email": {
"type": "boolean",
"description": "Send plain-text email instead of HTML.",
"fa_icon": "fas fa-remove-format",
"hidden": true,
"help_text": "Set to receive plain-text e-mails instead of HTML formatted."
},
"max_multiqc_email_size": {
"type": "string",
"description": "File size limit when attaching MultiQC reports to summary emails.",
"default": "25.MB",
"fa_icon": "fas fa-file-upload",
"hidden": true,
"help_text": "If file generated by pipeline exceeds the threshold, it will not be attached."
},
"monochrome_logs": {
"type": "boolean",
"description": "Do not use coloured log outputs.",
"fa_icon": "fas fa-palette",
"hidden": true,
"help_text": "Set to disable colourful command line output and live life in monochrome."
},
"multiqc_config": {
"type": "string",
"description": "Custom config file to supply to MultiQC.",
"fa_icon": "fas fa-cog",
"hidden": true
},
"tracedir": {
"type": "string",
"description": "Directory to keep pipeline Nextflow logs and reports.",
"default": "${params.outdir}/pipeline_info",
"fa_icon": "fas fa-cogs",
"hidden": true
},
"show_hidden_params": {
"type": "boolean",
"fa_icon": "far fa-eye-slash",
"description": "Show all params when using `--help`",
"hidden": true,
"help_text": "By default, parameters set as _hidden_ in the schema are not shown on the command line when a user runs with `--help`. Specifying this option will tell the pipeline to show all parameters."
}
}
},
"max_job_request_options": {
"title": "Max job request options",
"type": "object",
"fa_icon": "fab fa-acquisitions-incorporated",
"description": "Set the top limit for requested resources for any single job.",
"help_text": "If you are running on a smaller system, a pipeline step requesting more resources than are available may cause the Nextflow to stop the run with an error. These options allow you to cap the maximum resources requested by any single job so that the pipeline will run on your system.\n\nNote that you can not _increase_ the resources requested by any job using these options. For that you will need your own configuration file. See [the nf-core website](https://nf-co.re/usage/configuration) for details.",
"properties": {
"max_cpus": {
"type": "integer",
"description": "Maximum number of CPUs that can be requested for any single job.",
"default": 16,
"fa_icon": "fas fa-microchip",
"help_text": "Use to set an upper-limit for the CPU requirement for each process. Should be an integer e.g. `--max_cpus 1`"
},
"max_memory": {
"type": "string",
"description": "Maximum amount of memory that can be requested for any single job.",
"default": "128.GB",
"fa_icon": "fas fa-memory",
"pattern": "^\\d+(\\.\\d+)?\\.?\\s*(K|M|G|T)?B$",
"hidden": true,
"help_text": "Use to set an upper-limit for the memory requirement for each process. Should be a string in the format integer-unit e.g. `--max_memory '8.GB'`"
},
"max_time": {
"type": "string",
"description": "Maximum amount of time that can be requested for any single job.",
"default": "240.h",
"fa_icon": "far fa-clock",
"pattern": "^(\\d+\\.?\\s*(s|m|h|day)\\s*)+$",
"hidden": true,
"help_text": "Use to set an upper-limit for the time requirement for each process. Should be a string in the format integer-unit e.g. `--max_time '2.h'`"
}
}
},
"institutional_config_options": {
"title": "Institutional config options",
"type": "object",
"fa_icon": "fas fa-university",
"description": "Parameters used to describe centralised config profiles. These should not be edited.",
"help_text": "The centralised nf-core configuration profiles use a handful of pipeline parameters to describe themselves. This information is then printed to the Nextflow log when you run a pipeline. You should not need to change these values when you run a pipeline.",
"properties": {
"custom_config_version": {
"type": "string",
"description": "Git commit id for Institutional configs.",
"default": "master",
"hidden": true,
"fa_icon": "fas fa-users-cog",
"help_text": "Provide git commit id for custom Institutional configs hosted at `nf-core/configs`. This was implemented for reproducibility purposes. Default: `master`.\n\n```bash\n## Download and use config file with following git commit id\n--custom_config_version d52db660777c4bf36546ddb188ec530c3ada1b96\n```"
},
"custom_config_base": {
"type": "string",
"description": "Base directory for Institutional configs.",
"default": "https://raw.githubusercontent.com/nf-core/configs/master",
"hidden": true,
"help_text": "If you're running offline, nextflow will not be able to fetch the institutional config files from the internet. If you don't need them, then this is not a problem. If you do need them, you should download the files from the repo and tell nextflow where to find them with the `custom_config_base` option. For example:\n\n```bash\n## Download and unzip the config files\ncd /path/to/my/configs\nwget https://github.com/nf-core/configs/archive/master.zip\nunzip master.zip\n\n## Run the pipeline\ncd /path/to/my/data\nnextflow run /path/to/pipeline/ --custom_config_base /path/to/my/configs/configs-master/\n```\n\n> Note that the nf-core/tools helper package has a `download` command to download all required pipeline files + singularity containers + institutional configs in one go for you, to make this process easier.",
"fa_icon": "fas fa-users-cog"
},
"hostnames": {
"type": "string",
"description": "Institutional configs hostname.",
"hidden": true,
"fa_icon": "fas fa-users-cog"
},
"config_profile_name": {
"type": "string",
"description": "Institutional config name.",
"hidden": true,
"fa_icon": "fas fa-users-cog"
},
"config_profile_description": {
"type": "string",
"description": "Institutional config description.",
"hidden": true,
"fa_icon": "fas fa-users-cog"
},
"config_profile_contact": {
"type": "string",
"description": "Institutional config contact information.",
"hidden": true,
"fa_icon": "fas fa-users-cog"
},
"config_profile_url": {
"type": "string",
"description": "Institutional config URL link.",
"hidden": true,
"fa_icon": "fas fa-users-cog"
}
}
}
},
"allOf": [
{
"$ref": "#/definitions/input_output_options"
},
{
"$ref": "#/definitions/pipeline_options"
},
{
"$ref": "#/definitions/reference_genome_options"
},
{
"$ref": "#/definitions/read_trimming_and_adapter_removal"
},
{
"$ref": "#/definitions/star_general"
},
{
"$ref": "#/definitions/generic_options"
},
{
"$ref": "#/definitions/max_job_request_options"
},
{
"$ref": "#/definitions/institutional_config_options"
}
]
}