Skip to content

Commit 49c6e05

Browse files
nextstrain-bot authored and rneher committed
chore: rebuild [skip ci]
1 parent ddfbe57 commit 49c6e05

51 files changed

Lines changed: 158326 additions & 85128 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

data/community/collection.json

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,12 @@
3838
"community/v-gen-lab/chikV/genotypes",
3939
"community/masphl-bioinformatics/hav/vp1-2b-junction",
4040
"community/masphl-bioinformatics/hav/whole-genome",
41-
"community/itps/zikav"
41+
"community/itps/zikav",
42+
"community/itps/orov/L/refseq",
43+
"community/itps/orov/M/refseq",
44+
"community/itps/orov/M/tefe",
45+
"community/itps/orov/L/tefe",
46+
"community/itps/orov/S/tefe",
47+
"community/itps/orov/S/refseq"
4248
]
4349
}
Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
## Unreleased
2+
3+
Initial release of an Oropouche virus (OROV) dataset for segment L, based on the NCBI RefSeq reference genome.
4+
5+
Read more about Nextclade datasets in the documentation: https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html
Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
# Nextclade Dataset for "OROV" L segment based on RefSeq reference genome
2+
3+
## Dataset Attributes
4+
5+
| Attribute | Value |
6+
| -------------------- | ---------------------------------------- |
7+
| Name | orov/L/refseq |
8+
| RefName | Oropouche virus segment L |
9+
| RefAccession | NC_005776.1 |
10+
11+
## Scope of This Dataset
12+
13+
This dataset aims to enable quality control of segment L of Oropouche virus, using the NCBI RefSeq genome as the reference.
14+
15+
16+
The source code is available at [InstitutoTodosPelaSaude/nextclade-datasets-workflows](https://github.com/InstitutoTodosPelaSaude/nextclade-datasets-workflows/tree/main/orov).
17+
18+
For bugs, please open an [issue](https://github.com/InstitutoTodosPelaSaude/nextclade-datasets-workflows/issues).
19+
20+
Read more about Nextclade datasets in the Nextclade documentation: [Nextclade Datasets](https://docs.nextstrain.org/projects/nextclade/en/stable/user/datasets.html).
1.32 MB
Binary file not shown.
Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
##gff-version 3
2+
#!gff-spec-version 1.21
3+
#!processor NCBI annotwriter
4+
##sequence-region NC_005776.1 1 6846
5+
##species https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=118655
6+
NC_005776.1 RefSeq region 1 6846 . + . ID=NC_005776.1:1..6846;Dbxref=taxon:118655;Name=L;gbkey=Src;genome=genomic;mol_type=genomic RNA;segment=L
7+
NC_005776.1 GenBank gene 44 6796 . + . gene_name=L
Lines changed: 102 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,102 @@
1+
{
2+
"$schema": "https://raw.githubusercontent.com/nextstrain/nextclade/refs/heads/release/packages/nextclade-schemas/input-pathogen-json.schema.json",
3+
"alignmentParams": {
4+
"retryReverseComplement": true,
5+
"alignmentPreset": "high-diversity"
6+
},
7+
"attributes": {
8+
"name": "orov/L/refseq",
9+
"reference accession": "NC_005776.1",
10+
"reference name": "Oropouche virus, L segment"
11+
},
12+
"compatibility": {
13+
"cli": "3.0.0-alpha.0",
14+
"web": "3.0.0-alpha.0"
15+
},
16+
"placementMaskRanges": [
17+
{
18+
"begin": 0,
19+
"end": 43
20+
},
21+
{
22+
"begin": 6796,
23+
"end": 6846
24+
}
25+
],
26+
"deprecated": false,
27+
"enabled": true,
28+
"experimental": true,
29+
"files": {
30+
"changelog": "CHANGELOG.md",
31+
"examples": "sequences.fasta",
32+
"genomeAnnotation": "genome_annotation.gff3",
33+
"pathogenJson": "pathogen.json",
34+
"readme": "README.md",
35+
"reference": "reference.fasta",
36+
"treeJson": "tree.json"
37+
},
38+
"meta": {
39+
"bugs": "https://github.com/InstitutoTodosPelaSaude/nextclade-datasets-workflows/issues",
40+
"source code": "https://github.com/InstitutoTodosPelaSaude/nextclade-datasets-workflows/tree/main/orov"
41+
},
42+
"qc": {
43+
"frameShifts": {
44+
"enabled": true,
45+
"ignoredFrameShifts": [
46+
{
47+
"codonRange": {
48+
"begin": 788,
49+
"end": 792
50+
},
51+
"cdsName": "L"
52+
},
53+
{
54+
"codonRange": {
55+
"begin": 797,
56+
"end": 800
57+
},
58+
"cdsName": "L"
59+
},
60+
{
61+
"codonRange": {
62+
"begin": 846,
63+
"end": 855
64+
},
65+
"cdsName": "L"
66+
}
67+
]
68+
},
69+
"missingData": {
70+
"enabled": true,
71+
"missingDataThreshold": 1369,
72+
"scoreBias": 95
73+
},
74+
"mixedSites": {
75+
"enabled": true,
76+
"mixedSitesThreshold": 7
77+
},
78+
"privateMutations": {
79+
"cutoff": 30,
80+
"enabled": true,
81+
"typical": 10,
82+
"weightLabeledSubstitutions": 2,
83+
"weightReversionSubstitutions": 1,
84+
"weightUnlabeledSubstitutions": 1
85+
},
86+
"snpClusters": {
87+
"enabled": false
88+
},
89+
"stopCodons": {
90+
"enabled": true
91+
}
92+
},
93+
"schemaVersion": "3.0.0",
94+
"version": {
95+
"tag": "unreleased",
96+
"compatibility": {
97+
"cli": "3.0.0-alpha.0",
98+
"web": "3.0.0-alpha.0"
99+
}
100+
},
101+
"defaultCds": "L"
102+
}
Lines changed: 116 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,116 @@
1+
>NC_005776.1 Oropouche virus segment L, complete genome
2+
AGTAGTGTGCTCCTATTCCGAAACAAACAAAAACAATCTCAAAATGTCACAACTGTTGCT
3+
CAACCAATATCGGAATAGGATATTGCACTGCCGTGAACCTGAGATAGCAAAGGATATATG
4+
GCGAGATCTATTAAATGATCGACACAATTACTTTTCTCGGGAATTTTGCAGAGCTGCAAA
5+
TCTTGAGTACAGAAATGATGTTCCTGCTGAGGATATTTGTGCTGAAGTTCTTGATGGTTA
6+
TAAAGCAAGGAAAGTTCGCTTTTGTACACCTGATAATTACTTACTACATGATGGAAAGAT
7+
GTATATAATAGACTTCAAAGTGTCTGTAGACGACCGATCTTCTAGAATCACAAGGGAGAA
8+
ATATAATGAGATTTTTGGAGAGGTATTCAATCCAGAAGGTGTAGATTTTGAAATTGTTAT
9+
TATTAGATTAGATCCTTCAAATATGACGATACATGTGGACTCTCGAGATTTCGTGAATAC
10+
AATTGGGCCGATTACATTAAACATTAGTATGCAATGGTTTTTTGATATGAAAGACTTCTT
11+
GTTCGGGAAATTTCGGGATGATGATAAATTCCATGCTATAATAAGTCAAGGAGAATTCAC
12+
AATGACATTGCCATGGATTGAAGAAGACACCCCAGAATTGCTTACTCATCCTATATACAA
13+
TGAATTCATGAGTTCAATGCCAGAGGCAGAACAGGCCCTATTCAAGGAAGCATTGGAATT
14+
CAAATCATTTGGGGCAGAAAAATGGAATATCTTTTTGAAGGGGGTGATGTCAAAGTATGG
15+
TGAATATTATAAAGAATTTACTAAAGGACATGCTCATTCTATATTTCTGACAACAGGGGA
16+
CTACCCCAAGCCAGACAAAGACCAAATTTCAGCAGGTTGGAGAGAAATGGTAAACAGAGT
17+
AAGCTCTGAACGTGACATGTCAAATGACATAAATCAGGAAAAACCAAGCATGCATTTTAT
18+
ATGGGCAAAGAATGATTCAAATAGCAACAATAATATACAAAAGCTAATCAAACTATCTAA
19+
ATCACTGCAAGCTATGAGCGGGACAGGGAGCTATGTAAATGCTTTCAAGTCATTAGGGAG
20+
ATTAATGGATATATCATCAGATGTTAAAAAATATGAATCATTTTGTGGGAAATTGAAATC
21+
TCTGGCAAGGTCTAGTATAAAAAAACTTGACAGGAAAATAGAGCCAATACAAATTGGGAC
22+
TGCAACTGTCTTATGGGAACAGCAATTTAAACTAGATACAGATGTTATAAAAAGAGAAGA
23+
CAGAATACATTTAATGAAAGATTATCTTGGGATCGGTAAGCACAAATCATTTTCAAAGAA
24+
ATTAAACAACGACATAAATACTGATAAGCCTAAAATATTAAATTTCAACAATGATGATAT
25+
AGTCAGGAAATGCAAAGATAAATATAATCAAGTCATACATAACCTATCCCAAATCAATGA
26+
ATTAGATAAGATTGGAAACTACCTAGAGCACTTTTCAGCTAAAATTAGTGCCTGCAGTGT
27+
AGAAATGTGGGATTTTATATATAATACAACCAAAACTAAATACTGGCAATGCATCAATGA
28+
CTATTCCACCCTAATGAAAAACATGTTAGCTGTCTCTCAATATAATAGACACAATACGTT
29+
TAGAATTGTCTCATGTGCAAACAATAATGTATTTGGTCTAGTAATGCCAAGCTCAGATAT
30+
AAAGACAAAAAAAGCAACTTTAGTCTATGCAATAATGGCTCTCCATAATGAGGAGGCAGA
31+
AATAGCAGAACTTGGCTCACTCTACTCAACTTTTAAGACAGCAACAGGATATATTTCAAT
32+
ATCAAAGGCTTTTAGGCTGGATAAAGAAAGATGCCAACGCATAGTATCCTCTCCAGGCTT
33+
GTTCCTCATGACAAGCTGCCTATTATTCAACGGTAACAAGAGTTTAGAATTTGATAAATT
34+
ACTAGGATTTTCATTTTTTACGTCAATATCAATTACGAAAGCTATGCTCTCCCTTACTGA
35+
GCCTTCACGTTATATGATCATGAACTCGTTAGCAGTTTCCAGCCATGTAAGAGAGTATAT
36+
ATCTGAAAAATTCTCCCCTTATACAAAAACATCATTTTCTGTGGTAATGACAGACTTAAT
37+
CAAGAAGGGTTGCTATTCAGCATATGAACAGAGAAAAAAAGTACAAATAAGAGACATAAA
38+
ATTAACAGATTATGATATAACACAAAAGGGAGTGGATTCCAAAAGAGATCTTAAATCTAT
39+
TTGGTTCCCAGGAAAGGTAAACCTGAAAGAATATTTAAACCAAATTTATCTACCATTTTA
40+
TTTTAACTCTAAAGGATTACATGAAAAACATCATGTCTTGATAGATTTGGCTAAAACAGT
41+
ACTAGAAATCGAAAAAGAGCAAAGGGAGTCATTACCTGAGCCATGGTCAGAGATACCTGC
42+
TAAGCGACTGTCACTTAATGTTTTAATTTACTCATTGCAGGAACTGAATTTAGATACTTC
43+
AAGACATAATTTTGTAAGAAGCCGGGTGGAAAACGCAAATAATTTCAACAGATCTATAAC
44+
GACAATATCTACTTTTACCAGCTCAAAATCATGCATTAAGATTGGTGATTTTGAAGAAGA
45+
AAAAAGAGAAAAACTAAGAATGATACAAAAGAAACTTGCAAAGGATATTTCTAAATTAAC
46+
CATAGCCAACCCAGCATTCTTAGATGAGATCACAAACGAACATGAGATAAGGCATTCAAC
47+
TTATGAGGACTTAAAACAATCTATCCCAGATTACACAGATTATATGTCTGTGAAAGTTTT
48+
TGACAGATTGTACGAGAAGATTACTACCAATGAAATAAATGATAAGGAAACAGTCAAGCT
49+
GATTCTAGAGACCATGAAAAAACATAAAATATTTCATTTTGGATTCTTCAATAAAGGACA
50+
AAAAACAGCCAAAGATAGAGAAATATTTTTAGGTGAATTTGAAGCAAAAATGTGTCTGTA
51+
CCTTGTCGAAAGAATAGCTAAAGAGAGGTGCAAATTAAACCCTGAAGAAATGATAAGTGA
52+
ACCAGGCGACTCGAAACTAAGGGTATTAGAGAAGCAATCAGAAGACGAAATCAGGTATAT
53+
TAGCAATACAATAAAGACATTAGGGAATGCCATAGAGAACTTGCAATCTGGATCTTTAAA
54+
TTGGGCAGATATATGCGAAAACAAAGCAAGAGGACTTAAGATAGAAATAAATGCTGATAT
55+
GTCCAAATGGAGTGCCCAAGATGTACTTTTTAAATATTTTTGGTTGATAGTGCTTGATCC
56+
CATCTTATATCCTGCTGAGAGGAAAAGGATAATTTATTTCCTCTGTAATTATATGCAGAA
57+
AAGGCTTATAATGCCCGATGAATTGCTCACTACTATATTGGATCAAAGAGTTCCTTATTC
58+
AAATGACATAATTGGATTAATGACAAACAATTATAGGTCTAATACAGTAGAAATAAAGCG
59+
TAACTGGCTTCAAGGCAACTTAAATTATACAAGCAGTTACTTACACAGCTGTAGTATGTC
60+
TGTGTACAAAGATATAATAAGAGAAGCAGCAATATTATTAGAAGGAGAAGCCCTTGTGAA
61+
CTCAATGGTACATTCTGATGATAATCAAACATCTATATGTATGGTGCAGAATAAATTACC
62+
AGATGACAATATAATTGAATTTTGCATTAAGATATTCGAGAAGATATGCTTAACTTTTGG
63+
CAATCAGGCAAATATGAAGAAGACATATCTAACTAACTTCATCAAAGAGTTTGTTTCTTT
64+
ATTTAATATACATGGAGAACCATTTTCTATATATGGGAGATTTCTACTCACAGCAGTAGG
65+
AGACTGTGCCTATCTAGGGCCTTATGAAGATTTAGCAAGTAGGCTATCTGCAACACAAAC
66+
TGCTATAAAGCATGGTTGCCCACCATCACTTGCATGGGTATCTATCGCTCTAAATCACTG
67+
GATAACCCACACTACATATAATATGTTGCCTGGCCAAAATAATGACCCGTTACCATTCTT
68+
CCCTACTAACAATAGAAGTGAAATACCAGTAGAGATGTGCGGAATACTAGAAAGTGATTT
69+
ATCAACAATTGCACTAACTGGTTTAGAAGCAGGGAATGTCACGTTTCTAACAAATATAGC
70+
AAGGAAGTTATCATCCCCAATCTTACAAAGAGAAAGTATTCAAGATCAATACAATTCTAT
71+
AGAAAAGTGGGATCTGAGCAAATTATCACAGATCGACATTCTAAGGCTTAAAATGCTCAG
72+
GTATATATCTCTTGATAGTTCAGTCACATCTGATGATGGTATGGGGGAGACTAGTGAAAT
73+
GAGATCTCGATCACTTTTAACACCTCGTAAATTCACAACAAGTGGGTCACTTAATAGGTT
74+
GAAATCATATAAAGACTTTCAAGATATAATAGCAGATGAGGACAAGACAAACGAACTATT
75+
TGAGAATTTCATTAGACACCCAGAGTTACTGGTTACAAAAGGCGAAACATTTGAAGAATT
76+
TGTTAATACGATATTATTTAGGTACAATTCAAAGAAATTCAAAGAATCTTTGTCAATACA
77+
AAACCCAGCACAGCTTTTTATTGAGCAAATATTATTTTCCAATAAACCAGTAATTGACTA
78+
CACTAGCATACATGACAAGATTTTTGGATTACAAGACATGCCAGGAATTGAAGAACTAGA
79+
TACAATTATAGGTCGCAAAACATTTGTTGAGAGTTATGTTCAAATCGTAGATGACTTAAG
80+
CAATTTAACATTGGATATAAACGATGTCAAGACTATATTTGCCTTTTGTCTTATGAATGA
81+
CCCACTACTGATCACATCTGCTAACAATATAATAATGTCTGTTAAGGGACATAGTCAAGA
82+
AAGAATAGGTCAATCAGCATGCAAAATGCCAGAGGTCCGAAGTCTAAAACTCATACATTA
83+
TTCACCAGCAGTTGTTTTGAGAGCCTATGTGAGAGGGCCAACAAATGTACCGAATGTAGA
84+
TATAGATGAACTTGCAAGGGATCTATCTCATTTAGAAGACTTCATACAAAGTACAAAACT
85+
CAGAGAAAATATGAGAGAGAGAATAGAAATAAATGAGAAGCGGCACTTAGGAAGGGATTT
86+
CAAATTTGAAATCAAAGAACTAACTAGATTTTACCAAGTGTGTTATGATTACATAAAGTC
87+
TACAGAACATAAAGTCAAGGTATTCATATTGCCATACAAAGTTTTCACATCAATAGAATT
88+
CTGCGGGGCACTGACAGGTAACTTGATAAATGACAAATTATGGTACATAACGCATTATCT
89+
GAAAAATATAGTGTCTACTACACATAAGGCACAAATTTCTTCTTCACCTGAATTGGAATT
90+
GCAAATTGCTGATGAGGCACTAAGACTAGTAGCACATTTTGCTGATACTTTCTTGGCATC
91+
AGAATCAAGAATACAATTTCTGAAGAAAATTATTGAAGAATTCACATACAAAGGGATACC
92+
TGTAAAACATTTATACTCAAAAATAAAGAACTCCAAGTTGAGGGTTAAATTTCTAGGGAT
93+
TCTTTTATGGTTAGATGATCTAACACAGAATGATCTGGATAAATTTGATGCAGATAAATC
94+
AGATGAAAAGATTATATGGAATAACTGGCAAGTGTCAAGAGATATGAATACTGGACCAAT
95+
AGACTTAATGATAAGCGGTTACTCTAGACAGCTGCGGATCACTGGGGAAGATGACAAATT
96+
GATTGCTGCTGAATTGCAGGTTACTAGATTGTCAGAAGATTTAATTTATAGACACGGTCA
97+
GGCAATGTTGAATAAGCCACACGGCTTAAAGCTTGAAAAAATGCAACCTGTGACTGAGAT
98+
GTCTAAACGATTACATTATATCGTTTTCCAGCAAAGATCACGGAAACGATACTTCTATTC
99+
TATATTACCCACCCAAGTAATTGAGGACCATAATTCTAGAGTTGAATCATCTAGGCTAAG
100+
CAGAGATTCAAAATGGGTTCCTGTATGCCCTGTTGCAATATCAAAACTCTACCAACAAGG
101+
ACGGCCTATACTTTCCAAAGTTAGAAATCTGAATATGCAGACTCATTCGCTTTCCAGAAT
102+
ACAAGTTAATGTAGATGAATATGCCATCACGAGAAGAGCACATTTTCAGAAAATGCCTTT
103+
CTTCGAAGGACCATCAATCCCTTCTGGTGGTATGGATTTGTCTGAGTTGATGAAATCTAC
104+
ATCCCTATTAAGCTTGAATTATGATAACATAAAAAATGCATCCTTATTGGACATGTCTAG
105+
GGTATTTAAGTGCAATGGCAGTGGAGATGACCAAATGGCTTTCGAATTTCTATCGGACGA
106+
AATTTTGGAGCAAGATGTAGTTGAAGAAATAGAATGCAACCCTATATTTTCTATTAGTTA
107+
TACAAAAAGAGGAGAATCCAATATGACTTATAAAAATGCTTTCCACAAAGCCTTAATCTC
108+
AGAATGTGACAAATTTGAAGAAGCATTTGACTTCCTCGACATGGGATTTTGCTCGAATGA
109+
AAATCTTAGTATTCTGGAGGAAATACATTGGATAATCAGTTATTTAAAAACAAATCAATG
110+
GTCTACGGAACTAGACAATTGTATTCACATGTGCATGTACAGGAATGGATATGATGCAGA
111+
ATATCATAAATTTGATATACCCTCTAAATTCCTCAAAGACCCAATAAACCGAACAATAAA
112+
TTGGACTGAAGTCATTGAATTTATATTATTAATTGAAGATTTCCAAACAAAAATTGAGCC
113+
ATGGTCTAGTATGAAGTCACACTTCTGTTCAAAAGCACACAGTGTAGCACTAGAGTGTAT
114+
GAAAAATGAGAAAAGATCATTGGCAGAATTTGTAGACAAAAGTAAGAAAACTGGCAAATC
115+
CAAATTTGACTTCTAAGGTATACACATGTAAAAGTAGTGTTTGTTTCTAAATAGGAGCAC
116+
ACTACT

0 commit comments

Comments
 (0)