-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig.yaml
More file actions
101 lines (101 loc) · 2.44 KB
/
config.yaml
File metadata and controls
101 lines (101 loc) · 2.44 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
# Accession of the reference sequence used for alignment.
# NOTE(review): looks like a RefSeq/GenBank accession — confirm how the
# consuming rules resolve it.
ALIGNMENT_REFERENCE:
  "NC_045512.2"
# VCF of problematic sites. The URL is pinned to a specific commit hash of
# W-L/ProblematicSites_SARS-CoV2 rather than to a branch name.
PROBLEMATIC_VCF:
  "https://raw.githubusercontent.com/W-L/ProblematicSites_SARS-CoV2/da322c32004f7b16bdaa6a8ee7fd24d56e79d9dc/problematic_sites_sarsCov2.vcf"
# Path to the genetic code table in JSON format.
# NOTE(review): presumably relative to the workflow root — confirm.
GENETIC_CODE_JSON:
  "config/standard_genetic_code.json"
# Substitution model string for tree building.
# NOTE(review): looks like IQ-TREE model syntax — confirm against the
# rule that consumes it.
TREE_MODEL:
  "GTR+F+I+G4"
# Replicate count and support threshold for the UFBOOT branch-support test.
# NOTE(review): the key name suggests ultrafast bootstrap — confirm.
# REPS/THRESHOLD must be nested here; left at top level they collide with
# the identically named keys under SHALRT.
UFBOOT:
  REPS: 1000
  THRESHOLD: 0.95
# Replicate count and support threshold for the SHALRT branch-support test.
# NOTE(review): the key name suggests the SH-aLRT test — confirm.
# REPS/THRESHOLD must be nested here; left at top level they collide with
# the identically named keys under UFBOOT.
SHALRT:
  REPS: 1000
  THRESHOLD: 0.80
# Quality, frequency and depth thresholds.
# NOTE(review): "VC" presumably stands for variant calling — confirm.
# These keys must be nested: MIN_QUALITY and MAX_DEPTH also exist under
# DEMIX and would otherwise be duplicate top-level keys.
VC:
  MIN_QUALITY: 20
  MIN_FREQ: 0.05
  MIN_DEPTH: 30
  MAX_DEPTH: 1000000
# Settings for the demixing (lineage abundance) step.
# NOTE(review): the option names resemble Freyja's demix parameters —
# confirm against the consuming rule before relying on that.
# These keys must be nested: MIN_QUALITY and MAX_DEPTH also exist under VC
# and would otherwise be duplicate top-level keys.
DEMIX:
  PATHOGEN: "SARS-CoV-2"
  MIN_QUALITY: 20
  MAX_DEPTH: 1000000
  COV_CUTOFF: 30
  MIN_ABUNDANCE: 0.0001
  CONFIRMED_ONLY: false
  DEPTH_CUTOFF: 0
  RELAXED_MRCA: false
  RELAXED_MRCA_THRESH: 0.9
  AUTO_ADAPT: false
  SOLVER: "CLARABEL"
# Sliding-window geometry: window width and step between windows.
# NOTE(review): units are presumably nucleotides — confirm.
WINDOW:
  WIDTH: 1000
  STEP: 50
# Selection of GenBank features by qualifier value.
# INCLUDE maps a qualifier name ("product") to the list of accepted values.
# NOTE(review): the "any"/"all" remarks presumably describe how multiple
# criteria are combined — confirm against the consuming script.
GB_FEATURES:
  INCLUDE:  # any
    product:
      - "ORF1ab polyprotein"
      - "surface glycoprotein"
      - "ORF3a protein"
      - "envelope protein"
      - "membrane glycoprotein"
      - "ORF6 protein"
      - "ORF7a protein"
      - "ORF7b"
      - "ORF8 protein"
      - "nucleocapsid phosphoprotein"
      - "ORF10 protein"
  # EXCLUDE: ...  # all
# Variant annotation settings.
# SNPEFF_COLS maps output column names to SnpEff/SnpSift field expressions.
# FILTER_INCLUDE / FILTER_EXCLUDE list column values to keep or drop.
# EFFECT and ERRORS appear both in SNPEFF_COLS and in FILTER_EXCLUDE, so
# the nesting below is required to avoid duplicate keys.
ANNOTATION:
  # see: https://pcingola.github.io/SnpEff/adds/VCFannotationformat_v1.0.pdf
  SNPEFF_COLS:
    CHROM: CHROM
    POS: POS
    REF: REF
    ALT: ALT
    EFFECT: "ANN[*].EFFECT"
    IMPACT: "ANN[*].IMPACT"
    BIOTYPE: "ANN[*].BIOTYPE"
    GENE: "ANN[*].GENE"
    GENEID: "ANN[*].GENEID"
    FEATURE: "ANN[*].FEATURE"
    FEATUREID: "ANN[*].FEATUREID"
    HGVS_P: "ANN[*].HGVS_P"
    HGVS_C: "ANN[*].HGVS_C"
    ERRORS: "ANN[*].ERRORS"
  # Intentionally left without entries (parses as null); the commented line
  # shows the expected shape of an entry.
  FILTER_INCLUDE:
    # IMPACT: [HIGH, MODERATE, LOW]
  FILTER_EXCLUDE:
    EFFECT: [upstream_gene_variant, downstream_gene_variant]
    ERRORS:
      - ERROR_CHROMOSOME_NOT_FOUND
      - ERROR_OUT_OF_CHROMOSOME_RANGE
      - WARNING_REF_DOES_NOT_MATCH_GENOME
      - WARNING_SEQUENCE_NOT_AVAILABLE
      - WARNING_TRANSCRIPT_INCOMPLETE
      - WARNING_TRANSCRIPT_MULTIPLE_STOP_CODONS
      - WARNING_TRANSCRIPT_NO_START_CODON
      - WARNING_TRANSCRIPT_NO_STOP_CODON
  # Template for variant names; the placeholders refer to SNPEFF_COLS names.
  # NOTE(review): placement under ANNOTATION is inferred — confirm that the
  # workflow reads it from this level.
  VARIANT_NAME_PATTERN: "{GENE}:{coalesce(HGVS_P, HGVS_C)}"
# GISAID access settings: path to a credentials file and the names of the
# date, location and accession columns.
# NOTE(review): which table these column names refer to is not visible
# here — confirm against the consuming rule.
GISAID:
  CREDENTIALS: "config/gisaid.yaml"
  DATE_COLUMN: "CollectionDate"
  LOCATION_COLUMN: "ResidenceCity"
  ACCESSION_COLUMN: "GISAIDEPI"
# Number of replicates for the diversity analysis.
# NOTE(review): presumably resampling/bootstrap replicates — confirm.
DIVERSITY_REPS:
  1000
# Boolean switch, disabled by default.
# NOTE(review): presumably toggles BIONJ for tree construction — confirm.
USE_BIONJ: false
# Correlation test settings.
# NOTE(review): METHOD/EXACT resemble the arguments of R's cor.test —
# confirm. EXACT is an explicit null, not a missing value.
COR:
  METHOD: "pearson"
  EXACT: null
# %-style log format string; the field names are Python logging LogRecord
# attributes. Must stay quoted: a plain scalar cannot start with "%".
LOG_PY_FMT:
  "%(asctime)s - %(name)s - %(levelname)-8s - %(message)s"
# Path to the R script with plot design settings.
# NOTE(review): presumably sourced by the plotting scripts — confirm.
PLOTS:
  "config/design_plots.R"
# Path to a CSV of genome regions used in plots.
# NOTE(review): the file name suggests NSP annotations — confirm its schema.
PLOT_GENOME_REGIONS:
  "config/nsp_annotation.csv"
# Quarto (.qmd) template for the report.
# NOTE(review): unlike the other paths this one has no "config/" prefix —
# confirm which directory it is resolved against.
REPORT_QMD:
  "template.qmd"
# Path to the stylesheet applied to the report.
REPORT_CSS:
  "config/report.styles.css"