diff --git a/ingest/defaults/annotations.tsv b/ingest/defaults/annotations.tsv index 6315093..a5f7a2a 100644 --- a/ingest/defaults/annotations.tsv +++ b/ingest/defaults/annotations.tsv @@ -294,3 +294,13 @@ KT163243 date 1968-XX-XX AF260968 date 1951-XX-XX AF260968 region Africa AF260968 country Egypt +AF260968 host Homo sapians +AF196835 host Phoenicopterus chilensis +AF196835 date 1999-XX-XX +AY765264 date 1997-XX-XX +AY765264 country Czech Republic +AY765264 region Europe +DQ318020 date 1972-XX-XX +DQ318020 host Culex tigripes +D00246 country Australia +D00246 date 1960-XX-XX \ No newline at end of file diff --git a/phylogenetic/build-configs/washington-state/config.yaml b/phylogenetic/build-configs/washington-state/config.yaml index 6268f41..a243cb7 100644 --- a/phylogenetic/build-configs/washington-state/config.yaml +++ b/phylogenetic/build-configs/washington-state/config.yaml @@ -20,7 +20,7 @@ subsampling: force_include: --exclude-all --include ../nextclade/defaults/include.txt refine: - treetime_params: --coalescent opt --clock-filter-iqd 4 --date-inference marginal --date-confidence + treetime_params: --coalescent opt --clock-filter-iqd 4 --date-inference marginal --date-confidence --clock-rate 0.000653 traits: metadata_columns: [ diff --git a/phylogenetic/defaults/config.yaml b/phylogenetic/defaults/config.yaml index a86b515..ef9c5c5 100644 --- a/phylogenetic/defaults/config.yaml +++ b/phylogenetic/defaults/config.yaml @@ -2,7 +2,7 @@ strain_id_field: "accession" # Use 'Egypt 1951' as the reference and root, following Mencattelli et al, 2023 # https://www.nature.com/articles/s41467-023-42185-7 reference: "defaults/reference_global.gb" -root: "AF260968" +root: "mid_point" # Sequences must be FASTA and metadata must be TSV # Both files must be zstd compressed @@ -69,7 +69,7 @@ subsampling: force_include: --exclude-all --include defaults/include.txt refine: - treetime_params: --coalescent opt --date-inference marginal --date-confidence + treetime_params: --coalescent opt --date-inference marginal --date-confidence --keep-polytomies --clock-rate 0.000755 traits: metadata_columns: [ diff --git a/phylogenetic/defaults/exclude.txt b/phylogenetic/defaults/exclude.txt index 49028e0..602d881 100644 --- a/phylogenetic/defaults/exclude.txt +++ b/phylogenetic/defaults/exclude.txt @@ -1,3 +1,4 @@ +AF260968 # Egypt 1951 will added back in during augur align reference HW816192 # 11029 bp PAT 27-MAY-2015 CS543188 # 11029 bp PAT 20-APR-2007 CS568914 # 11029 bp PAT 18-MAY-2007 @@ -53,3 +54,4 @@ OM202905 # Clusters below PAT FV537222 OM202932 # Clusters below PAT FV537222 FV537223 # Clusters below PAT FV537222 FV537222 # Clusters below PAT FV537222 +AY688948 # Laboratory strain Sarafend based on https://pmc.ncbi.nlm.nih.gov/articles/PMC3320449/ \ No newline at end of file diff --git a/phylogenetic/defaults/include.txt b/phylogenetic/defaults/include.txt index 8161a2a..bbef20d 100644 --- a/phylogenetic/defaults/include.txt +++ b/phylogenetic/defaults/include.txt @@ -1,4 +1,4 @@ -AF260968 # Egypt 1951 +# AF260968 # Egypt 1951 will be used as augur align reference NC_001563 # Lineage 2 reference NC_009942 # Lineage 1 reference HM051416 # Isreal 1953 @@ -68,3 +68,24 @@ KJ501222 # SW03 MG004537 # SW03 MF175866 # SW03 MG004540 # SW03 +MW383507 # Lineage 2 +HM147822 # Lineage 2 +GQ903680 # Lineage 2 +DQ176636 # Lineage 2 +KU978767 # Lineage 2 +HM147823 # Lineage 2 +PP445212 # Lineage 3 +AY765264 # Lineage 3 +AY277251 # Lineage 4 +FJ159131 # Lineage 4 +FJ159129 # Lineage 4 +FJ159130 # Lineage 4 +KJ831223 # Lineage 4 +KU978770 # Lineage 5 +DQ256376 # Lineage 5 +JX041632 # Lineage 5 +GQ851604 # Lineage 5 +GQ851605 # Lineage 5 +KY703855 # Lineage 7 +OP846972 # Lineage 7 +KY703856 # Lineage 8 diff --git a/phylogenetic/defaults/reference_global.gb b/phylogenetic/defaults/reference_global.gb index 61356c7..8e4fc84 100644 --- a/phylogenetic/defaults/reference_global.gb +++ b/phylogenetic/defaults/reference_global.gb @@ -1,6 +1,6 @@ -LOCUS AF260968_REF 11029 bp RNA linear VRL 27-AUG-2000 +LOCUS AF260968 11029 bp RNA linear VRL 27-AUG-2000 DEFINITION West Nile virus strain Eg101, complete genome. -ACCESSION AF260968_REF +ACCESSION AF260968 VERSION AF260968.1 KEYWORDS . SOURCE West Nile virus (WNV)