diff --git a/ingest/build-configs/ncbi/defaults/annotations.tsv b/ingest/build-configs/ncbi/defaults/annotations.tsv index b0c03f6..2259113 100644 --- a/ingest/build-configs/ncbi/defaults/annotations.tsv +++ b/ingest/build-configs/ncbi/defaults/annotations.tsv @@ -5,5 +5,4 @@ # Lines starting with '#' are treated as comments # Any '#' after the field value are treated as comments. A/environment/USA/CO-UW-9084466/2024 division Colorado # Based on linked BioSample https://www.ncbi.nlm.nih.gov/biosample/SAMN41462555 -A/domesticcat/UnitedStates/24-009311-006/2024 division ? # Better to unknown division be listed as unknown than as "USA" A/environment/USA/CO-UW-9084466/2024 host Cattle # This sequence from commercial milk is definitively from cattle, strain name guidelines are going to be updated here diff --git a/ingest/defaults/geolocation_rules.tsv b/ingest/defaults/geolocation_rules.tsv index 4ea4caa..6491d27 100644 --- a/ingest/defaults/geolocation_rules.tsv +++ b/ingest/defaults/geolocation_rules.tsv @@ -1,5 +1,6 @@ -North America/USA// North America/USA/USA/USA -North America/USA/UNK/UNK North America/USA/USA/USA +# Better for an unknown division to be listed as unknown than as "USA" +North America/USA// North America/USA/?/? +North America/USA/UNK/UNK North America/USA/?/? North America/USA/CA/CA North America/USA/California/California North America/USA/KS/KS North America/USA/Kansas/Kansas North America/USA/MI/MI North America/USA/Michigan/Michigan