diff --git a/DESCRIPTION b/DESCRIPTION index 22ce737..201b592 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,7 +1,7 @@ Package: strayr Type: Package Title: Ready-to-use Australian common structures and classifications and tools for working with them -Version: 0.2.2.9001 +Version: 0.2.2.9002 Authors@R: c(person("Will", "Mackey", email = "wfmackey@gmail.com", role = c("aut", "cre")), person("Matt", "Johnson", email = "mrjoh3@gmail.com", role = c("aut")), person("David", "Diviny", email = "david.diviny@nousgroup.com.au", role = c("aut")), diff --git a/NEWS.md b/NEWS.md index 051bedd..ecf718d 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,4 +1,5 @@ # strayr (development version) +* Threshold for fuzzy matching (`max_dist`) in `clean_state()` has been reduced from 0.4 to 0.2 * `create read_correspondence_tbl()` reads correspondence tables from `absmapsdata` similarly to `read_absmap()` * updated `anzsco2006` to include leading zeros in codes (see ). This is a backwards incompatible change that may cause issues (not enough for a major version progression) diff --git a/R/clean_state.R b/R/clean_state.R index a90f179..7e08a18 100644 --- a/R/clean_state.R +++ b/R/clean_state.R @@ -50,7 +50,7 @@ #' @importFrom stringdist amatch #' @export -clean_state <- function(x, to = "state_abbr", fuzzy_match = TRUE, max_dist = 0.4, method = "jw"){ +clean_state <- function(x, to = "state_abbr", fuzzy_match = TRUE, max_dist = 0.2, method = "jw"){ if(!is.logical(fuzzy_match)){ diff --git a/R/sysdata.rda b/R/sysdata.rda index fcac893..184a25d 100644 Binary files a/R/sysdata.rda and b/R/sysdata.rda differ diff --git a/data/anzsco2009.rda b/data/anzsco2009.rda index 4d05540..2c9f6f0 100644 Binary files a/data/anzsco2009.rda and b/data/anzsco2009.rda differ diff --git a/data/anzsco2013.rda b/data/anzsco2013.rda index 1d8b0ae..8314ddf 100644 Binary files a/data/anzsco2013.rda and b/data/anzsco2013.rda differ diff --git a/data/anzsco2019.rda b/data/anzsco2019.rda index a59323d..1f7a4c8 100644 Binary 
files a/data/anzsco2019.rda and b/data/anzsco2019.rda differ diff --git a/data/anzsco2021.rda b/data/anzsco2021.rda index 3a329b5..ec75ead 100644 Binary files a/data/anzsco2021.rda and b/data/anzsco2021.rda differ diff --git a/data/anzsco2022.rda b/data/anzsco2022.rda index a77148c..517c32f 100644 Binary files a/data/anzsco2022.rda and b/data/anzsco2022.rda differ diff --git a/data/anzsic2006.rda b/data/anzsic2006.rda index a261e14..b721718 100644 Binary files a/data/anzsic2006.rda and b/data/anzsic2006.rda differ diff --git a/data/anzsic_isic.rda b/data/anzsic_isic.rda index bf6e25d..cd809e9 100644 Binary files a/data/anzsic_isic.rda and b/data/anzsic_isic.rda differ diff --git a/data/asced_foe2001.rda b/data/asced_foe2001.rda index c883461..b437a34 100644 Binary files a/data/asced_foe2001.rda and b/data/asced_foe2001.rda differ diff --git a/data/asced_qual2001.rda b/data/asced_qual2001.rda index 2656010..8a5e7a2 100644 Binary files a/data/asced_qual2001.rda and b/data/asced_qual2001.rda differ diff --git a/data/palette_state_name_2016.rda b/data/palette_state_name_2016.rda index 320a91e..941276c 100644 Binary files a/data/palette_state_name_2016.rda and b/data/palette_state_name_2016.rda differ diff --git a/data/school_terms.rda b/data/school_terms.rda index aa09cac..80b8f62 100644 Binary files a/data/school_terms.rda and b/data/school_terms.rda differ diff --git a/data/state_abb_au.rda b/data/state_abb_au.rda index 30df4e1..ef55af9 100644 Binary files a/data/state_abb_au.rda and b/data/state_abb_au.rda differ diff --git a/data/state_name_au.rda b/data/state_name_au.rda index 4e95a90..6b7a357 100644 Binary files a/data/state_name_au.rda and b/data/state_name_au.rda differ diff --git a/man/clean_state.Rd b/man/clean_state.Rd index 95c4a62..8d93938 100644 --- a/man/clean_state.Rd +++ b/man/clean_state.Rd @@ -9,7 +9,7 @@ clean_state( x, to = "state_abbr", fuzzy_match = TRUE, - max_dist = 0.4, + max_dist = 0.2, method = "jw" )