MattCowgill
diff --git a/‎.Rbuildignore
+1 b/‎.Rbuildignore
+1
diff --git a/‎.github/workflows/covr.yaml
+48 b/‎.github/workflows/covr.yaml
+48
diff --git a/‎.github/workflows/pkgdown.yaml
+48 b/‎.github/workflows/pkgdown.yaml
+48
diff --git a/‎.gitignore
+1 b/‎.gitignore
+1
diff --git a/‎.travis.yml
-14 b/‎.travis.yml
-14
diff --git a/‎DESCRIPTION
+1-4 b/‎DESCRIPTION
+1-4
diff --git a/‎NAMESPACE
+1-6 b/‎NAMESPACE
+1-6
diff --git a/‎NEWS.md
+3 b/‎NEWS.md
+3
diff --git a/‎R/check_abs_connection.R
+2-1 b/‎R/check_abs_connection.R
+2-1
diff --git a/‎R/download_abs.R
+4-2 b/‎R/download_abs.R
+4-2
diff --git a/‎R/download_data_cube.r
+2-4 b/‎R/download_data_cube.r
+2-4
diff --git a/‎R/extract_abs_sheets.R
-1 b/‎R/extract_abs_sheets.R
-1
diff --git a/‎R/get_abs_xml_metadata.R
+2-2 b/‎R/get_abs_xml_metadata.R
+2-2
diff --git a/‎R/get_available_files.r
+5-7 b/‎R/get_available_files.r
+5-7
diff --git a/‎R/read_abs.R
+1-1 b/‎R/read_abs.R
+1-1
diff --git a/‎R/read_abs_local.R
+1-1 b/‎R/read_abs_local.R
+1-1
diff --git a/‎R/read_abs_sdmx.R
+1 b/‎R/read_abs_sdmx.R
+1
diff --git a/‎R/read_awe.R
+2-2 b/‎R/read_awe.R
+2-2
diff --git a/‎R/scrape_abs_catalogues.r
+12-12 b/‎R/scrape_abs_catalogues.r
+12-12
@@ -14,3 +14,4 @@
 ^doc$
 ^Meta$
 ^data-raw$
+^pkgdown$
@@ -0,0 +1,48 @@
+on:
+  push:
+    branches:
+      - main
+      - master
+  pull_request:
+    branches:
+      - main
+      - master
+
+name: test-coverage
+
+jobs:
+  test-coverage:
+    runs-on: macOS-latest
+    env:
+      GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
+    steps:
+      - uses: actions/checkout@v2
+
+      - uses: r-lib/actions/setup-r@v1
+
+      - uses: r-lib/actions/setup-pandoc@v1
+
+      - name: Query dependencies
+        run: |
+          install.packages('remotes')
+          saveRDS(remotes::dev_package_deps(dependencies = TRUE), ".github/depends.Rds", version = 2)
+          writeLines(sprintf("R-%i.%i", getRversion()$major, getRversion()$minor), ".github/R-version")
+        shell: Rscript {0}
+
+      - name: Cache R packages
+        uses: actions/cache@v2
+        with:
+          path: ${{ env.R_LIBS_USER }}
+          key: ${{ runner.os }}-${{ hashFiles('.github/R-version') }}-1-${{ hashFiles('.github/depends.Rds') }}
+          restore-keys: ${{ runner.os }}-${{ hashFiles('.github/R-version') }}-1-
+
+      - name: Install dependencies
+        run: |
+          install.packages(c("remotes"))
+          remotes::install_deps(dependencies = TRUE)
+          remotes::install_cran("covr")
+        shell: Rscript {0}
+
+      - name: Test coverage
+        run: covr::codecov()
+        shell: Rscript {0}
@@ -0,0 +1,48 @@
+on:
+  push:
+    branches:
+      - main
+      - master
+
+name: pkgdown
+
+jobs:
+  pkgdown:
+    runs-on: macOS-latest
+    env:
+      GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
+    steps:
+      - uses: actions/checkout@v2
+
+      - uses: r-lib/actions/setup-r@v1
+
+      - uses: r-lib/actions/setup-pandoc@v1
+
+      - name: Query dependencies
+        run: |
+          install.packages('remotes')
+          saveRDS(remotes::dev_package_deps(dependencies = TRUE), ".github/depends.Rds", version = 2)
+          writeLines(sprintf("R-%i.%i", getRversion()$major, getRversion()$minor), ".github/R-version")
+        shell: Rscript {0}
+
+      - name: Cache R packages
+        uses: actions/cache@v2
+        with:
+          path: ${{ env.R_LIBS_USER }}
+          key: ${{ runner.os }}-${{ hashFiles('.github/R-version') }}-1-${{ hashFiles('.github/depends.Rds') }}
+          restore-keys: ${{ runner.os }}-${{ hashFiles('.github/R-version') }}-1-
+
+      - name: Install dependencies
+        run: |
+          remotes::install_deps(dependencies = TRUE)
+          install.packages("pkgdown", type = "binary")
+        shell: Rscript {0}
+
+      - name: Install package
+        run: R CMD INSTALL .
+
+      - name: Deploy package
+        run: |
+          git config --local user.email "actions@github.com"
+          git config --local user.name "GitHub Actions"
+          Rscript -e 'pkgdown::deploy_to_branch(new_process = FALSE)'
@@ -8,3 +8,4 @@ data
 .DS_Store
 doc
 .Rhistory (8140V-144300-W's conflicted copy 2020-09-19)
+docs
@@ -1,7 +1,7 @@
 Package: readabs
 Type: Package
 Title: Download and Tidy Time Series Data from the Australian Bureau of Statistics
-Version: 0.4.6
+Version: 0.4.6.900
 Authors@R: c(
            person("Matt", "Cowgill", role = c("aut", "cre"), email = "[email protected]"),
            person("Zoe", "Meers", role = "aut", email = "[email protected]"),
@@ -18,14 +18,12 @@ LazyData: true
 Depends: R (>= 3.5)
 Imports: 
     readxl (>= 1.2.0), 
-    tibble (>= 1.4.99),
     dplyr (>= 0.8.0), 
     hutils (>= 1.5.0),
     fst,
     curl,
     purrr,
     tidyr (>= 1.0.0), 
-    stringr,
     stringi,
     rsdmx, 
     tools,
@@ -42,5 +40,4 @@ Suggests:
     knitr,
     rmarkdown,
     testthat (>= 2.1.0),
-    RCurl,
     ggplot2
@@ -25,6 +25,7 @@ importFrom(dplyr,pull)
 importFrom(dplyr,select)
 importFrom(dplyr,slice)
 importFrom(dplyr,sym)
+importFrom(dplyr,tibble)
 importFrom(glue,glue)
 importFrom(httr,GET)
 importFrom(purrr,map)
@@ -42,12 +43,6 @@ importFrom(rvest,html_attr)
 importFrom(rvest,html_nodes)
 importFrom(rvest,html_text)
 importFrom(stringi,stri_trim_both)
-importFrom(stringr,str_count)
-importFrom(stringr,str_extract)
-importFrom(stringr,str_remove)
-importFrom(stringr,str_replace_all)
-importFrom(stringr,str_trim)
-importFrom(tibble,tibble)
 importFrom(tidyr,gather)
 importFrom(tidyr,pivot_longer)
 importFrom(tidyr,separate)
 
@@ -1,3 +1,6 @@
+# readabs 0.4.6.900
+* Package dependencies reduced
+
 # readabs 0.4.6
 * New read_payrolls() convenience function added
 * New read_awe() convenience function added
 
@@ -27,7 +27,8 @@ test_abs_robots <- function() {
       suppressWarnings(utils::download.file(
         "https://www.abs.gov.au/robots.txt",
         destfile = tmp,
-        quiet = TRUE
+        quiet = TRUE,
+        headers = c("User-Agent" = readabs_user_agent)
       ))
       file.exists(tmp)
     },
 
@@ -21,7 +21,8 @@ download_abs <- function(urls,
       quiet = !show_progress_bars,
       destfile = filenames,
       method = "libcurl",
-      cacheOK = FALSE
+      cacheOK = FALSE,
+      headers = c("User-Agent" = readabs_user_agent)
     )
   } else {
     purrr::walk2(
@@ -30,7 +31,8 @@ download_abs <- function(urls,
       .f = utils::download.file,
       mode = "wb",
       quiet = !show_progress_bars,
-      cacheOK = FALSE
+      cacheOK = FALSE,
+      headers = c("User-Agent" = readabs_user_agent)
     )
   }
 
 
@@ -45,11 +45,8 @@
 #'
 #' @importFrom dplyr %>%
 #' @importFrom glue glue
-#' @importFrom xml2 read_html
 #' @importFrom dplyr filter pull slice
-#' @importFrom tibble tibble
 #' @importFrom rvest html_nodes html_attr html_text
-#' @importFrom stringr str_remove str_extract str_replace_all
 #' @importFrom httr GET
 #'
 #' @export
@@ -82,7 +79,8 @@ download_abs_data_cube <- function(catalogue_string,
 
 
   # ==================download file======================
-  download_object <- httr::GET(file_download_url)
+  download_object <- httr::GET(file_download_url,
+                               httr::user_agent(readabs_user_agent))
 
   # save file path to disk
 
 
@@ -14,7 +14,6 @@
 #' `Sys.getenv("R_READABS_PATH", unset = tempdir())`.
 #'
 #' @importFrom readxl excel_sheets read_excel
-#' @importFrom tibble tibble
 #' @importFrom dplyr filter "%>%"
 #' @importFrom purrr map set_names
 #' @importFrom tools file_path_sans_ext
 
@@ -1,5 +1,4 @@
 
-#' @importFrom utils download.file
 #' @import dplyr
 
 # given a catalogue number, download the catalogue metadata via XML, then find
@@ -28,7 +27,8 @@ get_abs_xml_metadata <- function(url, issue = "latest") {
   # doesn't work then we try with a leading zero ("01"). If that fails,
   # it's an error.
 
-  first_page <- xml2::read_xml(first_url, encoding = "ISO-8859-1")
+  first_page <- xml2::read_xml(first_url, encoding = "ISO-8859-1",
+                               user_agent = readabs_user_agent)
   first_page_list <- xml2::as_list(first_page)
   first_page_list <- first_page_list[[1]]
   first_url_works <- ifelse(length(first_page_list) > 0,
 
@@ -19,11 +19,8 @@
 #' }
 #'
 #' @importFrom glue glue
-#' @importFrom xml2 read_html
-#' @importFrom dplyr  %>% filter pull slice
-#' @importFrom tibble tibble
+#' @importFrom dplyr  %>% filter pull slice tibble
 #' @importFrom rvest html_nodes html_attr html_text
-#' @importFrom stringr str_extract str_replace_all
 #' @importFrom rlang .data
 #'
 #' @export
@@ -52,7 +49,8 @@ get_available_files <- function(catalogue_string, refresh = FALSE) {
 
   # Try to download the page
   download_page <- tryCatch(
-    xml2::read_html(download_url),
+    xml2::read_html(download_url,
+                    user_agent = readabs_user_agent),
     error = function(cond) {
       message(paste("URL does not seem to exist:", download_url))
       message("Here's the original error message:")
@@ -85,11 +83,11 @@ get_available_files <- function(catalogue_string, refresh = FALSE) {
   }
 
 
-  available_downloads <- tibble::tibble(
+  available_downloads <- dplyr::tibble(
     url = urls,
     label = labels
   ) %>%
-    mutate(file = str_extract(url, "[^/]*$")) %>%
+    mutate(file = stringi::stri_extract_first_regex(url, "[^/]*$")) %>%
     select(.data$label, .data$file, .data$url)
 
   return(available_downloads)
 
@@ -92,7 +92,7 @@ read_abs <- function(cat_no = NULL,
       )
     }
     out <- fst::read_fst(path = catno2fst(cat_no = cat_no, path = path))
-    out <- tibble::as_tibble(out)
+    out <- dplyr::as_tibble(out)
     if (is.null(series_id)) {
       return(out)
     }
 
@@ -81,7 +81,7 @@ read_abs_local <- function(cat_no = NULL,
   # Retrieve cache if available
   if (is.null(filenames) && isTRUE(use_fst) && fst_available(cat_no, path)) {
     out <- fst::read_fst(path = catno2fst(cat_no = cat_no, path = path))
-    return(tibble::as_tibble(out))
+    return(dplyr::as_tibble(out))
   }
 
   # If catalogue number is specifid, that takes precedence
 
@@ -23,6 +23,7 @@
 #' }
 #'
 read_abs_sdmx <- function(url) {
+  .Deprecated(msg = "read_abs_sdmx() is deprecated and will be removed in a future version.")
   url <- url
   dataset <- rsdmx::readSDMX(url)
   abs_data <- as.data.frame(dataset)
 
@@ -114,9 +114,9 @@ tidy_awe <- function(df) {
 
   df$measure <- gsub(";", "", df$measure, fixed = TRUE)
   df$measure <- tolower(df$measure)
-  df$measure <- stringr::str_squish(df$measure)
+  df$measure <- fast_str_squish(df$measure)
 
-  df$sex <- stringr::str_squish(df$sex)
+  df$sex <- fast_str_squish(df$sex)
   df$sex <- tolower(df$sex)
 
   df <- df %>%
 
@@ -8,21 +8,20 @@
 #' @importFrom glue glue
 #' @importFrom xml2 read_html
 #' @importFrom dplyr  %>% filter pull slice
-#' @importFrom tibble tibble
 #' @importFrom rvest html_nodes html_attr html_text
-#' @importFrom stringr str_trim str_remove
 #' @importFrom purrr map_dfr
 #' @importFrom rlang .data
 #'
 
 scrape_abs_catalogues <- function() {
 
   # scrape the main page
-  abs_stats_page <- xml2::read_html("https://www.abs.gov.au/statistics")
+  abs_stats_page <- xml2::read_html("https://www.abs.gov.au/statistics",
+                                    user_agent = readabs_user_agent)
 
-  main_page_data <- tibble::tibble(
-    heading = abs_stats_page %>% rvest::html_nodes(".field--type-ds h3") %>% rvest::html_text() %>% stringr::str_trim(),
-    url_suffix = abs_stats_page %>% rvest::html_nodes(".card") %>% rvest::html_attr("href") %>% stringr::str_trim()
+  main_page_data <- dplyr::tibble(
+    heading = abs_stats_page %>% rvest::html_nodes(".field--type-ds h3") %>% rvest::html_text() %>% stringi::stri_trim_both(),
+    url_suffix = abs_stats_page %>% rvest::html_nodes(".card") %>% rvest::html_attr("href") %>% stringi::stri_trim_both()
   )
 
   # scrape each page
@@ -31,15 +30,16 @@ scrape_abs_catalogues <- function() {
     main_page_heading <- main_page_data$heading[main_page_data$url_suffix == sub_page_url_suffix]
 
 
-    sub_page <- xml2::read_html(glue::glue("https://www.abs.gov.au{sub_page_url_suffix}"))
+    sub_page <- xml2::read_html(glue::glue("https://www.abs.gov.au{sub_page_url_suffix}"),
+                                user_agent = readabs_user_agent)
 
-    sub_page_data <- tibble::tibble(
+    sub_page_data <- dplyr::tibble(
       heading = main_page_heading,
-      sub_heading = sub_page %>% rvest::html_nodes(".abs-layout-title") %>% rvest::html_text() %>% str_trim(),
+      sub_heading = sub_page %>% rvest::html_nodes(".abs-layout-title") %>% rvest::html_text() %>% stringi::stri_trim_both(),
       catalogue = sub_page %>% rvest::html_nodes("#content .card") %>% rvest::html_attr("href") %>%
-        stringr::str_remove(sub_page_url_suffix) %>%
-        stringr::str_remove("/[^/]*$") %>%
-        stringr::str_remove("/"),
+        stringi::stri_replace_all_fixed(sub_page_url_suffix, "") %>%
+        stringi::stri_replace_all_regex("/[^/]*$", "") %>%
+        stringi::stri_replace_all_fixed("/", ""),
       url = glue::glue("https://www.abs.gov.au{sub_page_url_suffix}/{catalogue}/latest-release")
     )
   }
Original file line number	Diff line number	Diff line change
`@@ -21,7 +21,8 @@ download_abs <- function(urls,`
`21`	`21`	`quiet = !show_progress_bars,`
`22`	`22`	`destfile = filenames,`
`23`	`23`	`method = "libcurl",`
`24`		`- cacheOK = FALSE`
	`24`	`+ cacheOK = FALSE,`
	`25`	`+ headers = c("User-Agent" = readabs_user_agent)`
`25`	`26`	`)`
`26`	`27`	`} else {`
`27`	`28`	`purrr::walk2(`
`@@ -30,7 +31,8 @@ download_abs <- function(urls,`
`30`	`31`	`.f = utils::download.file,`
`31`	`32`	`mode = "wb",`
`32`	`33`	`quiet = !show_progress_bars,`
`33`		`- cacheOK = FALSE`
	`34`	`+ cacheOK = FALSE,`
	`35`	`+ headers = c("User-Agent" = readabs_user_agent)`
`34`	`36`	`)`
`35`	`37`	`}`
`36`	`38`
Original file line number	Diff line number	Diff line change
`@@ -92,7 +92,7 @@ read_abs <- function(cat_no = NULL,`
`92`	`92`	`)`
`93`	`93`	`}`
`94`	`94`	`out <- fst::read_fst(path = catno2fst(cat_no = cat_no, path = path))`
`95`		`- out <- tibble::as_tibble(out)`
	`95`	`+ out <- dplyr::as_tibble(out)`
`96`	`96`	`if (is.null(series_id)) {`
`97`	`97`	`return(out)`
`98`	`98`	`}`
Original file line number	Diff line number	Diff line change
`@@ -81,7 +81,7 @@ read_abs_local <- function(cat_no = NULL,`
`81`	`81`	`# Retrieve cache if available`
`82`	`82`	`if (is.null(filenames) && isTRUE(use_fst) && fst_available(cat_no, path)) {`
`83`	`83`	`out <- fst::read_fst(path = catno2fst(cat_no = cat_no, path = path))`
`84`		`- return(tibble::as_tibble(out))`
	`84`	`+ return(dplyr::as_tibble(out))`
`85`	`85`	`}`
`86`	`86`
`87`	`87`	`# If catalogue number is specifid, that takes precedence`