Transforming PHE COVID-19 data

This script splits the latest COVID-19 data from coronavirus.data.gov.uk into separate datasets for each geographic level, based on area_type. To allow users to join these data to boundaries from geoportal.statistics.gov.uk, observations are pivoted to a wide format (one column per date) so that each area_code value appears in only one row.

Load libraries

library(tidyverse)
library(janitor)
library(glue)

Create folder structure in your working directory

# Make sure the download and output folders exist in the working directory.
# showWarnings = FALSE keeps re-runs quiet when a folder is already present.
for (folder in c("daily_download", "daily_output")) {
  dir.create(folder, showWarnings = FALSE)
}

Download PHE data

# Date stamp used in every file name read or written by this script.
download_date <- Sys.Date()

# Fetch today's copy of each dataset unless it has already been downloaded.
# Each file is first written under a temporary ".part" name and only renamed
# to its final name once the transfer has succeeded. Downloading straight to
# the final name would let an interrupted transfer leave a truncated file
# that the file.exists() check treats as complete on the next run.
for (dataset in c("cases", "deaths")) {
  local_csv <- glue("daily_download/coronavirus_{dataset}_{download_date}.csv")

  if (!file.exists(local_csv)) {
    source_url <- glue("https://coronavirus.data.gov.uk/downloads/csv/coronavirus-{dataset}_latest.csv")
    partial_csv <- paste0(local_csv, ".part")

    # download.file() may either throw or return a non-zero status on failure;
    # handle both and never leave the partial file behind.
    status <- tryCatch(
      download.file(source_url, partial_csv),
      error = function(e) {
        unlink(partial_csv)
        stop(e)
      }
    )
    if (status != 0) {
      unlink(partial_csv)
      stop("Download of ", source_url, " failed with status ", status, call. = FALSE)
    }

    if (!file.rename(partial_csv, local_csv)) {
      stop("Could not move ", partial_csv, " to ", local_csv, call. = FALSE)
    }
  }
}

Load PHE data and clean up column names

# Paths of today's downloaded files.
cases_csv <- glue("daily_download/coronavirus_cases_{download_date}.csv")
deaths_csv <- glue("daily_download/coronavirus_deaths_{download_date}.csv")

# Read each file and normalise its column names with janitor::clean_names()
# so later steps can refer to the columns by clean, syntactic names.
phe_cases <- clean_names(read_csv(cases_csv))
phe_deaths <- clean_names(read_csv(deaths_csv))

Daily cases

# Daily lab-confirmed cases in wide format: one row per area and one column
# per specimen date, split into a list with one table per area_type.
clean_phe_cases_daily <- phe_cases %>%
  select(-cumulative_lab_confirmed_cases) %>%
  # Sort by date first so the date columns are created in chronological order.
  arrange(specimen_date) %>%
  pivot_wider(names_from = specimen_date, values_from = daily_lab_confirmed_cases) %>%
  clean_names() %>%
  # Split on area_type explicitly rather than relying on a group_by() made
  # before the reshape still being in effect here.
  group_split(area_type) %>%
  map(arrange, area_code)

# Name each table after its area type (spaces replaced by underscores).
# map_chr() returns a character vector, so str_replace_all() is not handed a
# list that it would have to coerce implicitly.
names(clean_phe_cases_daily) <- clean_phe_cases_daily %>%
  map_chr(~ .x$area_type[[1]]) %>%
  str_replace_all(" ", "_")

Cumulative cases

# Cumulative lab-confirmed cases in wide format: one row per area and one
# column per specimen date, split into a list with one table per area_type.
clean_phe_cases_cumulative <- phe_cases %>%
  select(-daily_lab_confirmed_cases) %>%
  # Sort by date first so the date columns are created in chronological order.
  arrange(specimen_date) %>%
  pivot_wider(names_from = specimen_date, values_from = cumulative_lab_confirmed_cases) %>%
  clean_names() %>%
  # Split on area_type explicitly rather than relying on a group_by() made
  # before the reshape still being in effect here.
  group_split(area_type) %>%
  map(arrange, area_code)

# Name each table after its area type (spaces replaced by underscores).
# map_chr() returns a character vector, so str_replace_all() is not handed a
# list that it would have to coerce implicitly.
names(clean_phe_cases_cumulative) <- clean_phe_cases_cumulative %>%
  map_chr(~ .x$area_type[[1]]) %>%
  str_replace_all(" ", "_")

Export cases data to .csv

# Write one daily and one cumulative CSV per area type. The files are named
# after the area type and the download date.
# walk() is used instead of map() because this step is run purely for its
# side effects; map() would collect and print a list of the written tables.
walk(names(clean_phe_cases_daily), function(area) {
  write_csv(clean_phe_cases_daily[[area]], glue("daily_output/{area}_daily_cases_{download_date}.csv"))
  write_csv(clean_phe_cases_cumulative[[area]], glue("daily_output/{area}_cumulative_cases_{download_date}.csv"))
})

Daily deaths

# Long-format daily deaths: drop the cumulative column, relabel the "UK"
# area type as "Nation", and sort by date so the pivoted date columns come
# out in chronological order.
deaths_daily_long <- phe_deaths %>%
  select(-cumulative_hospital_deaths) %>%
  mutate(area_type = if_else(area_type == "UK", "Nation", area_type)) %>%
  arrange(reporting_date)

# Wide format: one row per area and one column per reporting date.
clean_phe_deaths_daily <- clean_names(
  pivot_wider(
    deaths_daily_long,
    names_from = reporting_date,
    values_from = daily_hospital_deaths
  )
)

Cumulative deaths

# Long-format cumulative deaths: drop the daily column, relabel the "UK"
# area type as "Nation", and sort by date so the pivoted date columns come
# out in chronological order.
deaths_cumulative_long <- phe_deaths %>%
  select(-daily_hospital_deaths) %>%
  mutate(area_type = if_else(area_type == "UK", "Nation", area_type)) %>%
  arrange(reporting_date)

# Wide format: one row per area and one column per reporting date.
clean_phe_deaths_cumulative <- clean_names(
  pivot_wider(
    deaths_cumulative_long,
    names_from = reporting_date,
    values_from = cumulative_hospital_deaths
  )
)

Export deaths data to .csv

# Date-stamped output paths for the two deaths tables.
daily_deaths_csv <- glue("daily_output/Country_daily_deaths_{download_date}.csv")
cumulative_deaths_csv <- glue("daily_output/Country_cumulative_deaths_{download_date}.csv")

# Write the wide daily and cumulative deaths tables to disk.
write_csv(clean_phe_deaths_daily, daily_deaths_csv)
write_csv(clean_phe_deaths_cumulative, cumulative_deaths_csv)

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

README.md

README.md

Transforming PHE COVID-19 data

Load libraries

Create folder structure in your working directory

Download PHE data

Load PHE data and clean up column names

Daily cases

Cumulative cases

Export cases data to .csv

Daily deaths

Cumulative deaths

Export deaths data to .csv

Files

README.md

Latest commit

History

README.md

File metadata and controls

Transforming PHE COVID-19 data

Load libraries

Create folder structure in your working directory

Download PHE data

Load PHE data and clean up column names

Daily cases

Cumulative cases

Export cases data to .csv

Daily deaths

Cumulative deaths

Export deaths data to .csv