GitHub - ONSgeo/PHE_data_for_geospatial: Transforming PHE COVID-19 data to allow joining to statistical geographies.

Transforming PHE COVID-19 data

This script splits the latest COVID-19 data from coronavirus.data.gov.uk into separate tables, one per geography level, based on area_type. To allow users to join these data to boundaries from geoportal.statistics.gov.uk, observations are pivoted so that all area_code values are unique.

Load libraries

library(tidyverse)
library(janitor)
library(glue)

Create folder structure in your working directory

# Create the download and output folders in the working directory.
# showWarnings = FALSE keeps re-runs quiet when the folders already exist.
invisible(lapply(
  c("daily_download", "daily_output"),
  dir.create,
  showWarnings = FALSE
))

Download PHE data

# Date stamp shared by every downloaded and exported file name.
download_date <- Sys.Date()

# Download `url` to `destfile` unless `destfile` already exists.
#
# The transfer is written to a ".part" file beside the destination and is
# renamed only after download.file() reports success (status 0). Because the
# existence check treats any file at `destfile` as a finished download, this
# stops an interrupted transfer from leaving a truncated CSV that later runs
# on the same day would silently reuse.
#
# Returns `destfile` invisibly; stops with an error if the download or the
# rename fails.
download_if_missing <- function(url, destfile) {
  if (file.exists(destfile)) {
    return(invisible(destfile))
  }
  partial <- paste0(destfile, ".part")
  # Remove the partial file on every exit path; after a successful rename it
  # no longer exists and unlink() does nothing.
  on.exit(unlink(partial), add = TRUE)
  status <- download.file(url, partial)
  if (status != 0 || !file.rename(partial, destfile)) {
    stop("Could not download ", url, " to ", destfile, call. = FALSE)
  }
  invisible(destfile)
}

download_if_missing(
  "https://coronavirus.data.gov.uk/downloads/csv/coronavirus-cases_latest.csv",
  glue("daily_download/coronavirus_cases_{download_date}.csv")
)
download_if_missing(
  "https://coronavirus.data.gov.uk/downloads/csv/coronavirus-deaths_latest.csv",
  glue("daily_download/coronavirus_deaths_{download_date}.csv")
)

Load PHE data and clean up column names

# Read today's downloaded CSVs and normalise their column names with
# janitor::clean_names().
phe_cases <- glue("daily_download/coronavirus_cases_{download_date}.csv") %>%
  read_csv() %>%
  clean_names()

phe_deaths <- glue("daily_download/coronavirus_deaths_{download_date}.csv") %>%
  read_csv() %>%
  clean_names()

Daily cases

# Daily lab-confirmed cases, reshaped to one column per specimen date and
# split into a list holding one table per area_type.
clean_phe_cases_daily <- phe_cases %>%
  select(-cumulative_lab_confirmed_cases) %>%
  # Sorting before the pivot presumably makes the date columns come out in
  # chronological order - confirm against pivot_wider()'s column ordering.
  arrange(specimen_date) %>%
  group_by(area_type) %>%
  pivot_wider(
    names_from = specimen_date,
    values_from = daily_lab_confirmed_cases
  ) %>%
  clean_names() %>%
  group_split() %>%
  map(function(area_table) arrange(area_table, area_code))

# Name each table after the area_type found in its first row, with spaces
# replaced by underscores; these names are later used in output file names.
names(clean_phe_cases_daily) <- clean_phe_cases_daily %>%
  map(function(area_table) area_table[[1, "area_type"]]) %>%
  str_replace_all(" ", "_")

Cumulative cases

# Cumulative lab-confirmed cases, reshaped to one column per specimen date and
# split into a list holding one table per area_type.
clean_phe_cases_cumulative <- phe_cases %>%
  select(-daily_lab_confirmed_cases) %>%
  # Sorting before the pivot presumably makes the date columns come out in
  # chronological order - confirm against pivot_wider()'s column ordering.
  arrange(specimen_date) %>%
  group_by(area_type) %>%
  pivot_wider(
    names_from = specimen_date,
    values_from = cumulative_lab_confirmed_cases
  ) %>%
  clean_names() %>%
  group_split() %>%
  map(function(area_table) arrange(area_table, area_code))

# Name each table after the area_type found in its first row, with spaces
# replaced by underscores; these names are later used in output file names.
names(clean_phe_cases_cumulative) <- clean_phe_cases_cumulative %>%
  map(function(area_table) area_table[[1, "area_type"]]) %>%
  str_replace_all(" ", "_")

Export cases data to .csv

# Write one daily and one cumulative CSV per area_type into daily_output/.
# Both lists are indexed by the names of the daily list, so the two files
# written for a given name share the same area_type prefix.
#
# walk() rather than map(): the calls are made only for their file-writing
# side effect, and walk() returns its input invisibly instead of building
# (and printing, when run at top level) a list of the written tables.
walk(names(clean_phe_cases_daily), function(x) {
  write_csv(
    clean_phe_cases_daily[[x]],
    glue("daily_output/{x}_daily_cases_{download_date}.csv")
  )
  write_csv(
    clean_phe_cases_cumulative[[x]],
    glue("daily_output/{x}_cumulative_cases_{download_date}.csv")
  )
})

Daily deaths

# Daily hospital deaths, reshaped to one column per reporting date.
# Rows with area_type "UK" are relabelled "Nation"; every other area_type is
# kept as it is.
clean_phe_deaths_daily <- phe_deaths %>%
  mutate(area_type = if_else(area_type == "UK", "Nation", area_type)) %>%
  select(-cumulative_hospital_deaths) %>%
  arrange(reporting_date) %>%
  pivot_wider(
    names_from = reporting_date,
    values_from = daily_hospital_deaths
  ) %>%
  clean_names()

Cumulative deaths

# Cumulative hospital deaths, reshaped to one column per reporting date.
# Rows with area_type "UK" are relabelled "Nation"; every other area_type is
# kept as it is.
clean_phe_deaths_cumulative <- phe_deaths %>%
  mutate(area_type = if_else(area_type == "UK", "Nation", area_type)) %>%
  select(-daily_hospital_deaths) %>%
  arrange(reporting_date) %>%
  pivot_wider(
    names_from = reporting_date,
    values_from = cumulative_hospital_deaths
  ) %>%
  clean_names()

Export deaths data to .csv

# Write the pivoted deaths tables to daily_output/, stamped with the
# download date.
write_csv(
  clean_phe_deaths_daily,
  glue("daily_output/Country_daily_deaths_{download_date}.csv")
)
write_csv(
  clean_phe_deaths_cumulative,
  glue("daily_output/Country_cumulative_deaths_{download_date}.csv")
)

Name		Name	Last commit message	Last commit date
Latest commit History 8 Commits
README.md		README.md
cleaning_up_PHE_data.R		cleaning_up_PHE_data.R

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Repository files navigation

Transforming PHE COVID-19 data

Load libraries

Create folder structure in your working directory

Download PHE data

Load PHE data and clean up column names

Daily cases

Cumulative cases

Export cases data to .csv

Daily deaths

Cumulative deaths

Export deaths data to .csv

About

Releases

Packages

Languages

ONSgeo/PHE_data_for_geospatial

Folders and files

Latest commit

History

Repository files navigation

Transforming PHE COVID-19 data

Load libraries

Create folder structure in your working directory

Download PHE data

Load PHE data and clean up column names

Daily cases

Cumulative cases

Export cases data to .csv

Daily deaths

Cumulative deaths

Export deaths data to .csv

About

Resources

Stars

Watchers

Forks

Releases

Packages 0

Languages

Packages