From 6ffef83aef61fcc4a98c13cec33c1bcead6a9a62 Mon Sep 17 00:00:00 2001 From: e-belfer Date: Thu, 24 Oct 2024 15:51:10 -0400 Subject: [PATCH 1/3] Add first WIP draft of diverse filetypes lesson --- episodes/working-with-diverse-filetypes.md | 31 ++++++++++++++++++++++ 1 file changed, 31 insertions(+) create mode 100644 episodes/working-with-diverse-filetypes.md diff --git a/episodes/working-with-diverse-filetypes.md b/episodes/working-with-diverse-filetypes.md new file mode 100644 index 0000000..09f85f6 --- /dev/null +++ b/episodes/working-with-diverse-filetypes.md @@ -0,0 +1,31 @@ +--- +title: "Handling diverse filetypes in Pandas" +teaching: 10 +exercises: 2 +--- + +:::::::::::::::::::::::::::::::::::::: questions + +- How can I read different tabular data formats into a familiar format in Python? +- What are some common errors that occur when importing data, and how can I troubleshoot them? + +:::::::::::::::::::::::::::::::::::::::::::::::: + +::::::::::::::::::::::::::::::::::::: objectives + +- Import tabular data from XML, JSON, and Parquet formats into pandas DataFrames using the `pandas` library +- Import a table from a SQL database using the `pandas` library +- Implement strategies to handle common errors on data import + +:::::::::::::::::::::::::::::::::::::::::::::::: + + +::::::::::::::::::::::::::::::::::::: keypoints + +- `pandas` has functionality to read in many data formats (e.g., XML, JSON, SQL, +Parquet) into the same kind of DataFrame in Python. We can take advantage of this to +transform many kinds of data with similar functions in Python. +- `pandas` accepts both relative and absolute file paths on read-in. 
+ +:::::::::::::::::::::::::::::::::::::::::::::::: + From af27d5eefa96cc538d932a7fc13de09ee64207e5 Mon Sep 17 00:00:00 2001 From: e-belfer Date: Thu, 24 Oct 2024 15:52:01 -0400 Subject: [PATCH 2/3] Add to episodes in config.yaml --- config.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/config.yaml b/config.yaml index c376faf..ab07bef 100644 --- a/config.yaml +++ b/config.yaml @@ -67,6 +67,7 @@ contact: 'hello@catalyst.coop' # Order of episodes in your lesson episodes: - introduction.md +- working-with-diverse-filetypes.md # Information for Learners learners: From f2b01dfd586f4a68cf304cc845c276bb1ad5ab04 Mon Sep 17 00:00:00 2001 From: e-belfer Date: Thu, 24 Oct 2024 15:54:18 -0400 Subject: [PATCH 3/3] Set teaching and exercises time to 0 --- episodes/working-with-diverse-filetypes.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/episodes/working-with-diverse-filetypes.md b/episodes/working-with-diverse-filetypes.md index 09f85f6..fff1e95 100644 --- a/episodes/working-with-diverse-filetypes.md +++ b/episodes/working-with-diverse-filetypes.md @@ -1,7 +1,7 @@ --- title: "Handling diverse filetypes in Pandas" -teaching: 10 -exercises: 2 +teaching: 0 +exercises: 0 --- :::::::::::::::::::::::::::::::::::::: questions