FIX: FutureWarning in heavy_tails (#581)

mmcky · web-flow · commit 3e07d3bd0389 · 2025-03-28T16:33:28.000+11:00
* FIX: FutureWarning in heavy_tails

* Update lectures/heavy_tails.md

* minor typo

* fix install of wbgapi

* fix cntry_mapper
diff --git a/lectures/heavy_tails.md b/lectures/heavy_tails.md
@@ -4,7 +4,7 @@ jupytext:
     extension: .md
     format_name: myst
     format_version: 0.13
-    jupytext_version: 1.16.1
+    jupytext_version: 1.16.7
 kernelspec:
   display_name: Python 3 (ipykernel)
   language: python
@@ -19,7 +19,7 @@ In addition to what's in Anaconda, this lecture will need the following librarie
 ```{code-cell} ipython3
 :tags: [hide-output]
 
-!pip install --upgrade yfinance pandas_datareader
+!pip install --upgrade yfinance wbgapi
 ```
 
 We use the following imports.
@@ -31,7 +31,7 @@ import yfinance as yf
 import pandas as pd
 import statsmodels.api as sm
 
-from pandas_datareader import wb
+import wbgapi as wb
 from scipy.stats import norm, cauchy
 from pandas.plotting import register_matplotlib_converters
 register_matplotlib_converters()
@@ -790,24 +790,21 @@ def empirical_ccdf(data,
 :tags: [hide-input]
 
 def extract_wb(varlist=['NY.GDP.MKTP.CD'], 
-               c='all_countries', 
+               c='all', 
                s=1900, 
                e=2021, 
                varnames=None):
-    if c == "all_countries":
-        # Keep countries only (no aggregated regions)
-        countries = wb.get_countries()
-        countries_name = countries[countries['region'] != 'Aggregates']['name'].values
-        c = "all"
     
-    df = wb.download(indicator=varlist, country=c, start=s, end=e).stack().unstack(0).reset_index()
-    df = df.drop(['level_1'], axis=1).transpose()
+    df = wb.data.DataFrame(varlist, economy=c, time=range(s, e+1, 1), skipAggs=True)
+    df.index.name = 'country'
+    
     if varnames is not None:
-        df.columns = varnames
-        df = df[1:]
+        df.columns = variable_names
+
+    cntry_mapper = pd.DataFrame(wb.economy.info().items)[['id','value']].set_index('id').to_dict()['value']
+    df.index = df.index.map(lambda x: cntry_mapper[x])  #map iso3c to name values
     
-    df1 =df[df.index.isin(countries_name)]
-    return df1
+    return df
 ```
 
 ### Firm size
@@ -914,9 +911,9 @@ variable_code = ['NY.GDP.MKTP.CD', 'NY.GDP.PCAP.CD']
 variable_names = ['GDP', 'GDP per capita']
 
 df_gdp1 = extract_wb(varlist=variable_code, 
-                     c="all_countries", 
-                     s="2021", 
-                     e="2021", 
+                     c="all", 
+                     s=2021, 
+                     e=2021, 
                      varnames=variable_names)
 df_gdp1.dropna(inplace=True)
 ```