ydataai · ssiegel · Nov 7, 2024
diff --git a/src/ydata_profiling/model/pandas/describe_categorical_pandas.py b/src/ydata_profiling/model/pandas/describe_categorical_pandas.py
@@ -19,7 +19,7 @@
 
 
 def get_character_counts_vc(vc: pd.Series) -> pd.Series:
-    series = pd.Series(vc.index, index=vc)
+    series = pd.Series(vc.index, index=vc, dtype=object)
     characters = series[series != ""].apply(list)
     characters = characters.explode()
 
@@ -169,7 +169,7 @@ def word_summary_vc(vc: pd.Series, stop_words: List[str] = []) -> dict:
     # TODO: configurable lowercase/punctuation etc.
     # TODO: remove punctuation in words
 
-    series = pd.Series(vc.index, index=vc)
+    series = pd.Series(vc.index, index=vc, dtype=object)
     word_lists = series.str.lower().str.split()
     words = word_lists.explode().str.strip(string.punctuation + string.whitespace)
     word_counts = pd.Series(words.index, index=words)
@@ -187,7 +187,7 @@ def word_summary_vc(vc: pd.Series, stop_words: List[str] = []) -> dict:
 
 
 def length_summary_vc(vc: pd.Series) -> dict:
-    series = pd.Series(vc.index, index=vc)
+    series = pd.Series(vc.index, index=vc, dtype=object)
     length = series.str.len()
     length_counts = pd.Series(length.index, index=length)
     length_counts = length_counts.groupby(level=0, sort=False).sum()

diff --git a/src/ydata_profiling/model/pandas/summary_pandas.py b/src/ydata_profiling/model/pandas/summary_pandas.py
@@ -36,7 +36,8 @@ def pandas_describe_1d(
     """
 
     # Make sure pd.NA is not in the series
-    series = series.fillna(np.nan)
+    with pd.option_context("future.no_silent_downcasting", True):
+        series = series.fillna(np.nan)
 
     if (
         isinstance(typeset, ProfilingTypeSet)

diff --git a/tests/unit/test_pd_future_infer_string.py b/tests/unit/test_pd_future_infer_string.py
@@ -0,0 +1,34 @@
+"""Regression test for profiling under pandas' ``future.infer_string`` option."""
+
+import pandas as pd
+import pytest
+
+from ydata_profiling import ProfileReport
+
+
+@pytest.fixture()
+def df():
+    """Build a three-row frame: an integer column and a column of empty strings."""
+    df = pd.DataFrame(
+        {
+            "foo": [1, 2, 3],
+            "bar": ["", "", ""],
+        }
+    )
+    return df
+
+
+def test_pd_future_infer_string(df: pd.DataFrame):
+    """Check that an HTML report renders while ``future.infer_string`` is on.
+
+    The fixture frame is created before the option is switched on, so only
+    objects built inside the ``with`` block are subject to string inference.
+    """
+    try:
+        pd.get_option("future.infer_string")
+    except KeyError:  # pandas' OptionError subclasses KeyError
+        pytest.skip("this pandas version has no 'future.infer_string' option")
+
+    with pd.option_context("future.infer_string", True):
+        profile_report = ProfileReport(df, title="Test Report", progress_bar=False)
+        assert len(profile_report.to_html()) > 0