From 9db72f45a605eef10d02de0c25ab631b000c591c Mon Sep 17 00:00:00 2001
From: Adam Kania <48769688+remilvus@users.noreply.github.com>
Date: Wed, 7 Jun 2023 17:33:05 +0300
Subject: [PATCH] Load boston from url

---
 examples/clt_plot.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/examples/clt_plot.py b/examples/clt_plot.py
index 5219f2c..222040c 100644
--- a/examples/clt_plot.py
+++ b/examples/clt_plot.py
@@ -1,11 +1,17 @@
 import numpy as np
-from sklearn.datasets import load_boston
+import pandas as pd
 
 import deeprob.spn.structure as spn
 
 if __name__ == '__main__':
     # Load the boston dataset and binarize it
-    data, _ = load_boston(return_X_y=True)
+    # Read the whitespace-separated file from its URL, skipping the first 22 lines
+    # (presumably a descriptive header); sep is a raw-string regex.
+    data_url = "http://lib.stat.cmu.edu/datasets/boston"
+    raw_df = pd.read_csv(data_url, sep=r"\s+", skiprows=22, header=None)
+    # Stitch every even row to the first two columns of the odd row that follows it.
+    data = np.hstack([raw_df.values[::2, :], raw_df.values[1::2, :2]])
+
     avg_features = np.mean(data, axis=0)
     data = (data < avg_features).astype(np.float32)
     n_samples, n_features = data.shape