From 7c1d9b5d3397334ce8d79ffd48ac31449d72b730 Mon Sep 17 00:00:00 2001 From: Rob <62107751+robsdavis@users.noreply.github.com> Date: Mon, 4 Sep 2023 09:49:47 +0100 Subject: [PATCH] Update airfoil URL (#231) * Update airfoil URL * fix columns headers --- tests/plugins/core/models/helpers.py | 5 ++--- tests/plugins/domain_adaptation/da_helpers.py | 5 ++--- tests/plugins/generic/generic_helpers.py | 5 ++--- tests/plugins/privacy/fhelpers.py | 5 ++--- tests/utils/test_compression.py | 17 +++++++++++------ 5 files changed, 19 insertions(+), 18 deletions(-) diff --git a/tests/plugins/core/models/helpers.py b/tests/plugins/core/models/helpers.py index d792833c..9e0c6b2e 100644 --- a/tests/plugins/core/models/helpers.py +++ b/tests/plugins/core/models/helpers.py @@ -4,9 +4,8 @@ def get_airfoil_dataset() -> pd.DataFrame: df = pd.read_csv( - "https://www.neuraldesigner.com/files/datasets/airfoil_self_noise.csv", - # "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", # TODO: change to this source? - sep=";", + "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", + sep="\t", engine="python", ) df.columns = df.columns.astype(str) diff --git a/tests/plugins/domain_adaptation/da_helpers.py b/tests/plugins/domain_adaptation/da_helpers.py index 3dd06bcb..c3f0e05d 100644 --- a/tests/plugins/domain_adaptation/da_helpers.py +++ b/tests/plugins/domain_adaptation/da_helpers.py @@ -25,9 +25,8 @@ def from_serde() -> Plugin: def get_airfoil_dataset() -> pd.DataFrame: df = pd.read_csv( - "https://www.neuraldesigner.com/files/datasets/airfoil_self_noise.csv", - # "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", # TODO: change to this source? - sep=";", + "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", + sep="\t", engine="python", ) df.columns = df.columns.astype(str) diff --git a/tests/plugins/generic/generic_helpers.py b/tests/plugins/generic/generic_helpers.py index 8c0264fc..af2bcd88 100644 --- a/tests/plugins/generic/generic_helpers.py +++ b/tests/plugins/generic/generic_helpers.py @@ -31,9 +31,8 @@ def from_serde() -> Plugin: def get_airfoil_dataset() -> pd.DataFrame: df = pd.read_csv( - "https://www.neuraldesigner.com/files/datasets/airfoil_self_noise.csv", - # "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", # TODO: change to this source? - sep=";", + "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", + sep="\t", engine="python", ) df.columns = df.columns.astype(str) diff --git a/tests/plugins/privacy/fhelpers.py b/tests/plugins/privacy/fhelpers.py index 3dd06bcb..c3f0e05d 100644 --- a/tests/plugins/privacy/fhelpers.py +++ b/tests/plugins/privacy/fhelpers.py @@ -25,9 +25,8 @@ def from_serde() -> Plugin: def get_airfoil_dataset() -> pd.DataFrame: df = pd.read_csv( - "https://www.neuraldesigner.com/files/datasets/airfoil_self_noise.csv", - # "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", # TODO: change to this source? - sep=";", + "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", + sep="\t", engine="python", ) df.columns = df.columns.astype(str) diff --git a/tests/utils/test_compression.py b/tests/utils/test_compression.py index 75bc9507..6807da0f 100644 --- a/tests/utils/test_compression.py +++ b/tests/utils/test_compression.py @@ -8,10 +8,18 @@ def get_airfoil_dataset() -> pd.DataFrame: df = pd.read_csv( - "https://www.neuraldesigner.com/files/datasets/airfoil_self_noise.csv", - # "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", # TODO: change to this source? - sep=";", + "https://archive.ics.uci.edu/static/public/291/airfoil+self+noise.zip", + sep="\t", engine="python", + header=None, + names=[ + "frequency", + "angle_of_attack", + "chord_length", + "free_stream_velocity", + "suction_side_displacement_thickness", + "scaled_sound_pressure_level", + ], ) df.columns = df.columns.astype(str) @@ -77,10 +85,7 @@ def test_compression_sanity2() -> None: def test_compression_sanity_airfoil() -> None: df = get_airfoil_dataset() df["chord_length"] = df["chord_length"].astype(str) - print(df.head()) compressed_df, context = compress_dataset(df) - print(compressed_df) - print(context) assert len(compressed_df) == len(df) assert compressed_df.shape[1] > 0