def remove_NaN_rows_columns(dataframe):
    """Return *dataframe* without rows and columns that consist only of NaN.

    Rows whose every entry is missing are dropped first, then columns whose
    every remaining entry is missing. Rows/columns that contain at least one
    non-missing value are kept unchanged, including their partial NaNs.

    In ``predict`` this is applied to the difference of two normalized
    party-distance frames before the error is squared and plotted.

    Args:
        dataframe: The pandas DataFrame to clean. It is not modified.

    Returns:
        A new DataFrame with all-NaN rows and all-NaN columns removed.
    """
    # Only `how` is passed: pandas 1.5 and later raise TypeError when both
    # `how` and `thresh` are supplied, even if `thresh` is None.
    # No explicit copy is needed because a non-inplace dropna returns a new
    # DataFrame and leaves the caller's object untouched.
    without_empty_rows = dataframe.dropna(axis=0, how='all')
    return without_empty_rows.dropna(axis=1, how='all')