def locate_features_with_too_many_missing_values()

in blogs/wind-turbine-engie/utils.py [0:0]


def locate_features_with_too_many_missing_values(df, missing_threshold):
    """Return the columns of *df* whose share of missing values is too high.

    Args:
        df: pandas DataFrame to inspect.
        missing_threshold: Maximum tolerated fraction of missing values per
            column, expressed as a ratio (e.g. ``0.1`` for 10%). A column is
            reported only when its missing fraction is strictly greater than
            this value.

    Returns:
        A list of column labels, in the frame's column order, whose fraction
        of NaN/None entries exceeds ``missing_threshold``. An empty list is
        returned when no column qualifies or when the frame has no rows.
    """
    # The mean of the boolean NaN mask is the per-column fraction of missing
    # values. For a frame with zero rows the mean is NaN, and NaN never
    # compares greater than the threshold, so no column is reported.
    missing_fraction = df.isna().mean()
    return [
        col
        for col, fraction in missing_fraction.items()
        if fraction > missing_threshold
    ]