in code/dataset_prep.py [0:0]
def get_region_columns(df, region):
    """Return the column labels of ``df`` that contain ``region``.

    Every label in ``df.columns`` is tested with the ``in`` operator, so
    for string labels this is a substring match (an empty ``region``
    therefore matches every string label).

    Args:
        df: Object exposing an iterable ``columns`` attribute.
        region: Value looked up inside each column label.

    Returns:
        A new list of the matching labels, in the order they appear in
        ``df.columns``; empty when nothing matches.
    """
    matching = []
    for label in df.columns:
        if region in label:
            matching.append(label)
    return matching