def get_name_basics()

in datasets/imdb/pipelines/_images/run_csv_transform_kub/csv_transform.py [0:0]


def get_name_basics(source_file: dict) -> pd.DataFrame:
    """Read the name-basics source file into a DataFrame and clean key columns.

    The location is taken from ``source_file["url_data"]`` and read with
    ``pd.read_csv`` as a gzip-compressed, tab-separated file.

    Column handling:
      * ``birthYear`` / ``deathYear``: passed to ``coldata_replace`` with
        ``REPLACE_DICT``, then to ``convert_int`` with the ``"Int64"`` dtype
        name.
      * ``knownForTitles``: passed to ``coldata_replace`` with
        ``REPLACE_DICT`` only.
      * Every other column is left as read.

    Args:
        source_file: Mapping describing the source; only the ``"url_data"``
            key is used here. If the key is missing, an empty string is
            handed to ``pd.read_csv`` unchanged.

    Returns:
        The DataFrame produced by ``pd.read_csv`` after the helper calls.
    """
    # Look the location up once so the log line and the read cannot diverge.
    url = source_file.get("url_data", "")
    logging.info(f'Reading data from  {url}')
    df = pd.read_csv(url, sep="\t", compression="gzip")

    # NOTE(review): the helpers' return values are not used, so they
    # presumably modify ``df`` in place -- confirm against their definitions.
    for col in df:
        if col in ("birthYear", "deathYear"):
            coldata_replace(df, col, REPLACE_DICT)
            convert_int(df, col, "Int64")
        elif col == "knownForTitles":
            # Exact match on purpose: `col in ("knownForTitles")` is a
            # substring test against a plain string (no trailing comma, so
            # no tuple) and would also match labels such as "Titles".
            coldata_replace(df, col, REPLACE_DICT)
    return df