in datasets/imdb/pipelines/_images/run_csv_transform_kub/csv_transform.py [0:0]
def get_name_basics(source_file: dict) -> pd.DataFrame:
    """Read the name-basics file into a DataFrame and clean selected columns.

    The file location is taken from ``source_file["url_data"]`` and is read
    as a gzip-compressed, tab-separated file.

    Column handling:
      * ``birthYear`` / ``deathYear``: passed to ``coldata_replace`` with
        ``REPLACE_DICT``, then to ``convert_int`` with ``"Int64"``.
      * ``knownForTitles``: passed to ``coldata_replace`` with
        ``REPLACE_DICT`` only.
      * Every other column is left as read.

    Args:
        source_file: Mapping expected to contain a ``"url_data"`` entry. If
            the key is missing, an empty string is handed to
            ``pd.read_csv``.

    Returns:
        The DataFrame produced by ``pd.read_csv`` after the helper calls.
    """
    url_data = source_file.get("url_data", "")
    logging.info(f"Reading data from {url_data}")
    df = pd.read_csv(url_data, sep="\t", compression="gzip")
    # NOTE(review): the helpers' return values are not used, so they are
    # assumed to modify ``df`` in place -- confirm against their definitions.
    for col in df:  # iterating a DataFrame yields its column labels
        if col in ("birthYear", "deathYear"):
            coldata_replace(df, col, REPLACE_DICT)
            convert_int(df, col, "Int64")
        # Exact comparison: ``col in ("knownForTitles")`` is a substring test
        # against a plain string (no trailing comma, so not a tuple) and
        # would also match labels such as "Titles".
        elif col == "knownForTitles":
            coldata_replace(df, col, REPLACE_DICT)
    return df