in src/responsibleai/rai_analyse/rai_component_utilities.py [0:0]
def load_dataset(dataset_path: str) -> pd.DataFrame:
    """Load the dataset at ``dataset_path``, trying MLTable first, then Parquet.

    Each loader is attempted in order. A failure of one loader is recorded
    (wrapped in a ``UserConfigError``) and the next loader is tried. The
    first successful result is printed (dtypes and first 10 rows) and
    returned.

    Args:
        dataset_path: Location of the dataset, passed unchanged to
            ``load_mltable`` and ``load_parquet``.

    Returns:
        The object produced by the first loader that succeeds
        (annotated as a ``pd.DataFrame``).

    Raises:
        UserConfigError: If neither loader can read the dataset. The message
            includes the errors collected from every attempt.
    """
    _logger.info(f"Attempting to load: {dataset_path}")

    # (format tried, format the user may have intended instead, loader)
    attempts = (
        ("mltable", "parquet dataset", load_mltable),
        ("parquet", "mltable", load_parquet),
    )

    exceptions = []
    for format_name, alternative, loader in attempts:
        try:
            df = loader(dataset_path)
        except Exception as e:
            # Deliberately broad: any failure of this loader just means the
            # next format should be tried; the error is kept for the final
            # report rather than swallowed.
            exceptions.append(
                UserConfigError(
                    f"Input dataset {dataset_path} cannot be read as {format_name}. "
                    f"You may disregard this error if dataset input is intended to be "
                    f"{alternative}. Exception: {e}",
                    e,
                )
            )
        else:
            break
    else:
        # No loader succeeded (the loop finished without hitting ``break``).
        raise UserConfigError(
            f"Input dataset {dataset_path} cannot be read as MLTable or Parquet dataset. "
            f"Please check that input dataset is valid. "
            f"Exceptions encountered during reading: {exceptions}"
        )

    # Diagnostic dump of the loaded data to stdout.
    print(df.dtypes)
    print(df.head(10))
    return df