in infra-as-code/modules/audio-data-format-change/function-source-code/record.py [0:0]
def check_current_file(self):
    """Register the current file in the ingest record and return the record.

    No validation is performed at the moment: the duplicate-file and
    case-manager-email checks sketched by the original author are not
    implemented, so this method takes no argument besides ``self`` and
    raises no exception of its own (anything raised comes from the helpers
    it calls).

    Returns:
        The ``self.ingest_record_df`` attribute, read after ``self.add_row``
        has been called with the result of
        ``self.create_processed_record()``. The original author describes
        it as the pandas.DataFrame for the parquet file.
    """
    # TODO: Add logic to avoid repeated files being processed in case needed.
    # Sketch of the intended (currently disabled) checks:
    #   * look up self.original_file_name in
    #     self.ingest_record_df["filename"];
    #   * if the matching row's "processed" value is True, log
    #     'Repeated file' and raise
    #     Exception('File is processing or was already processed');
    #   * otherwise, possibly re-process the file through
    #     self.replace_row(self.create_re_processed_record());
    #   * filenames without a case manager email were meant to raise
    #     'No case manager email in filename' or
    #     'Repeated file with no case manager email'.
    print('Will process file')

    # Build the record first, then append it, so the returned attribute
    # reflects whatever add_row did with the new row.
    new_record = self.create_processed_record()
    self.add_row(new_record)
    return self.ingest_record_df