in deploy_code/multipagepdfa2i_wrapup/gather_data.py [0:0]
def curate_data(base_image_keys, payload):
    """Assemble the combined CSV text for every page in *base_image_keys*.

    For each key, the final path segment (text after the last "/") is read
    as an integer page index taken from the part before its first "."; a
    header row ``"page <index + 1>,-,-"`` is emitted for it.  Then, for the
    "ai" and "human" results in that order, if
    ``does_exsist(bucket, base_key + "/<source>/output.json")`` is truthy,
    the object is fetched with ``get_data_from_bucket`` and the text
    returned by ``create_csv(data, source)`` is appended.

    Args:
        base_image_keys: Iterable of key strings, one per page
            (e.g. ``"some/prefix/0.png"``).
        payload: Mapping providing the bucket name under ``"bucket"``.  It is
            only read when there is at least one key to process.

    Returns:
        The concatenated text; an empty string when there are no keys.

    Raises:
        ValueError: If the name part of a key's final segment is not an
            integer.
    """
    chunks = []
    for base_key in base_image_keys:
        file_name = base_key[base_key.rfind("/") + 1:]
        # partition() keeps the whole name when there is no "." at all;
        # slicing with find() would use -1 there and silently drop the last
        # character of the page index.
        stem = file_name.partition(".")[0]
        chunks.append("page " + str(int(stem) + 1) + ",-,-" + "\n")

        bucket = payload["bucket"]
        # Machine output first, then the human-reviewed output.
        for source in ("ai", "human"):
            output_key = base_key + "/" + source + "/output.json"
            if does_exsist(bucket, output_key):
                raw = get_data_from_bucket(bucket, output_key)
                chunks.append(create_csv(raw, source))
    return "".join(chunks)