def curate_data()

in deploy_code/multipagepdfa2i_wrapup/gather_data.py [0:0]


def curate_data(base_image_keys, payload):
    """Assemble the combined CSV text for every page key.

    For each key in ``base_image_keys`` a header row ``page N,-,-`` is
    emitted, where N is the integer at the start of the key's last path
    segment (everything before its first ``.``) plus one. The header is
    followed by whatever ``create_csv`` returns for the key's
    ``/ai/output.json`` and ``/human/output.json`` objects, in that order,
    for each object that ``does_exsist`` reports as present.

    Args:
        base_image_keys: Iterable of key strings whose last path segment
            starts with an integer (presumably a zero-based page index such
            as ``.../0.png`` -- confirm against the caller).
        payload: Mapping that provides the bucket name under ``"bucket"``.

    Returns:
        The concatenated CSV text, or ``""`` when there are no keys.

    Raises:
        ValueError: If a key's last path segment does not start with an
            integer.
        KeyError: If ``payload`` has no ``"bucket"`` entry and at least one
            key is processed.
    """
    chunks = []
    for base_key in base_image_keys:
        file_name = base_key.rpartition("/")[2]
        # partition() keeps the whole name when there is no "."; slicing with
        # find(".") == -1 would silently drop the last digit instead.
        stem = file_name.partition(".")[0]
        chunks.append("page " + str(int(stem) + 1) + ",-,-\n")

        # Read inside the loop so an empty key list never touches payload.
        bucket = payload["bucket"]
        for source in ("ai", "human"):
            output_key = base_key + "/" + source + "/output.json"
            if does_exsist(bucket, output_key):
                temp_data = get_data_from_bucket(bucket, output_key)
                chunks.append(create_csv(temp_data, source))

    return "".join(chunks)