def main()

in data_preparation/export_to_hub.py [0:0]


def main(args):
    """Assemble the image-pair dataset from disk and push it to the Hub.

    Every entry found under ``args.data_root`` is treated as a sample
    directory expected to hold ``original_image.png`` and
    ``cartoonized_image.png``. The resulting (original, cartoonized) path
    pairs are handed to ``generate_examples`` together with the loaded
    instructions, and the dataset built from that generator is pushed to
    the Hub under ``DS_NAME``.

    Args:
        args: Object exposing ``instructions_path`` and ``data_root``
            attributes (presumably parsed command-line arguments).
    """
    instructions = load_instructions(args.instructions_path)

    # os.listdir() yields entries in arbitrary, filesystem-dependent order;
    # sorting keeps the dataset row order reproducible across runs/machines.
    sample_names = sorted(os.listdir(args.data_root))
    new_data_paths = [
        (
            os.path.join(args.data_root, sample_name, "original_image.png"),
            os.path.join(args.data_root, sample_name, "cartoonized_image.png"),
        )
        for sample_name in sample_names
    ]

    # NOTE(review): generate_examples is assumed to return a generator
    # function, since its result is passed to Dataset.from_generator.
    generation_fn = generate_examples(new_data_paths, instructions)
    print("Creating dataset...")
    ds = Dataset.from_generator(
        generation_fn,
        features=Features(
            original_image=ImageFeature(),
            edit_prompt=Value("string"),
            cartoonized_image=ImageFeature(),
        ),
    )

    print("Pushing to the Hub...")
    ds.push_to_hub(DS_NAME)