in data_preparation/export_to_hub.py [0:0]
def main(args):
    """Build the paired-image dataset from disk and push it to the Hub.

    Each sub-directory of ``args.data_root`` is treated as one sample and
    contributes the paths ``original_image.png`` and
    ``cartoonized_image.png`` inside it. The image files themselves are not
    checked for existence here.

    Args:
        args: Object exposing ``instructions_path`` (forwarded to
            ``load_instructions``) and ``data_root`` (directory scanned for
            sample folders).
    """
    instructions = load_instructions(args.instructions_path)

    # os.listdir returns entries in arbitrary order, so sort them to make the
    # sample order reproducible across runs and machines.
    candidate_dirs = (
        os.path.join(args.data_root, entry)
        for entry in sorted(os.listdir(args.data_root))
    )
    # Keep directories only: a stray file in the data root (e.g. ".DS_Store")
    # would otherwise be turned into a bogus "<file>/original_image.png" path.
    new_data_paths = [
        (
            os.path.join(sample_dir, "original_image.png"),
            os.path.join(sample_dir, "cartoonized_image.png"),
        )
        for sample_dir in candidate_dirs
        if os.path.isdir(sample_dir)
    ]

    # NOTE(review): generate_examples presumably returns a generator
    # *function*, as the result is handed straight to Dataset.from_generator
    # -- confirm against its definition.
    generation_fn = generate_examples(new_data_paths, instructions)

    print("Creating dataset...")
    ds = Dataset.from_generator(
        generation_fn,
        features=Features(
            original_image=ImageFeature(),
            edit_prompt=Value("string"),
            cartoonized_image=ImageFeature(),
        ),
    )

    print("Pushing to the Hub...")
    ds.push_to_hub(DS_NAME)