def main()

in distilvit/infere.py [0:0]


def main(before, after):
    """Print a side-by-side caption comparison of two image-to-text models.

    Loads the ``train`` split of the ``mozilla/alt-text-validation`` dataset,
    skips entries whose ``alt_text`` is an empty string, and for every
    remaining image prints one line made of the reference alt text followed
    by the caption produced by each model, joined with ``" | "``.

    Args:
        before: Value passed as ``model=`` to the baseline ``image-to-text``
            pipeline, which is loaded with ``revision="main"``.
        after: Value passed as ``model=`` to the candidate ``image-to-text``
            pipeline; no revision is specified for it.
    """
    dataset = datasets.load_dataset("mozilla/alt-text-validation")

    # Keep only entries that have a non-empty reference alt text. This is a
    # generator, so rows are read as the loop below consumes them instead of
    # being collected into a list up front.
    samples = (
        (item["image"], item["alt_text"])
        for item in dataset["train"]
        if item["alt_text"] != ""
    )

    print("expected|before|after")

    # Order matters: the captions are printed in this order, matching the
    # "before" / "after" columns of the header.
    captioners = [
        pipeline("image-to-text", model=before, revision="main"),
        pipeline("image-to-text", model=after),
    ]

    # 40 is the numeric ERROR level.
    # NOTE(review): `logging` is presumably transformers' logging helper
    # (stdlib logging has no set_verbosity) -- confirm against the imports.
    logging.set_verbosity(40)

    for image, expected in samples:
        # Each pipeline call returns a sequence; only the first result's
        # "generated_text" is reported.
        captions = [
            str(captioner(image)[0]["generated_text"])
            for captioner in captioners
        ]
        print(" | ".join([f"{expected}", *captions]))