video_processing/add_aesthetic_laion

import pandas as pd import pathlib from PIL import Image from argparse import ArgumentParser from tqdm import tqdm from modules import load_aesthetic_laion, run_aesthetic_laion, separate_key_frames_from_row parser = ArgumentParser() parser.add_argument("--path", type=str, required=True) parser.add_argument("--parquet-path", type=str, required=True) parser.add_argument("--parquet-out-path", type=str, required=True) parser.add_argument("--device", type=str, required=True) parser.add_argument("--model", type=str, default=None) parser.add_argument("--dtype", type=str, required=True) args = parser.parse_args() path = pathlib.Path(args.path) parquet_path = pathlib.Path(args.parquet_path) parquet_out_path = pathlib.Path(args.parquet_out_path) device = args.device dtype = args.dtype model_path = args.model load_aesthetic_laion(device=device, model_path=model_path, dtype=dtype) df = pd.read_parquet(parquet_path) data = [] with tqdm() as pbar: for _, row in df.iterrows(): pbar.set_description(row["file"]) key_frames, first, mid, last = separate_key_frames_from_row(path, row) pbar.set_postfix_str(f"{len(key_frames)} key frames") frames = [frame for frame in [first, mid, last] if frame is not None] scores = [tensor.cpu().item() for tensor in run_aesthetic_laion(frames)] data.append({"aesthetic_score": scores}) pbar.update() aesthetic_df = pd.DataFrame(data) print(aesthetic_df) df = df.join(aesthetic_df) print(df) df.to_parquet(parquet_out_path)

video_processing/add_aesthetic_laion_score.py (37 lines of code) (raw):