in llm_perf/cli.py [0:0]
def run_benchmark( hardware: Hardware = typer.Option(..., help="Hardware to run on: CPU or CUDA"), backend: Backend = typer.Option( ..., help="Backend to use: ONNXRUNTIME, PYTORCH, or OPENVINO" ),