# mcloud_oaieval.yaml
# Ultravox evaluation run that performs inference through vLLM.
# Run name.
name: 'ultravox-oaieval'
# Container image for the run. The `latest` tag is mutable, so the
# environment may differ between submissions.
image: 'mosaicml/composer:latest'
# Compute request: target cluster and GPU count.
compute:
  cluster: r15z1p1
  gpus: 8
# Integrations: a single git checkout of the Ultravox repository.
integrations:
  - integration_type: git_repo
    git_repo: fixie-ai/ultravox
    # Branch comes from UV_BRANCH (see env_variables); presumably the
    # platform expands the variable before cloning -- verify.
    git_branch: $UV_BRANCH
    # Poetry is pinned because the command below drives the install with it.
    pip_install: poetry==1.7.1
# Scheduling limits.
scheduling:
  # 2 hours max for jobs to avoid hanging jobs.
  max_duration: 2
# Entry command. `>-` folds the lines below into a single shell line joined
# by spaces (no trailing newline); `&&` aborts the chain at the first
# failing step.
# `--only main` is the supported spelling of Poetry's deprecated `--no-dev`
# flag (deprecated in 1.2, removed in 2.0) and works with the pinned 1.7.1.
# HF_WRITE_TOKEN is not defined in this file; presumably it is injected as a
# secret by the platform -- verify.
# $EVAL_ARGS is left unquoted on purpose so the shell splits it into
# separate command-line arguments.
command: >-
  cd ultravox &&
  poetry install --only main &&
  poetry run pip install vllm &&
  HF_TOKEN=$HF_WRITE_TOKEN poetry run python -m ultravox.inference.run_vllm_inference $EVAL_ARGS
# Environment variables for the run.
env_variables:
  MLFLOW_TRACKING_URI: 'databricks'
  # Git branch referenced by the git_repo integration as $UV_BRANCH.
  UV_BRANCH: 'main'
  # Arguments appended to the inference module invocation in `command`.
  EVAL_ARGS: '--evalset audio-core --model fixie-ai/ultravox-v0_5-llama-3_1-8b'