ultravox/data/configs/boolq.py (15 lines of code) (raw):
from ultravox.data import types
# Dataset configuration named "boolq", backed by the "fixie-ai/boolq-audio"
# dataset path.
BOOLQ_CONFIG = types.DatasetConfig(
    name="boolq",
    path="fixie-ai/boolq-audio",
    # One DatasetSplitConfig per (split name, num_samples) pair.
    splits=[
        types.DatasetSplitConfig(name=split_name, num_samples=sample_count)
        for split_name, sample_count in (("train", 10000), ("validation", 1000))
    ],
    # User turn: the literal "{{passage}}" template field, a blank line, then
    # the audio placeholder. NOTE(review): assumes AUDIO_PLACEHOLDER is a str.
    user_template="{{passage}}\n\n" + types.AUDIO_PLACEHOLDER,
    # Assistant turn: the template expression yields "True" or "False"
    # depending on the truthiness of `answer`.
    assistant_template="{{'True' if answer else 'False'}}",
    # Transcript is taken from the `question` field (presumably the text of
    # the spoken question that replaces the audio placeholder -- confirm).
    transcript_template="{{question}}",
)
# Every dataset configuration defined by this module, collected in one list.
configs = [BOOLQ_CONFIG]