text/data/smoltalk/constraints/pipeline/json_schemas.py (192 lines of code) (raw):
# JSON Schema for a flat object holding every argument a response-verification
# function may take (presumably the kwargs of the IFEval instruction checkers,
# judging by the constant's name -- confirm against the caller).
#
# Shape of the contract:
#   * every property is listed in "required" and "additionalProperties" is
#     False, so a valid instance carries exactly these 30 keys;
#   * an argument that does not apply is expressed as ``null`` -- which is why
#     almost every property uses a ``[<type>, "null"]`` type union;
#   * enum-constrained properties list ``None`` explicitly: JSON Schema applies
#     "type" and "enum" independently, so without it ``null`` would pass "type"
#     but still be rejected by "enum".
IFEVAL_RESPONSE_VERIFICATION_FUNCTION_ARGUMENTS_JSON_SCHEMA = {
    "type": "object",
    "properties": {
        "language": {
            "type": ["string", "null"],
        },
        "num_sentences": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "relation": {
            "type": ["string", "null"],
            "enum": ["less than", "at least", None],
        },
        "num_placeholders": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "num_bullets": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "starter": {
            "type": ["string", "null"],
        },
        "num_highlights": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        # The key is spelled "section_spliter" (sic); it is part of the
        # runtime contract and must not be "corrected" here.
        "section_spliter": {
            "type": ["string", "null"],
            "enum": ["Section", "SECTION", None],
        },
        "num_sections": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "num_paragraphs": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "postscript_marker": {
            "type": ["string", "null"],
            "enum": ["P.S.", "P.P.S", None],
        },
        "original_message": {
            "type": ["string", "null"],
        },
        # NOTE(review): "keywords" is the only property that does not admit
        # null, unlike the other array properties ("key_sentences",
        # "forbidden_words") -- confirm this is intentional.
        "keywords": {
            "type": "array",
            "items": {"type": "string"},
        },
        "keyword": {
            "type": ["string", "null"],
        },
        "frequency": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "num_words": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "nth_paragraph": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "first_word": {
            "type": ["string", "null"],
        },
        "key_sentences": {
            "type": ["array", "null"],
            "items": {"type": "string"},
        },
        "forbidden_words": {
            "type": ["array", "null"],
            "items": {"type": "string"},
        },
        "original_paragraph": {
            "type": ["string", "null"],
        },
        # "low" and "high" are the only integer properties that allow 0.
        "low": {
            "type": ["integer", "null"],
            "minimum": 0,
        },
        "high": {
            "type": ["integer", "null"],
            "minimum": 0,
        },
        "prompt_to_repeat": {
            "type": ["string", "null"],
        },
        "end_phrase": {
            "type": ["string", "null"],
        },
        # Exactly one ASCII letter: the length bounds pin the string to a
        # single character, so the unanchored pattern cannot match a substring
        # of something longer.
        "letter": {
            "type": ["string", "null"],
            "minLength": 1,
            "maxLength": 1,
            "pattern": "[a-zA-Z]",
        },
        "let_frequency": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "let_relation": {
            "type": ["string", "null"],
            "enum": ["less than", "at least", None],
        },
        "capital_frequency": {
            "type": ["integer", "null"],
            "minimum": 1,
        },
        "capital_relation": {
            "type": ["string", "null"],
            "enum": ["less than", "at least", None],
        },
    },
    # Every property above is mandatory; keep this list in sync with
    # "properties" when adding or removing an argument.
    "required": [
        "language",
        "num_sentences",
        "relation",
        "num_placeholders",
        "num_bullets",
        "starter",
        "num_highlights",
        "section_spliter",
        "num_sections",
        "num_paragraphs",
        "postscript_marker",
        "original_message",
        "keywords",
        "keyword",
        "frequency",
        "num_words",
        "nth_paragraph",
        "first_word",
        "key_sentences",
        "forbidden_words",
        "original_paragraph",
        "low",
        "high",
        "prompt_to_repeat",
        "end_phrase",
        "letter",
        "let_frequency",
        "let_relation",
        "capital_frequency",
        "capital_relation",
    ],
    "additionalProperties": False,
}
# Schema of a single list element: one of the known instruction identifiers,
# each written as "<category>:<name>".
_INSTRUCTION_ID_ITEM_SCHEMA = {
    "type": "string",
    "enum": [
        # keywords
        "keywords:existence",
        "keywords:frequency",
        "keywords:forbidden_words",
        "keywords:letter_frequency",
        # language
        "language:response_language",
        # length constraints
        "length_constraints:number_sentences",
        "length_constraints:number_paragraphs",
        "length_constraints:number_words",
        "length_constraints:nth_paragraph_first_word",
        # detectable content
        "detectable_content:number_placeholders",
        "detectable_content:postscript",
        # detectable format
        "detectable_format:number_bullet_lists",
        "detectable_format:constrained_response",
        "detectable_format:number_highlighted_sections",
        "detectable_format:multiple_sections",
        "detectable_format:json_format",
        "detectable_format:title",
        # combination
        "combination:two_responses",
        "combination:repeat_prompt",
        # start / end, case and punctuation
        "startend:end_checker",
        "change_case:capital_word_frequency",
        "change_case:english_capital",
        "change_case:english_lowercase",
        "punctuation:no_comma",
        "startend:quotation",
    ],
}

# JSON Schema for an object with one mandatory key, "instruction_id_list",
# whose value is an array of distinct instruction identifiers
# ("uniqueItems" forbids listing the same identifier twice).
IFEVAL_INSTRUCTION_ID_LIST_JSON_SCHEMA = {
    "type": "object",
    "properties": {
        "instruction_id_list": {
            "type": "array",
            "items": _INSTRUCTION_ID_ITEM_SCHEMA,
            "uniqueItems": True,
        },
    },
    "required": ["instruction_id_list"],
}