# fix_intent()
#
# in scripts/adapet/ADAPET/utilcode.py [0:0]


# Settings for the non-English amazon_massive_intent tasks, keyed by task
# name: (prompt pattern, name of the column that is renamed to "label_text").
_INTENT_LANG_CONFIG = {
    'SetFit/amazon_massive_intent_zh-CN': (
        '[TEXT1] 这是 [LBL]', "label_text_ch"),
    'SetFit/amazon_massive_intent_ru-RU': (
        '[TEXT1] это [LBL]', "label_text_ru"),
    'SetFit/amazon_massive_intent_de-DE': (
        '[TEXT1] dies ist [LBL]', "label_text_de"),
    'SetFit/amazon_massive_intent_ja-JP': (
        '[TEXT1]これは[LBL]だ', "label_text_jp"),
    'SetFit/amazon_massive_intent_es-ES': (
        '[TEXT1] esto es [LBL]', "label_text_es"),
}


def fix_intent(task_name, dataset, english):
    """Prepare the ``label_text`` column and pick the prompt pattern.

    The original ``label_text`` column is always renamed to
    ``str_label_text``. A new ``label_text`` column is then provided:

    * ``english`` truthy: every split gets a ``label_text`` column built
      from ``str_label_text`` with underscores replaced by spaces.
    * ``english`` falsy: the task-specific column listed in
      ``_INTENT_LANG_CONFIG`` is renamed to ``label_text``.

    Args:
        task_name: Task identifier; only consulted when ``english`` is falsy.
        dataset: Mapping of split name to split, supporting
            ``rename_column``, ``items`` and item assignment, with splits
            supporting column lookup and ``add_column`` (presumably a
            Hugging Face ``DatasetDict`` -- confirm against the caller).
        english: Whether to use the English labels and pattern.

    Returns:
        A ``(dataset, lang_pattern)`` tuple.

    Raises:
        ValueError: If ``english`` is falsy and ``task_name`` is not a
            supported task.
    """
    # Fail fast with a clear message; previously an unknown task fell through
    # every branch and crashed at ``return`` with an UnboundLocalError.
    if not english and task_name not in _INTENT_LANG_CONFIG:
        supported = ", ".join(sorted(_INTENT_LANG_CONFIG))
        raise ValueError(
            f"Unsupported non-English intent task {task_name!r}; "
            f"expected one of: {supported}"
        )

    dataset = dataset.rename_column("label_text", "str_label_text")

    if english:
        # Snapshot the items so reassigning splits cannot disturb iteration.
        for split, dset in list(dataset.items()):
            label_text = [
                txt_lab.replace("_", " ") for txt_lab in dset["str_label_text"]
            ]
            dataset[split] = dset.add_column('label_text', label_text)
        return dataset, '[TEXT1] this is [LBL]'

    lang_pattern, label_column = _INTENT_LANG_CONFIG[task_name]
    dataset = dataset.rename_column(label_column, "label_text")
    return dataset, lang_pattern