in scripts/adapet/ADAPET/utilcode.py [0:0]
# Settings for the non-English intent tasks handled by fix_intent:
# task name -> (prompt pattern, column that holds the localized label text).
_INTENT_LANG_CONFIG = {
    'SetFit/amazon_massive_intent_zh-CN': ('[TEXT1] 这是 [LBL]', 'label_text_ch'),
    'SetFit/amazon_massive_intent_ru-RU': ('[TEXT1] это [LBL]', 'label_text_ru'),
    'SetFit/amazon_massive_intent_de-DE': ('[TEXT1] dies ist [LBL]', 'label_text_de'),
    'SetFit/amazon_massive_intent_ja-JP': ('[TEXT1]これは[LBL]だ', 'label_text_jp'),
    'SetFit/amazon_massive_intent_es-ES': ('[TEXT1] esto es [LBL]', 'label_text_es'),
}


def fix_intent(task_name, dataset, english):
    """Normalize the label-text column of an intent dataset and pick a pattern.

    The existing ``label_text`` column is always renamed to
    ``str_label_text``. A new ``label_text`` column is then provided:

    * ``english`` truthy: built per split from ``str_label_text`` with every
      underscore replaced by a space.
    * ``english`` falsy: the task-specific localized column (for example
      ``label_text_de``) is renamed to ``label_text``.

    Args:
        task_name: Dataset identifier; only consulted when ``english`` is
            falsy, in which case it must be a key of ``_INTENT_LANG_CONFIG``.
        dataset: Mapping of split name to split object. It must offer
            ``rename_column`` itself, and each split must offer
            ``add_column`` and column access by name.
        english: Whether to use the English pattern and derived labels.

    Returns:
        A ``(dataset, lang_pattern)`` tuple, where ``lang_pattern`` is a
        string containing the ``[TEXT1]`` and ``[LBL]`` placeholders.

    Raises:
        ValueError: If ``english`` is falsy and ``task_name`` is not one of
            the supported tasks.
    """
    # Resolve the configuration before touching the dataset so that an
    # unsupported task fails fast with a clear message instead of hitting an
    # unbound ``lang_pattern`` at the return statement.
    if english:
        lang_pattern = '[TEXT1] this is [LBL]'
        localized_column = None
    else:
        try:
            lang_pattern, localized_column = _INTENT_LANG_CONFIG[task_name]
        except KeyError:
            supported = ", ".join(sorted(_INTENT_LANG_CONFIG))
            raise ValueError(
                f"Unsupported non-English intent task {task_name!r}; "
                f"expected one of: {supported}"
            ) from None

    dataset = dataset.rename_column("label_text", "str_label_text")

    if not english:
        dataset = dataset.rename_column(localized_column, "label_text")
        return dataset, lang_pattern

    # Snapshot the items so reassigning splits cannot disturb the iteration.
    for split, dset in list(dataset.items()):
        readable_labels = [
            raw_label.replace("_", " ") for raw_label in dset["str_label_text"]
        ]
        dataset[split] = dset.add_column('label_text', readable_labels)
    return dataset, lang_pattern