in gen_parlai_data.py [0:0]
def clean(x):
    """Return *x* with line breaks removed, tabs spaced out, and ends trimmed.

    Newline and carriage-return characters are deleted outright (no space is
    inserted in their place), each tab becomes a single space, and finally
    leading/trailing whitespace is stripped.
    """
    # Applied in order; the substitutions are independent of one another.
    substitutions = (
        ("\n", ""),
        ("\r", ""),
        ("\t", " "),
    )
    text = x
    for needle, replacement in substitutions:
        text = text.replace(needle, replacement)
    return text.strip()