def clean_text()

in generation/boilerplate_cleanup.py [0:0]


def clean_text(sample):
    """Remove every match of the ``patterns`` entries from a sample's completion.

    The untouched completion is first copied to
    ``sample['completion_unfiltered']``; the cleaned text then replaces
    ``sample['completion']``. The mapping is modified in place and also
    returned.

    Args:
        sample: Mapping with a ``'completion'`` entry that supports
            ``.strip()`` (presumably a ``str`` -- confirm against callers).

    Returns:
        The same ``sample`` object, updated in place.
    """
    text = sample['completion']
    # Preserve the raw completion before any pattern is applied.
    sample['completion_unfiltered'] = text

    # ``patterns`` comes from the enclosing scope (not visible in this block);
    # each entry is expected to expose ``.sub`` like a compiled regex.
    for regex in patterns:
        # Whitespace is trimmed *before* each substitution, so the result of
        # the final substitution is stored without a trailing strip.
        text = regex.sub('', text.strip())

    sample['completion'] = text
    return sample