in simuleval/data/tokenizer.py [0:0]
def end_idx_last_full_word(self, tokens):
    """Return the index of the last non-continued token after position 0.

    A token counts as "continued" when its last two characters are
    ``'@@'`` (presumably the BPE continuation marker -- confirm against
    the tokenizer that produces ``tokens``). The first token is never
    inspected.

    Args:
        tokens: Sliceable sequence of sliceable tokens (e.g. a list of
            strings).

    Returns:
        The largest index ``i >= 1`` such that ``tokens[i]`` does not end
        with ``'@@'``, or ``0`` when no such index exists (including for
        empty and single-token input).
    """
    # NOTE(review): the recorded position is that of the token closing a
    # word, not the token opening the next one -- verify this is what
    # callers expect from an "end index".
    last_idx = 0
    for position, token in enumerate(tokens[1:], start=1):
        # Scan every token (no early exit); later matches overwrite
        # earlier ones so the final value is the right-most match.
        if token[-2:] != '@@':
            last_idx = position
    return last_idx