in Sources/Tokenizers/Tokenizer.swift [373:386]
/// Collapses every run of consecutive unknown tokens into a single token.
///
/// A token is treated as unknown when `model.convertTokenToId(_:)` yields the same
/// value as `model.unknownTokenId`. The first token of each unknown run is kept and
/// the remaining tokens of that run are dropped; all other tokens pass through
/// unchanged and in their original order.
///
/// - Parameter tokens: The token strings to process.
/// - Returns: `tokens` as-is when `fuseUnknownTokens` is `false`; otherwise a new
///   array in which no two adjacent tokens are both unknown.
func fuseUnknown(_ tokens: [String]) -> [String] {
    guard fuseUnknownTokens else { return tokens }

    // Build the result in a single mutable array. Threading the array through a
    // non-`into` `reduce` accumulator copies it on every append, which makes the
    // pass quadratic in the number of tokens.
    var fused: [String] = []
    fused.reserveCapacity(tokens.count)

    var previousIsUnknown = false
    for token in tokens {
        let isUnknown = model.convertTokenToId(token) == model.unknownTokenId
        // Drop the token only when it continues a run of unknown tokens.
        if !(isUnknown && previousIsUnknown) {
            fused.append(token)
        }
        previousIsUnknown = isUnknown
    }
    return fused
}