in opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/utils/Utils.java [35:182]
static {
  // Registers {pattern, replacement} string pairs in CHARACTER_MAPPINGS. Most pairs fold a
  // group of accented Latin letters (written as a "[...]" character class) to one unaccented
  // ASCII letter of the same case; the tail handles punctuation, HTML entities and
  // mis-encoded byte sequences.
  //
  // NOTE(review): the code that consumes these pairs is not visible here - presumably each
  // pattern is applied in insertion order as a regular expression (String.replaceAll);
  // confirm before reordering entries.
  // NOTE(review): several literals contain U+FFFD or mis-encoded sequences (for example
  // "[Å´]", where a single letter was presumably intended). They are kept exactly as found;
  // restoring them requires the file in its original encoding.

  // --- a / A (lowercase deliberately blanked, see "was a") ---
  CHARACTER_MAPPINGS.add(new String[] { "[àáâãäå�?ăą�°]", " " }); // was a
  CHARACTER_MAPPINGS.add(new String[] { "[À�?ÂÃÄÅĀĂĄ�?]", "A" });

  // --- c / C ---
  CHARACTER_MAPPINGS.add(new String[] { "[çćĉċ�?]", "c" });
  CHARACTER_MAPPINGS.add(new String[] { "[ÇĆĈĊČ]", "C" });

  // --- d / D ---
  CHARACTER_MAPPINGS.add(new String[] { "[�?đ]", "d" });
  CHARACTER_MAPPINGS.add(new String[] { "[�?�?]", "D" });

  // --- e / E (deliberately mapped to a space and an apostrophe, see "was e" / "was E") ---
  CHARACTER_MAPPINGS.add(new String[] { "[èéêëæęēĕ�ęě]", " " }); // was e
  CHARACTER_MAPPINGS.add(new String[] { "[ÈÉÊËÆĒ�ĖĘĚ]", "'" }); // was E

  // --- g / G ---
  CHARACTER_MAPPINGS.add(new String[] { "[�?ğġģ]", "g" });
  CHARACTER_MAPPINGS.add(new String[] { "[ĜĞĠĢƓ]", "G" });

  // --- h / H ---
  CHARACTER_MAPPINGS.add(new String[] { "[ĥħ]", "h" });
  CHARACTER_MAPPINGS.add(new String[] { "[ĤĦ]", "H" });

  // --- i / I ---
  CHARACTER_MAPPINGS.add(new String[] { "[ìÃÂÂîïĩīÄÂÂĮįıĳĵ]", "i" });
  CHARACTER_MAPPINGS.add(new String[] { "[Ì�?Î�?ĨĪĬİĲĴĵ]", "I" });

  // --- k / K ---
  CHARACTER_MAPPINGS.add(new String[] { "[ķĸ]", "k" });
  CHARACTER_MAPPINGS.add(new String[] { "[Ķ]", "K" });

  // --- o / O ---
  CHARACTER_MAPPINGS.add(new String[] { "[øőðòóôõö�?�?őœơ]", "o" });
  CHARACTER_MAPPINGS.add(new String[] { "[ÒÓ�ÕÖØŌŎ�?ŒƠ]", "O" });

  // --- n / N ---
  CHARACTER_MAPPINGS.add(new String[] { "[ñńņňŉŋ]", "n" });
  CHARACTER_MAPPINGS.add(new String[] { "[ÑŃŅŇŊŋ]", "N" });

  // --- l / L ---
  CHARACTER_MAPPINGS.add(new String[] { "[ĺļľŀł]", "l" });
  CHARACTER_MAPPINGS.add(new String[] { "[ĹĻĽĿ�?]", "L" });

  // --- u / U ---
  CHARACTER_MAPPINGS.add(new String[] { "[ùúûüũūÅÂÂůűųư]", "u" });
  CHARACTER_MAPPINGS.add(new String[] { "[ÙÚÛÜŨŪŬŮŰŲƯ]", "U" });

  // --- y / Y ---
  CHARACTER_MAPPINGS.add(new String[] { "[ýÿŷ]", "y" });
  CHARACTER_MAPPINGS.add(new String[] { "[�?ŶŸ]", "Y" });

  // --- r / R ---
  CHARACTER_MAPPINGS.add(new String[] { "[ŕ�ř]", "r" });
  CHARACTER_MAPPINGS.add(new String[] { "[�ŖŘ]", "R" });

  // --- s / S, sharp s and thorn ---
  CHARACTER_MAPPINGS.add(new String[] { "[šś�?şšſ]", "s" });
  CHARACTER_MAPPINGS.add(new String[] { "[ŠŚŜŞŠſ]", "S" });
  CHARACTER_MAPPINGS.add(new String[] { "ß", "ss" });
  // Capital thorn folds to "Th" and small thorn to "th", so case is preserved like every
  // other pair in this table (the two replacements used to be swapped).
  CHARACTER_MAPPINGS.add(new String[] { "Þ", "Th" });
  CHARACTER_MAPPINGS.add(new String[] { "þ", "th" });

  // --- t / T ---
  CHARACTER_MAPPINGS.add(new String[] { "[ţťŧ]", "t" });
  CHARACTER_MAPPINGS.add(new String[] { "[ŢŤŦ]", "T" });

  // --- w / W ---
  CHARACTER_MAPPINGS.add(new String[] { "[ŵ]", "w" });
  CHARACTER_MAPPINGS.add(new String[] { "[Å´]", "W" });

  // --- z / Z ---
  CHARACTER_MAPPINGS.add(new String[] { "[žźżžƶ]", "z" });
  CHARACTER_MAPPINGS.add(new String[] { "[ŽŽŹŻŽƵ]", "Z" });

  // --- typographic punctuation ---
  CHARACTER_MAPPINGS.add(new String[] { "[’]", "'" });
  CHARACTER_MAPPINGS.add(new String[] { "[–]", "'" });
  // NOTE(review): this pair maps an apostrophe to itself and therefore changes nothing;
  // the pattern was presumably an HTML entity for the apostrophe - confirm and restore.
  CHARACTER_MAPPINGS.add(new String[] { "'", "'" });

  // --- mis-encoded sequences, kept as found ---
  CHARACTER_MAPPINGS.add(new String[] { "Âe", "«" });
  CHARACTER_MAPPINGS.add(new String[] { "'AG", "“" });
  CHARACTER_MAPPINGS.add(new String[] { "A�", " " });

  // --- HTML entities ---
  // The entity names are spelled out explicitly. In decoded form the first pattern was not a
  // valid string literal and the second mapped "&" to itself.
  CHARACTER_MAPPINGS.add(new String[] { "&quot;", "\"" });
  CHARACTER_MAPPINGS.add(new String[] { "&amp;", "&" });
  CHARACTER_MAPPINGS.add(new String[] { "&nbsp;", " " });
  // A raw no-break space is normalised as well, written as an escape so it stays visible.
  CHARACTER_MAPPINGS.add(new String[] { "\u00A0", " " });

  // NOTE(review): an entry with an empty (or non-printable) pattern mapped to " " stood
  // here. An empty regular expression matches at every position, so it is not re-added;
  // if a control character was intended, restore it as an explicit \\uXXXX escape.

  // --- remaining mis-encoded sequences ---
  CHARACTER_MAPPINGS.add(new String[] { "â„¢", " " });
  CHARACTER_MAPPINGS.add(new String[] { "�", "" });
  CHARACTER_MAPPINGS.add(new String[] { "’", "'" });
}