in x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/preprocessing/customwordembedding/ScriptCode.java [127:335]
/**
 * Translates a Java {@link Character.UnicodeScript} into the matching {@code ScriptCode}.
 *
 * <p>Most scripts map one-to-one onto the constant of the same name. Two groups are collapsed:
 * <ul>
 *   <li>{@code HANGUL}, {@code HAN}, {@code HIRAGANA} and {@code KATAKANA} all resolve to
 *       {@code ScriptCode.Hani}.</li>
 *   <li>{@code COMMON}, {@code UNKNOWN} and every script that has no explicit case below
 *       resolve to {@code ScriptCode.Common}.</li>
 * </ul>
 *
 * @param scriptId the Java unicode script to translate
 * @return the corresponding {@code ScriptCode}; {@code ScriptCode.Common} when there is no explicit mapping
 * @throws NullPointerException if {@code scriptId} is {@code null} (switching on a null enum value)
 */
public static ScriptCode unicodeScriptToULScript(Character.UnicodeScript scriptId) {
    // Seeded with the fallback so COMMON, UNKNOWN and unmapped scripts need no assignment.
    ScriptCode mapped = ScriptCode.Common;
    switch (scriptId) {
        case LATIN:
            mapped = ScriptCode.Latin;
            break;
        case GREEK:
            mapped = ScriptCode.Greek;
            break;
        case CYRILLIC:
            mapped = ScriptCode.Cyrillic;
            break;
        case ARMENIAN:
            mapped = ScriptCode.Armenian;
            break;
        case HEBREW:
            mapped = ScriptCode.Hebrew;
            break;
        case ARABIC:
            mapped = ScriptCode.Arabic;
            break;
        case SYRIAC:
            mapped = ScriptCode.Syriac;
            break;
        case THAANA:
            mapped = ScriptCode.Thaana;
            break;
        case DEVANAGARI:
            mapped = ScriptCode.Devanagari;
            break;
        case BENGALI:
            mapped = ScriptCode.Bengali;
            break;
        case GURMUKHI:
            mapped = ScriptCode.Gurmukhi;
            break;
        case GUJARATI:
            mapped = ScriptCode.Gujarati;
            break;
        case ORIYA:
            mapped = ScriptCode.Oriya;
            break;
        case TAMIL:
            mapped = ScriptCode.Tamil;
            break;
        case TELUGU:
            mapped = ScriptCode.Telugu;
            break;
        case KANNADA:
            mapped = ScriptCode.Kannada;
            break;
        case MALAYALAM:
            mapped = ScriptCode.Malayalam;
            break;
        case SINHALA:
            mapped = ScriptCode.Sinhala;
            break;
        case THAI:
            mapped = ScriptCode.Thai;
            break;
        case LAO:
            mapped = ScriptCode.Lao;
            break;
        case TIBETAN:
            mapped = ScriptCode.Tibetan;
            break;
        case MYANMAR:
            mapped = ScriptCode.Myanmar;
            break;
        case GEORGIAN:
            mapped = ScriptCode.Georgian;
            break;
        // These four scripts intentionally share a single target code.
        case HANGUL:
        case HAN: // (based on testing cld3 vs java codepoints)
        case HIRAGANA: // (based on testing cld3 vs java codepoints)
        case KATAKANA: // (based on testing cld3 vs java codepoints)
            mapped = ScriptCode.Hani;
            break;
        case ETHIOPIC:
            mapped = ScriptCode.Ethiopic;
            break;
        case CHEROKEE:
            mapped = ScriptCode.Cherokee;
            break;
        case CANADIAN_ABORIGINAL:
            mapped = ScriptCode.Canadian_Aboriginal;
            break;
        case OGHAM:
            mapped = ScriptCode.Ogham;
            break;
        case RUNIC:
            mapped = ScriptCode.Runic;
            break;
        case KHMER:
            mapped = ScriptCode.Khmer;
            break;
        case MONGOLIAN:
            mapped = ScriptCode.Mongolian;
            break;
        case BOPOMOFO:
            mapped = ScriptCode.Bopomofo;
            break;
        case YI:
            mapped = ScriptCode.Yi;
            break;
        case OLD_ITALIC:
            mapped = ScriptCode.Old_Italic;
            break;
        case GOTHIC:
            mapped = ScriptCode.Gothic;
            break;
        case DESERET:
            mapped = ScriptCode.Deseret;
            break;
        case INHERITED:
            mapped = ScriptCode.Inherited;
            break;
        case TAGALOG:
            mapped = ScriptCode.Tagalog;
            break;
        case HANUNOO:
            mapped = ScriptCode.Hanunoo;
            break;
        case BUHID:
            mapped = ScriptCode.Buhid;
            break;
        case TAGBANWA:
            mapped = ScriptCode.Tagbanwa;
            break;
        case LIMBU:
            mapped = ScriptCode.Limbu;
            break;
        case TAI_LE:
            mapped = ScriptCode.Tai_Le;
            break;
        case LINEAR_B:
            mapped = ScriptCode.Linear_B;
            break;
        case UGARITIC:
            mapped = ScriptCode.Ugaritic;
            break;
        case SHAVIAN:
            mapped = ScriptCode.Shavian;
            break;
        case OSMANYA:
            mapped = ScriptCode.Osmanya;
            break;
        case CYPRIOT:
            mapped = ScriptCode.Cypriot;
            break;
        case BRAILLE:
            mapped = ScriptCode.Braille;
            break;
        case BUGINESE:
            mapped = ScriptCode.Buginese;
            break;
        case COPTIC:
            mapped = ScriptCode.Coptic;
            break;
        case NEW_TAI_LUE:
            mapped = ScriptCode.New_Tai_Lue;
            break;
        case GLAGOLITIC:
            mapped = ScriptCode.Glagolitic;
            break;
        case TIFINAGH:
            mapped = ScriptCode.Tifinagh;
            break;
        case SYLOTI_NAGRI:
            mapped = ScriptCode.Syloti_Nagri;
            break;
        case OLD_PERSIAN:
            mapped = ScriptCode.Old_Persian;
            break;
        case KHAROSHTHI:
            mapped = ScriptCode.Kharoshthi;
            break;
        case BALINESE:
            mapped = ScriptCode.Balinese;
            break;
        case CUNEIFORM:
            mapped = ScriptCode.Cuneiform;
            break;
        case PHOENICIAN:
            mapped = ScriptCode.Phoenician;
            break;
        case PHAGS_PA:
            mapped = ScriptCode.Phags_Pa;
            break;
        case NKO:
            mapped = ScriptCode.Nko;
            break;
        case SUNDANESE:
            mapped = ScriptCode.Sundanese;
            break;
        case LEPCHA:
            mapped = ScriptCode.Lepcha;
            break;
        case OL_CHIKI:
            mapped = ScriptCode.Ol_Chiki;
            break;
        case VAI:
            mapped = ScriptCode.Vai;
            break;
        case SAURASHTRA:
            mapped = ScriptCode.Saurashtra;
            break;
        case KAYAH_LI:
            mapped = ScriptCode.Kayah_Li;
            break;
        case REJANG:
            mapped = ScriptCode.Rejang;
            break;
        case LYCIAN:
            mapped = ScriptCode.Lycian;
            break;
        case CARIAN:
            mapped = ScriptCode.Carian;
            break;
        case LYDIAN:
            mapped = ScriptCode.Lydian;
            break;
        case CHAM:
            mapped = ScriptCode.Cham;
            break;
        case TAI_THAM:
            mapped = ScriptCode.Tai_Tham;
            break;
        case TAI_VIET:
            mapped = ScriptCode.Tai_Viet;
            break;
        case AVESTAN:
            mapped = ScriptCode.Avestan;
            break;
        case EGYPTIAN_HIEROGLYPHS:
            mapped = ScriptCode.Egyptian_Hieroglyphs;
            break;
        case SAMARITAN:
            mapped = ScriptCode.Samaritan;
            break;
        case LISU:
            mapped = ScriptCode.Lisu;
            break;
        case BAMUM:
            mapped = ScriptCode.Bamum;
            break;
        case JAVANESE:
            mapped = ScriptCode.Javanese;
            break;
        case MEETEI_MAYEK:
            mapped = ScriptCode.Meetei_Mayek;
            break;
        case IMPERIAL_ARAMAIC:
            mapped = ScriptCode.Imperial_Aramaic;
            break;
        case OLD_SOUTH_ARABIAN:
            mapped = ScriptCode.Old_South_Arabian;
            break;
        case INSCRIPTIONAL_PARTHIAN:
            mapped = ScriptCode.Inscriptional_Parthian;
            break;
        case INSCRIPTIONAL_PAHLAVI:
            mapped = ScriptCode.Inscriptional_Pahlavi;
            break;
        case OLD_TURKIC:
            mapped = ScriptCode.Old_Turkic;
            break;
        case KAITHI:
            mapped = ScriptCode.Kaithi;
            break;
        case BATAK:
            mapped = ScriptCode.Batak;
            break;
        case BRAHMI:
            mapped = ScriptCode.Brahmi;
            break;
        case MANDAIC:
            mapped = ScriptCode.Mandaic;
            break;
        case MEROITIC_CURSIVE:
            mapped = ScriptCode.Meroitic_Cursive;
            break;
        case MEROITIC_HIEROGLYPHS:
            mapped = ScriptCode.Meroitic_Hieroglyphs;
            break;
        case CHAKMA:
            mapped = ScriptCode.Chakma;
            break;
        case SHARADA:
            mapped = ScriptCode.Sharada;
            break;
        case SORA_SOMPENG:
            mapped = ScriptCode.Sora_Sompeng;
            break;
        case MIAO:
            mapped = ScriptCode.Miao;
            break;
        case TAKRI:
            mapped = ScriptCode.Takri;
            break;
        case COMMON:
        case UNKNOWN:
        default:
            // Keep the pre-seeded ScriptCode.Common fallback.
            break;
    }
    return mapped;
}