douguiyan9164 2019-05-06 11:01
浏览 110

在Go中获取Unicode脚本名称

In Go, I want to get the RangeTable of a script given a specific language.

import (
    "golang.org/x/text/language"
    "unicode"
)

...

// Look up the script associated with French; String() yields its four-letter code.
script, confidence := language.French.Script() 
scriptAsString := script.String() // here scriptAsString = "Latn"
// Use that code directly as a key into the unicode.Scripts table.
rangeTable, ok := unicode.Scripts[scriptAsString]
// Here ok = false, because the Scripts map has the key "Latin" (the script
// name) and not "Latn" (the script code).

The problem is that the following method returns the four-letter script code (e.g. "Latn"):

func (s Script) String() string 

Whereas the unicode.Scripts map is keyed by the full script name (e.g. "Latin").

Do you know if there is a way, using only the Go standard library, to go from a script code to a script name?

EDIT:

opened issue here: github.com/golang/go/issues/31862

  • 写回答

1条回答 默认 最新

  • douxuanou2787 2019-05-06 13:24
    关注

    This is the kind of mapping I was after:

    // scriptCodeToScriptNames maps a four-letter script code (the form returned
    // by language.Script.String(), e.g. "Latn") to the script name(s) intended
    // for use as keys of the unicode.Scripts map (e.g. "Latin").
    //
    // Codes that denote a combination of scripts (e.g. "Jpan", "Kore", "Hrkt")
    // map to several names; codes that denote a variant of a script (e.g.
    // "Latf", "Cyrs", "Geok") map to the name of the base script.
    //
    // NOTE(review): some codes here (e.g. "Afak", "Teng") appear to name scripts
    // that have no table in unicode.Scripts, and which names are present
    // depends on the Unicode version of the Go release in use. Callers should
    // always check the ok result of the unicode.Scripts lookup.
    var scriptCodeToScriptNames = map[string][]string{
        "Adlm": {"Adlam"},
        "Afak": {"Afaka"},
        "Aghb": {"Caucasian_Albanian"},
        "Ahom": {"Ahom"},
        "Arab": {"Arabic"},
        "Aran": {"Arabic"},
        "Armi": {"Imperial_Aramaic"},
        "Armn": {"Armenian"},
        "Avst": {"Avestan"},
        "Bali": {"Balinese"},
        "Bamu": {"Bamum"},
        "Bass": {"Bassa_Vah"},
        "Batk": {"Batak"},
        "Beng": {"Bengali"},
        "Bhks": {"Bhaiksuki"},
        "Bopo": {"Bopomofo"},
        "Brah": {"Brahmi"},
        "Brai": {"Braille"},
        "Bugi": {"Buginese"},
        "Buhd": {"Buhid"},
        "Cakm": {"Chakma"},
        "Cans": {"Canadian_Aboriginal"},
        "Cari": {"Carian"},
        "Cham": {"Cham"},
        "Cher": {"Cherokee"},
        "Copt": {"Coptic"},
        // Unicode script names use underscores, never hyphens.
        "Cpmn": {"Cypro_Minoan"},
        "Cprt": {"Cypriot"},
        "Cyrl": {"Cyrillic"},
        "Cyrs": {"Cyrillic"},
        "Deva": {"Devanagari"},
        "Dogr": {"Dogra"},
        "Dsrt": {"Deseret"},
        "Dupl": {"Duployan"},
        "Egyd": {"Egyptian_Demotic"},
        "Egyh": {"Egyptian_Hieratic"},
        "Egyp": {"Egyptian_Hieroglyphs"},
        "Elba": {"Elbasan"},
        "Ethi": {"Ethiopic"},
        // Khutsuri is a variant of Georgian; map it to the base script like
        // the other variant codes in this table.
        "Geok": {"Georgian"},
        "Geor": {"Georgian"},
        "Glag": {"Glagolitic"},
        "Gong": {"Gunjala_Gondi"},
        "Gonm": {"Masaram_Gondi"},
        "Goth": {"Gothic"},
        "Gran": {"Grantha"},
        "Grek": {"Greek"},
        "Gujr": {"Gujarati"},
        "Guru": {"Gurmukhi"},
        "Hanb": {"Han", "Bopomofo"},
        "Hang": {"Hangul"},
        "Hani": {"Han"},
        "Hano": {"Hanunoo"},
        "Hans": {"Han"},
        "Hant": {"Han"},
        "Hatr": {"Hatran"},
        "Hebr": {"Hebrew"},
        "Hira": {"Hiragana"},
        "Hluw": {"Anatolian_Hieroglyphs"},
        "Hmng": {"Pahawh_Hmong"},
        "Hmnp": {"Nyiakeng_Puachue_Hmong"},
        "Hrkt": {"Hiragana", "Katakana"},
        "Hung": {"Old_Hungarian"},
        "Inds": {"Indus_(Harappan)"},
        "Ital": {"Old_Italic"},
        "Jamo": {"Hangul"},
        "Java": {"Javanese"},
        "Jpan": {"Han", "Hiragana", "Katakana"},
        "Jurc": {"Jurchen"},
        "Kali": {"Kayah_Li"},
        "Kana": {"Katakana"},
        "Khar": {"Kharoshthi"},
        "Khmr": {"Khmer"},
        "Khoj": {"Khojki"},
        "Kitl": {"Khitan_large_script"},
        // Capitalised to match the Unicode script name exactly.
        "Kits": {"Khitan_Small_Script"},
        "Knda": {"Kannada"},
        "Kore": {"Hangul", "Han"},
        "Kpel": {"Kpelle"},
        "Kthi": {"Kaithi"},
        "Lana": {"Tai_Tham"},
        "Laoo": {"Lao"},
        "Latf": {"Latin"},
        "Latg": {"Latin"},
        "Latn": {"Latin"},
        "Leke": {"Leke"},
        "Lepc": {"Lepcha"},
        "Limb": {"Limbu"},
        "Lina": {"Linear_A"},
        "Linb": {"Linear_B"},
        "Lisu": {"Lisu"},
        "Loma": {"Loma"},
        "Lyci": {"Lycian"},
        "Lydi": {"Lydian"},
        "Mahj": {"Mahajani"},
        "Maka": {"Makasar"},
        "Mand": {"Mandaic"},
        "Mani": {"Manichaean"},
        "Marc": {"Marchen"},
        "Maya": {"Mayan_hieroglyphs"},
        "Mend": {"Mende_Kikakui"},
        "Merc": {"Meroitic_Cursive"},
        "Mero": {"Meroitic_Hieroglyphs"},
        "Mlym": {"Malayalam"},
        "Modi": {"Modi"},
        "Mong": {"Mongolian"},
        "Mroo": {"Mro"},
        "Mtei": {"Meetei_Mayek"},
        "Mult": {"Multani"},
        "Mymr": {"Myanmar"},
        "Narb": {"Old_North_Arabian"},
        "Nbat": {"Nabataean"},
        "Newa": {"Newa"},
        "Nkoo": {"Nko"},
        "Nshu": {"Nushu"},
        "Ogam": {"Ogham"},
        "Olck": {"Ol_Chiki"},
        "Orkh": {"Old_Turkic"},
        "Orya": {"Oriya"},
        "Osge": {"Osage"},
        "Osma": {"Osmanya"},
        "Palm": {"Palmyrene"},
        "Pauc": {"Pau_Cin_Hau"},
        "Perm": {"Old_Permic"},
        "Phag": {"Phags_Pa"},
        "Phli": {"Inscriptional_Pahlavi"},
        "Phlp": {"Psalter_Pahlavi"},
        "Phlv": {"Book_Pahlavi"},
        "Phnx": {"Phoenician"},
        "Plrd": {"Miao"},
        "Prti": {"Inscriptional_Parthian"},
        "Rjng": {"Rejang"},
        "Rohg": {"Hanifi_Rohingya"},
        "Roro": {"Rongorongo"},
        "Runr": {"Runic"},
        "Samr": {"Samaritan"},
        "Sara": {"Sarati"},
        "Sarb": {"Old_South_Arabian"},
        "Saur": {"Saurashtra"},
        "Sgnw": {"SignWriting"},
        "Shaw": {"Shavian"},
        "Shrd": {"Sharada"},
        "Shui": {"Shuishu"},
        "Sidd": {"Siddham"},
        "Sind": {"Khudawadi"},
        "Sinh": {"Sinhala"},
        "Sogd": {"Sogdian"},
        "Sogo": {"Old_Sogdian"},
        "Sora": {"Sora_Sompeng"},
        "Soyo": {"Soyombo"},
        "Sund": {"Sundanese"},
        "Sylo": {"Syloti_Nagri"},
        "Syrc": {"Syriac"},
        "Syre": {"Syriac"},
        "Syrj": {"Syriac"},
        "Syrn": {"Syriac"},
        "Tagb": {"Tagbanwa"},
        "Takr": {"Takri"},
        "Tale": {"Tai_Le"},
        "Talu": {"New_Tai_Lue"},
        "Taml": {"Tamil"},
        "Tang": {"Tangut"},
        "Tavt": {"Tai_Viet"},
        "Telu": {"Telugu"},
        "Teng": {"Tengwar"},
        "Tfng": {"Tifinagh"},
        "Tglg": {"Tagalog"},
        "Thaa": {"Thaana"},
        "Thai": {"Thai"},
        "Tibt": {"Tibetan"},
        "Tirh": {"Tirhuta"},
        "Ugar": {"Ugaritic"},
        "Vaii": {"Vai"},
        "Visp": {"Visible_Speech"},
        "Wara": {"Warang_Citi"},
        "Wcho": {"Wancho"},
        "Wole": {"Woleai"},
        "Xpeo": {"Old_Persian"},
        "Xsux": {"Cuneiform"},
        "Yiii": {"Yi"},
        "Zanb": {"Zanabazar_Square"},
        "Zinh": {"Inherited"},
        "Zyyy": {"Common"},
    }
    
    评论

报告相同问题?

悬赏问题

  • ¥30 帮我写一段可以读取LD2450数据并计算距离的Arduino代码
  • ¥15 C#调用python代码(python带有库)
  • ¥15 矩阵加法的规则是两个矩阵中对应位置的数的绝对值进行加和
  • ¥15 活动选择题。最多可以参加几个项目?
  • ¥15 飞机曲面部件如机翼,壁板等具体的孔位模型
  • ¥15 vs2019中数据导出问题
  • ¥20 云服务Linux系统TCP-MSS值修改?
  • ¥20 关于#单片机#的问题:项目:使用模拟iic与ov2640通讯环境:F407问题:读取的ID号总是0xff,自己调了调发现在读从机数据时,SDA线上并未有信号变化(语言-c语言)
  • ¥20 怎么在stm32门禁成品上增加查询记录功能
  • ¥15 Source insight编写代码后使用CCS5.2版本import之后,代码跳到注释行里面