Module:Unicode data/scripts

< Module:Unicode data

Documentation for this module may be created at Module:Unicode data/scripts/doc

---- Module:Unicode data/scripts  (static data; no mw.ext.data)
--
-- Static lookup data mapping Unicode code points to ISO 15924 script codes.
-- Returns a table with three fields:
--   singles : map of individual code point -> script code (currently empty)
--   ranges  : array of {first, last, script} triples, both ends inclusive
--   rtl     : set of script codes that are written right-to-left
--
-- Coverage is deliberately minimal (expand later if you like); code points
-- not listed here are simply absent from the table.
return {
  singles = {},

  -- INVARIANT: entries are in strictly ascending code point order and never
  -- overlap, so the table is usable by a linear scan and by a binary search
  -- alike. Keep it that way when adding ranges.
  -- NOTE(review): the lookup code lives in the parent module, which is not
  -- visible here; upstream Module:Unicode data binary-searches this table,
  -- which silently fails on unsorted input -- confirm against the consumer.
  -- Script assignments follow the Unicode Character Database (Scripts.txt);
  -- unassigned code points inside a covered block are left approximated.
  ranges = {
    -- Basic Latin: letters are Latn, everything else is Common
    {0x0000,0x002F,'Zyyy'},{0x0030,0x0039,'Zyyy'},{0x003A,0x0040,'Zyyy'},
    {0x0041,0x005A,'Latn'},
    {0x005B,0x0060,'Zyyy'},
    {0x0061,0x007A,'Latn'},
    {0x007B,0x007E,'Zyyy'},

    -- Latin-1 letters; the two math signs in the middle are Common
    {0x00C0,0x00D6,'Latn'},
    {0x00D7,0x00D7,'Zyyy'},      -- MULTIPLICATION SIGN
    {0x00D8,0x00F6,'Latn'},
    {0x00F7,0x00F7,'Zyyy'},      -- DIVISION SIGN
    {0x00F8,0x00FF,'Latn'},
    {0x0100,0x017F,'Latn'},      -- Latin Extended-A

    -- Combining Diacritical Marks (Inherited)
    {0x0300,0x036F,'Zinh'},

    -- Greek and Coptic block
    {0x0370,0x0373,'Grek'},
    {0x0374,0x0374,'Zyyy'},      -- GREEK NUMERAL SIGN
    {0x0375,0x037D,'Grek'},
    {0x037E,0x037E,'Zyyy'},      -- GREEK QUESTION MARK
    {0x037F,0x0384,'Grek'},
    {0x0385,0x0385,'Zyyy'},      -- GREEK DIALYTIKA TONOS
    {0x0386,0x0386,'Grek'},
    {0x0387,0x0387,'Zyyy'},      -- GREEK ANO TELEIA
    {0x0388,0x03E1,'Grek'},
    {0x03E2,0x03EF,'Copt'},      -- Coptic letters derived from Demotic
    {0x03F0,0x03FF,'Grek'},

    -- General Punctuation (Common), except the joiners, which are Inherited
    {0x2000,0x200B,'Zyyy'},
    {0x200C,0x200D,'Zinh'},      -- ZWNJ, ZWJ
    {0x200E,0x206F,'Zyyy'},

    -- Japanese
    {0x3040,0x3098,'Hira'},      -- Hiragana
    {0x3099,0x309A,'Zinh'},      -- combining (semi-)voiced sound marks
    {0x309B,0x309C,'Zyyy'},      -- spacing (semi-)voiced sound marks
    {0x309D,0x309F,'Hira'},      -- Hiragana iteration marks, digraph yori
    {0x30A0,0x30A0,'Zyyy'},      -- KATAKANA-HIRAGANA DOUBLE HYPHEN
    {0x30A1,0x30FA,'Kana'},      -- Katakana
    {0x30FB,0x30FC,'Zyyy'},      -- middle dot, prolonged sound mark
    {0x30FD,0x30FF,'Kana'},      -- Katakana iteration marks, digraph koto
    {0x31F0,0x31FF,'Kana'},      -- Katakana Phonetic Extensions
    {0x3400,0x4DBF,'Hani'},      -- CJK Ext A
    {0x4E00,0x9FFF,'Hani'},      -- CJK Unified Ideographs
  },

  -- Needed by is_rtl()
  rtl = { Hebr=true, Arab=true, Syrc=true, Thaa=true, Nkoo=true, Adlm=true },
}