Commit e8c1cf44, authored by Nikolay Sivov, committed by Alexandre Julliard

Update data tables to Unicode 8.0.0.

parent fb6ad0fe
......@@ -45,6 +45,8 @@ struct dwritescript_properties {
static const struct dwritescript_properties dwritescripts_properties[Script_LastId+1] = {
{ /* Zzzz */ { 0x7a7a7a5a, 999, 15, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Zyyy */ { 0x7979795a, 998, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 } },
{ /* Ahom */ { 0x6d6f6841, 338, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Hluw */ { 0x77756c48, 80, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Arab */ { 0x62617241, 160, 8, 0x0640, 0, 1, 0, 0, 0, 1, 1 }, _OT('a','r','a','b'), 0, TRUE },
{ /* Armn */ { 0x6e6d7241, 230, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('a','r','m','n') },
{ /* Avst */ { 0x74737641, 134, 8, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('a','v','s','t') },
......@@ -84,6 +86,7 @@ static const struct dwritescript_properties dwritescripts_properties[Script_Last
{ /* Hani */ { 0x696e6148, 500, 8, 0x0020, 0, 0, 1, 1, 0, 0, 0 }, _OT('h','a','n','i') },
{ /* Hang */ { 0x676e6148, 286, 8, 0x0020, 1, 1, 1, 1, 0, 0, 0 }, _OT('h','a','n','g'), 0, TRUE },
{ /* Hano */ { 0x6f6e6148, 371, 8, 0x0020, 0, 0, 1, 0, 0, 0, 0 }, _OT('h','a','n','o') },
{ /* Hatr */ { 0x72746148, 127, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Hebr */ { 0x72626548, 125, 8, 0x0020, 1, 1, 1, 0, 0, 0, 0 }, _OT('h','e','b','r'), 0, TRUE },
{ /* Hira */ { 0x61726948, 410, 8, 0x0020, 0, 0, 1, 1, 0, 0, 0 }, _OT('k','a','n','a') },
{ /* Armi */ { 0x696d7241, 124, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('a','r','m','i') },
......@@ -119,12 +122,14 @@ static const struct dwritescript_properties dwritescripts_properties[Script_Last
{ /* Modi */ { 0x69646f4d, 324, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Mong */ { 0x676e6f4d, 145, 8, 0x0020, 0, 1, 0, 0, 0, 1, 1 }, _OT('m','o','n','g'), 0, TRUE },
{ /* Mroo */ { 0x6f6f724d, 199, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Mult */ { 0x746c754d, 323, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Mymr */ { 0x726d794d, 350, 15, 0x0020, 1, 1, 1, 0, 0, 0, 0 }, _OT('m','y','m','r'), 0, TRUE },
{ /* Nbat */ { 0x7461624e, 159, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Talu */ { 0x756c6154, 354, 8, 0x0020, 1, 1, 1, 0, 0, 0, 0 }, _OT('t','a','l','u'), 0, TRUE },
{ /* Nkoo */ { 0x6f6f6b4e, 165, 8, 0x0020, 0, 1, 0, 0, 0, 1, 1 }, _OT('n','k','o',' '), 0, TRUE },
{ /* Ogam */ { 0x6d61674f, 212, 1, 0x1680, 0, 1, 0, 0, 0, 1, 0 }, _OT('o','g','a','m'), 0, TRUE },
{ /* Olck */ { 0x6b636c4f, 261, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('o','l','c','k') },
{ /* Hung */ { 0x676e7548, 176, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Ital */ { 0x6c617449, 210, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('i','t','a','l') },
{ /* Narb */ { 0x6272614e, 106, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Perm */ { 0x6d726550, 227, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
......@@ -146,6 +151,7 @@ static const struct dwritescript_properties dwritescripts_properties[Script_Last
{ /* Shrd */ { 0x64726853, 319, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 }, _OT('s','h','r','d') },
{ /* Shaw */ { 0x77616853, 281, 1, 0x0020, 0, 1, 1, 0, 0, 0, 0 }, _OT('s','h','a','w') },
{ /* Sidd */ { 0x64646953, 302, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Sgnw */ { 0x776e6753, 95, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 } },
{ /* Sinh */ { 0x686e6953, 348, 8, 0x0020, 1, 1, 1, 0, 0, 0, 0 }, _OT('s','i','n','h'), 0, TRUE },
{ /* Sora */ { 0x61726f53, 398, 1, 0x0020, 0, 0, 0, 0, 0, 0, 0 }, _OT('s','o','r','a') },
{ /* Sund */ { 0x646e7553, 362, 8, 0x0020, 1, 1, 1, 0, 0, 0, 0 }, _OT('s','u','n','d') },
......
/* Unicode Bidirectional Bracket table */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/BidiBrackets.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/BidiBrackets.txt */
/* DO NOT EDIT!! */
const unsigned short bidi_bracket_table[768] =
......
/* Unicode BiDi mirroring */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/BidiMirroring.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/BidiMirroring.txt */
/* DO NOT EDIT!! */
#include "wine/unicode.h"
......
/* Unicode Script IDs */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/Scripts.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/Scripts.txt */
/* DO NOT EDIT!! */
enum unicode_script_id {
Script_Unknown = 0,
Script_Common = 1,
Script_Arabic = 2,
Script_Armenian = 3,
Script_Avestan = 4,
Script_Balinese = 5,
Script_Bamum = 6,
Script_Bassa_Vah = 7,
Script_Batak = 8,
Script_Bengali = 9,
Script_Bopomofo = 10,
Script_Brahmi = 11,
Script_Braille = 12,
Script_Buginese = 13,
Script_Buhid = 14,
Script_Canadian_Aboriginal = 15,
Script_Carian = 16,
Script_Caucasian_Albanian = 17,
Script_Chakma = 18,
Script_Cham = 19,
Script_Cherokee = 20,
Script_Coptic = 21,
Script_Cuneiform = 22,
Script_Cypriot = 23,
Script_Cyrillic = 24,
Script_Deseret = 25,
Script_Devanagari = 26,
Script_Duployan = 27,
Script_Egyptian_Hieroglyphs = 28,
Script_Elbasan = 29,
Script_Ethiopic = 30,
Script_Georgian = 31,
Script_Glagolitic = 32,
Script_Gothic = 33,
Script_Grantha = 34,
Script_Greek = 35,
Script_Gujarati = 36,
Script_Gurmukhi = 37,
Script_Han = 38,
Script_Hangul = 39,
Script_Hanunoo = 40,
Script_Hebrew = 41,
Script_Hiragana = 42,
Script_Imperial_Aramaic = 43,
Script_Inscriptional_Pahlavi = 44,
Script_Inscriptional_Parthian = 45,
Script_Javanese = 46,
Script_Kaithi = 47,
Script_Kannada = 48,
Script_Katakana = 49,
Script_Kayah_Li = 50,
Script_Kharoshthi = 51,
Script_Khmer = 52,
Script_Khojki = 53,
Script_Khudawadi = 54,
Script_Lao = 55,
Script_Latin = 56,
Script_Lepcha = 57,
Script_Limbu = 58,
Script_Linear_A = 59,
Script_Linear_B = 60,
Script_Lisu = 61,
Script_Lycian = 62,
Script_Lydian = 63,
Script_Mahajani = 64,
Script_Malayalam = 65,
Script_Mandaic = 66,
Script_Manichaean = 67,
Script_Meetei_Mayek = 68,
Script_Mende_Kikakui = 69,
Script_Meroitic_Cursive = 70,
Script_Meroitic_Hieroglyphs = 71,
Script_Miao = 72,
Script_Modi = 73,
Script_Mongolian = 74,
Script_Mro = 75,
Script_Myanmar = 76,
Script_Nabataean = 77,
Script_New_Tai_Lue = 78,
Script_Nko = 79,
Script_Ogham = 80,
Script_Ol_Chiki = 81,
Script_Old_Italic = 82,
Script_Old_North_Arabian = 83,
Script_Old_Permic = 84,
Script_Old_Persian = 85,
Script_Old_South_Arabian = 86,
Script_Old_Turkic = 87,
Script_Oriya = 88,
Script_Osmanya = 89,
Script_Pahawh_Hmong = 90,
Script_Palmyrene = 91,
Script_Pau_Cin_Hau = 92,
Script_Phags_Pa = 93,
Script_Phoenician = 94,
Script_Psalter_Pahlavi = 95,
Script_Rejang = 96,
Script_Runic = 97,
Script_Samaritan = 98,
Script_Saurashtra = 99,
Script_Sharada = 100,
Script_Shavian = 101,
Script_Siddham = 102,
Script_Sinhala = 103,
Script_Sora_Sompeng = 104,
Script_Sundanese = 105,
Script_Syloti_Nagri = 106,
Script_Syriac = 107,
Script_Tagalog = 108,
Script_Tagbanwa = 109,
Script_Tai_Le = 110,
Script_Tai_Tham = 111,
Script_Tai_Viet = 112,
Script_Takri = 113,
Script_Tamil = 114,
Script_Telugu = 115,
Script_Thaana = 116,
Script_Thai = 117,
Script_Tibetan = 118,
Script_Tifinagh = 119,
Script_Tirhuta = 120,
Script_Ugaritic = 121,
Script_Vai = 122,
Script_Warang_Citi = 123,
Script_Yi = 124,
Script_LastId = 124
Script_Ahom = 2,
Script_Anatolian_Hieroglyphs = 3,
Script_Arabic = 4,
Script_Armenian = 5,
Script_Avestan = 6,
Script_Balinese = 7,
Script_Bamum = 8,
Script_Bassa_Vah = 9,
Script_Batak = 10,
Script_Bengali = 11,
Script_Bopomofo = 12,
Script_Brahmi = 13,
Script_Braille = 14,
Script_Buginese = 15,
Script_Buhid = 16,
Script_Canadian_Aboriginal = 17,
Script_Carian = 18,
Script_Caucasian_Albanian = 19,
Script_Chakma = 20,
Script_Cham = 21,
Script_Cherokee = 22,
Script_Coptic = 23,
Script_Cuneiform = 24,
Script_Cypriot = 25,
Script_Cyrillic = 26,
Script_Deseret = 27,
Script_Devanagari = 28,
Script_Duployan = 29,
Script_Egyptian_Hieroglyphs = 30,
Script_Elbasan = 31,
Script_Ethiopic = 32,
Script_Georgian = 33,
Script_Glagolitic = 34,
Script_Gothic = 35,
Script_Grantha = 36,
Script_Greek = 37,
Script_Gujarati = 38,
Script_Gurmukhi = 39,
Script_Han = 40,
Script_Hangul = 41,
Script_Hanunoo = 42,
Script_Hatran = 43,
Script_Hebrew = 44,
Script_Hiragana = 45,
Script_Imperial_Aramaic = 46,
Script_Inscriptional_Pahlavi = 47,
Script_Inscriptional_Parthian = 48,
Script_Javanese = 49,
Script_Kaithi = 50,
Script_Kannada = 51,
Script_Katakana = 52,
Script_Kayah_Li = 53,
Script_Kharoshthi = 54,
Script_Khmer = 55,
Script_Khojki = 56,
Script_Khudawadi = 57,
Script_Lao = 58,
Script_Latin = 59,
Script_Lepcha = 60,
Script_Limbu = 61,
Script_Linear_A = 62,
Script_Linear_B = 63,
Script_Lisu = 64,
Script_Lycian = 65,
Script_Lydian = 66,
Script_Mahajani = 67,
Script_Malayalam = 68,
Script_Mandaic = 69,
Script_Manichaean = 70,
Script_Meetei_Mayek = 71,
Script_Mende_Kikakui = 72,
Script_Meroitic_Cursive = 73,
Script_Meroitic_Hieroglyphs = 74,
Script_Miao = 75,
Script_Modi = 76,
Script_Mongolian = 77,
Script_Mro = 78,
Script_Multani = 79,
Script_Myanmar = 80,
Script_Nabataean = 81,
Script_New_Tai_Lue = 82,
Script_Nko = 83,
Script_Ogham = 84,
Script_Ol_Chiki = 85,
Script_Old_Hungarian = 86,
Script_Old_Italic = 87,
Script_Old_North_Arabian = 88,
Script_Old_Permic = 89,
Script_Old_Persian = 90,
Script_Old_South_Arabian = 91,
Script_Old_Turkic = 92,
Script_Oriya = 93,
Script_Osmanya = 94,
Script_Pahawh_Hmong = 95,
Script_Palmyrene = 96,
Script_Pau_Cin_Hau = 97,
Script_Phags_Pa = 98,
Script_Phoenician = 99,
Script_Psalter_Pahlavi = 100,
Script_Rejang = 101,
Script_Runic = 102,
Script_Samaritan = 103,
Script_Saurashtra = 104,
Script_Sharada = 105,
Script_Shavian = 106,
Script_Siddham = 107,
Script_SignWriting = 108,
Script_Sinhala = 109,
Script_Sora_Sompeng = 110,
Script_Sundanese = 111,
Script_Syloti_Nagri = 112,
Script_Syriac = 113,
Script_Tagalog = 114,
Script_Tagbanwa = 115,
Script_Tai_Le = 116,
Script_Tai_Tham = 117,
Script_Tai_Viet = 118,
Script_Takri = 119,
Script_Tamil = 120,
Script_Telugu = 121,
Script_Thaana = 122,
Script_Thai = 123,
Script_Tibetan = 124,
Script_Tifinagh = 125,
Script_Tirhuta = 126,
Script_Ugaritic = 127,
Script_Vai = 128,
Script_Warang_Citi = 129,
Script_Yi = 130,
Script_LastId = 130
};
/* Unicode Bidirectional Bracket table */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/BidiBrackets.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/BidiBrackets.txt */
/* DO NOT EDIT!! */
const unsigned short bidi_bracket_table[768] =
......
/* Unicode BiDi mirroring */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/BidiMirroring.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/BidiMirroring.txt */
/* DO NOT EDIT!! */
#include "wine/unicode.h"
......
/* Unicode Arabic shaping */
/* generated from http://www.unicode.org/Public/7.0.0/ucd/ArabicShaping.txt */
/* generated from http://www.unicode.org/Public/8.0.0/ucd/ArabicShaping.txt */
/* DO NOT EDIT!! */
const unsigned short wine_shaping_table[2864] =
const unsigned short wine_shaping_table[2848] =
{
/* level 1 offsets */
0x0100, 0x0110, 0x0110, 0x0120, 0x0130, 0x0140, 0x0150, 0x0160,
......@@ -95,7 +95,7 @@ const unsigned short wine_shaping_table[2864] =
0x0340, 0x0340, 0x0a00, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0340, 0x0a10, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0490, 0x0a20,
0x0340, 0x0490, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0940,
0x0340, 0x06d0, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0940,
0x0a30, 0x0340, 0x06f0, 0x0340, 0x0530, 0x0530, 0x0530, 0x0a40,
0x0340, 0x0340, 0x0340, 0x0340, 0x0a50, 0x0340, 0x0360, 0x0940,
0x0340, 0x0340, 0x0a60, 0x0340, 0x0a70, 0x0940, 0x0340, 0x0340,
......@@ -106,10 +106,10 @@ const unsigned short wine_shaping_table[2864] =
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0af0, 0x0340,
0x0340, 0x0b00, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0360, 0x0340, 0x0b10, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0360, 0x0340, 0x0360, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0490,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0b20,
0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0340, 0x0b10,
/* values */
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
......@@ -183,15 +183,15 @@ const unsigned short wine_shaping_table[2864] =
0x0001, 0x0001, 0x0000, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001,
0x0001, 0x0001, 0x0001, 0x0001, 0x0000, 0x0001, 0x0001, 0x0001,
0x0000, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0000, 0x0000,
0x0002, 0x0004, 0x0004, 0x0004, 0x0004, 0x0004, 0x0002, 0x0004,
0x0004, 0x0002, 0x0004, 0x0004, 0x0004, 0x0004, 0x0004, 0x0002,
0x0002, 0x0004, 0x0004, 0x0004, 0x0004, 0x0004, 0x0002, 0x0002,
0x0004, 0x0002, 0x0004, 0x0004, 0x0004, 0x0004, 0x0004, 0x0004,
0x0004, 0x0004, 0x0004, 0x0004, 0x0002, 0x0004, 0x0000, 0x0000,
0x0000, 0x0001, 0x0001, 0x0001, 0x0000, 0x0000, 0x0000, 0x0000,
0x0404, 0x0404, 0x0604, 0x0b04, 0x0f04, 0x1004, 0x1204, 0x1304,
0x0104, 0x0104, 0x0802, 0x0302, 0x3402, 0x0000, 0x0702, 0x0a04,
0x0d04, 0x3502, 0x0802, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0d04, 0x3502, 0x0802, 0x0c04, 0x1104, 0x0000, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0001, 0x0001, 0x0001, 0x0001,
0x0000, 0x0000, 0x0000, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001,
0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001,
0x0001, 0x0001, 0x0001, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
......@@ -361,8 +361,6 @@ const unsigned short wine_shaping_table[2864] =
0x0001, 0x0000, 0x0000, 0x0000, 0x0000, 0x0001, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0001, 0x0000,
0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001,
0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0001, 0x0000, 0x0000,
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000,
0x0000, 0x0001, 0x0001, 0x0001, 0x0000, 0x0000, 0x0000, 0x0000
};
......
No preview for this file type
......@@ -23,7 +23,7 @@ use strict;
# base URLs for www.unicode.org files
my $MAPPINGS = "http://www.unicode.org/Public/MAPPINGS";
my $UNIDATA = "http://www.unicode.org/Public/7.0.0/ucd";
my $UNIDATA = "http://www.unicode.org/Public/8.0.0/ucd";
my $REPORTS = "http://www.unicode.org/reports";
my $RFCS = "http://www.rfc-editor.org/rfc";
my $VERTICALDATA = "http://www.unicode.org/Public/vertical/revision-11";
......@@ -169,7 +169,11 @@ my %indic_types =
"Joiner" => 0x001b,
"Number_Joiner" => 0x001c,
"Number" => 0x001d,
"Brahmi_Joining_Number" => 0x001e
"Brahmi_Joining_Number" => 0x001e,
"Consonant_With_Stacker" => 0x001f,
"Consonant_Prefixed" => 0x0020,
"Syllable_Modifier" => 0x0021,
"Consonant_Killer" => 0x0022
);
my %matra_types =
......@@ -1207,7 +1211,7 @@ sub dump_indic($)
}
close $INPUT;
$INPUT = open_data_file( $UNIDATA, "IndicMatraCategory.txt" );
$INPUT = open_data_file( $UNIDATA, "IndicPositionalCategory.txt" );
while (<$INPUT>)
{
next if /^\#/; # skip comments
......@@ -1238,7 +1242,7 @@ sub dump_indic($)
print "Building $filename\n";
print OUTPUT "/* Unicode Indic Syllabic Category */\n";
print OUTPUT "/* generated from $UNIDATA/IndicSyllabicCategory.txt */\n";
print OUTPUT "/* and from $UNIDATA/IndicMatraCategory.txt */\n";
print OUTPUT "/* and from $UNIDATA/IndicPositionalCategory.txt */\n";
print OUTPUT "/* DO NOT EDIT!! */\n\n";
dump_two_level_mapping( "indic_syllabic_table", @indic_table);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment