зеркало из https://github.com/mozilla/gecko-dev.git
313 строки
6.5 KiB
C++
313 строки
6.5 KiB
C++
|
|
/* -*- Mode: C++; tab-width: 20; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
/*
|
|
* Derived from the Unicode Character Database by genUnicodePropertyData.pl
|
|
*
|
|
* For Unicode terms of use, see http://www.unicode.org/terms_of_use.html
|
|
*/
|
|
|
|
/*
|
|
* Created on Tue Nov 15 16:39:42 2016 from UCD data files with version info:
|
|
*
|
|
|
|
# Unicode Character Database
|
|
# Date: 2016-06-20, 14:59:00 GMT [KW]
|
|
# © 2016 Unicode®, Inc.
|
|
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
|
|
# For terms of use, see http://www.unicode.org/terms_of_use.html
|
|
#
|
|
# For documentation, see the following:
|
|
# NamesList.html
|
|
# UAX #38, "Unicode Han Database (Unihan)"
|
|
# UAX #44, "Unicode Character Database."
|
|
#
|
|
# The UAXes can be accessed at http://www.unicode.org/versions/Unicode9.0.0/
|
|
|
|
This directory contains the final data files
|
|
for the Unicode Character Database, for Version 9.0.0 of the Unicode Standard.
|
|
|
|
# Scripts-9.0.0.txt
|
|
# Date: 2016-06-01, 10:34:37 GMT
|
|
|
|
# BidiMirroring-9.0.0.txt
|
|
# Date: 2016-01-21, 22:00:00 GMT [KW, LI]
|
|
|
|
# BidiBrackets-9.0.0.txt
|
|
# Date: 2016-06-07, 22:30:00 GMT [AG, LI, KW]
|
|
|
|
# HangulSyllableType-9.0.0.txt
|
|
# Date: 2016-03-02, 18:55:01 GMT
|
|
|
|
# LineBreak-9.0.0.txt
|
|
# Date: 2016-05-26, 01:00:00 GMT [KW, LI]
|
|
|
|
# EastAsianWidth-9.0.0.txt
|
|
# Date: 2016-05-27, 17:00:00 GMT [KW, LI]
|
|
|
|
# DerivedCoreProperties-9.0.0.txt
|
|
# Date: 2016-06-01, 10:34:24 GMT
|
|
|
|
# IdentifierStatus.txt
|
|
# Date: 2016-06-16, 13:41:30 GMT
|
|
|
|
# IdentifierType.txt
|
|
# Date: 2016-06-16, 13:41:30 GMT
|
|
|
|
#
|
|
# Unihan_Variants.txt
|
|
# Date: 2016-06-01 07:01:48 GMT [JHJ]
|
|
|
|
# VerticalOrientation-16.txt
|
|
# Date: 2016-07-23, 01:00:00 GMT [EM, KI, LI]
|
|
|
|
*
|
|
* * * * * This file contains MACHINE-GENERATED DATA, do not edit! * * * * *
|
|
*/
|
|
|
|
#ifndef NS_UNICODE_SCRIPT_CODES
|
|
#define NS_UNICODE_SCRIPT_CODES
|
|
|
|
#pragma pack(1)
|
|
|
|
#if !ENABLE_INTL_API
|
|
|
|
struct nsCharProps1 {
|
|
unsigned char mMirrorOffsetIndex:5;
|
|
unsigned char mHangulType:3;
|
|
unsigned char mCombiningClass:8;
|
|
};
|
|
|
|
#endif
|
|
|
|
#if ENABLE_INTL_API
|
|
|
|
struct nsCharProps2 {
|
|
// Currently only 4 bits are defined here, so 4 more could be added without
|
|
// affecting the storage requirements for this struct. Or we could pack two
|
|
// records per byte, at the cost of a slightly more complex accessor.
|
|
unsigned char mVertOrient:2;
|
|
unsigned char mIdType:2;
|
|
};
|
|
|
|
#endif
|
|
|
|
#if !ENABLE_INTL_API
|
|
|
|
// This struct currently requires 5 bytes. We try to ensure that whole-byte
|
|
// fields will not straddle byte boundaries, to optimize access to them.
|
|
struct nsCharProps2 {
|
|
unsigned char mScriptCode:8;
|
|
// -- byte boundary --
|
|
unsigned char mPairedBracketType:2;
|
|
unsigned char mEastAsianWidthFWH:1;
|
|
unsigned char mCategory:5;
|
|
// -- byte boundary --
|
|
unsigned char mIdType:2;
|
|
unsigned char mDefaultIgnorable:1;
|
|
unsigned char mBidiCategory:5;
|
|
// -- byte boundary --
|
|
unsigned char mVertOrient:2;
|
|
unsigned char mLineBreak:6;
|
|
// -- byte boundary --
|
|
signed char mNumericValue; // only 5 bits are actually needed here
|
|
};
|
|
|
|
#endif
|
|
|
|
#pragma pack()
|
|
|
|
namespace mozilla {
|
|
namespace unicode {
|
|
enum class Script {
|
|
COMMON = 0,
|
|
INHERITED = 1,
|
|
ARABIC = 2,
|
|
ARMENIAN = 3,
|
|
BENGALI = 4,
|
|
BOPOMOFO = 5,
|
|
CHEROKEE = 6,
|
|
COPTIC = 7,
|
|
CYRILLIC = 8,
|
|
DESERET = 9,
|
|
DEVANAGARI = 10,
|
|
ETHIOPIC = 11,
|
|
GEORGIAN = 12,
|
|
GOTHIC = 13,
|
|
GREEK = 14,
|
|
GUJARATI = 15,
|
|
GURMUKHI = 16,
|
|
HAN = 17,
|
|
HANGUL = 18,
|
|
HEBREW = 19,
|
|
HIRAGANA = 20,
|
|
KANNADA = 21,
|
|
KATAKANA = 22,
|
|
KHMER = 23,
|
|
LAO = 24,
|
|
LATIN = 25,
|
|
MALAYALAM = 26,
|
|
MONGOLIAN = 27,
|
|
MYANMAR = 28,
|
|
OGHAM = 29,
|
|
OLD_ITALIC = 30,
|
|
ORIYA = 31,
|
|
RUNIC = 32,
|
|
SINHALA = 33,
|
|
SYRIAC = 34,
|
|
TAMIL = 35,
|
|
TELUGU = 36,
|
|
THAANA = 37,
|
|
THAI = 38,
|
|
TIBETAN = 39,
|
|
CANADIAN_ABORIGINAL = 40,
|
|
YI = 41,
|
|
TAGALOG = 42,
|
|
HANUNOO = 43,
|
|
BUHID = 44,
|
|
TAGBANWA = 45,
|
|
BRAILLE = 46,
|
|
CYPRIOT = 47,
|
|
LIMBU = 48,
|
|
LINEAR_B = 49,
|
|
OSMANYA = 50,
|
|
SHAVIAN = 51,
|
|
TAI_LE = 52,
|
|
UGARITIC = 53,
|
|
KATAKANA_OR_HIRAGANA = 54,
|
|
BUGINESE = 55,
|
|
GLAGOLITIC = 56,
|
|
KHAROSHTHI = 57,
|
|
SYLOTI_NAGRI = 58,
|
|
NEW_TAI_LUE = 59,
|
|
TIFINAGH = 60,
|
|
OLD_PERSIAN = 61,
|
|
BALINESE = 62,
|
|
BATAK = 63,
|
|
BLISSYMBOLS = 64,
|
|
BRAHMI = 65,
|
|
CHAM = 66,
|
|
CIRTH = 67,
|
|
OLD_CHURCH_SLAVONIC_CYRILLIC = 68,
|
|
DEMOTIC_EGYPTIAN = 69,
|
|
HIERATIC_EGYPTIAN = 70,
|
|
EGYPTIAN_HIEROGLYPHS = 71,
|
|
KHUTSURI = 72,
|
|
SIMPLIFIED_HAN = 73,
|
|
TRADITIONAL_HAN = 74,
|
|
PAHAWH_HMONG = 75,
|
|
OLD_HUNGARIAN = 76,
|
|
HARAPPAN_INDUS = 77,
|
|
JAVANESE = 78,
|
|
KAYAH_LI = 79,
|
|
LATIN_FRAKTUR = 80,
|
|
LATIN_GAELIC = 81,
|
|
LEPCHA = 82,
|
|
LINEAR_A = 83,
|
|
MANDAIC = 84,
|
|
MAYAN_HIEROGLYPHS = 85,
|
|
MEROITIC_HIEROGLYPHS = 86,
|
|
NKO = 87,
|
|
OLD_TURKIC = 88,
|
|
OLD_PERMIC = 89,
|
|
PHAGS_PA = 90,
|
|
PHOENICIAN = 91,
|
|
MIAO = 92,
|
|
RONGORONGO = 93,
|
|
SARATI = 94,
|
|
ESTRANGELO_SYRIAC = 95,
|
|
WESTERN_SYRIAC = 96,
|
|
EASTERN_SYRIAC = 97,
|
|
TENGWAR = 98,
|
|
VAI = 99,
|
|
VISIBLE_SPEECH = 100,
|
|
CUNEIFORM = 101,
|
|
UNWRITTEN_LANGUAGES = 102,
|
|
UNKNOWN = 103,
|
|
CARIAN = 104,
|
|
JAPANESE = 105,
|
|
TAI_THAM = 106,
|
|
LYCIAN = 107,
|
|
LYDIAN = 108,
|
|
OL_CHIKI = 109,
|
|
REJANG = 110,
|
|
SAURASHTRA = 111,
|
|
SIGNWRITING = 112,
|
|
SUNDANESE = 113,
|
|
MOON = 114,
|
|
MEETEI_MAYEK = 115,
|
|
IMPERIAL_ARAMAIC = 116,
|
|
AVESTAN = 117,
|
|
CHAKMA = 118,
|
|
KOREAN = 119,
|
|
KAITHI = 120,
|
|
MANICHAEAN = 121,
|
|
INSCRIPTIONAL_PAHLAVI = 122,
|
|
PSALTER_PAHLAVI = 123,
|
|
BOOK_PAHLAVI = 124,
|
|
INSCRIPTIONAL_PARTHIAN = 125,
|
|
SAMARITAN = 126,
|
|
TAI_VIET = 127,
|
|
MATHEMATICAL_NOTATION = 128,
|
|
SYMBOLS = 129,
|
|
BAMUM = 130,
|
|
LISU = 131,
|
|
NAKHI_GEBA = 132,
|
|
OLD_SOUTH_ARABIAN = 133,
|
|
BASSA_VAH = 134,
|
|
DUPLOYAN = 135,
|
|
ELBASAN = 136,
|
|
GRANTHA = 137,
|
|
KPELLE = 138,
|
|
LOMA = 139,
|
|
MENDE_KIKAKUI = 140,
|
|
MEROITIC_CURSIVE = 141,
|
|
OLD_NORTH_ARABIAN = 142,
|
|
NABATAEAN = 143,
|
|
PALMYRENE = 144,
|
|
KHUDAWADI = 145,
|
|
WARANG_CITI = 146,
|
|
AFAKA = 147,
|
|
JURCHEN = 148,
|
|
MRO = 149,
|
|
NUSHU = 150,
|
|
SHARADA = 151,
|
|
SORA_SOMPENG = 152,
|
|
TAKRI = 153,
|
|
TANGUT = 154,
|
|
WOLEAI = 155,
|
|
ANATOLIAN_HIEROGLYPHS = 156,
|
|
KHOJKI = 157,
|
|
TIRHUTA = 158,
|
|
CAUCASIAN_ALBANIAN = 159,
|
|
MAHAJANI = 160,
|
|
AHOM = 161,
|
|
HATRAN = 162,
|
|
MODI = 163,
|
|
MULTANI = 164,
|
|
PAU_CIN_HAU = 165,
|
|
SIDDHAM = 166,
|
|
ADLAM = 167,
|
|
BHAIKSUKI = 168,
|
|
MARCHEN = 169,
|
|
NEWA = 170,
|
|
OSAGE = 171,
|
|
HAN_WITH_BOPOMOFO = 172,
|
|
JAMO = 173,
|
|
SYMBOLS_EMOJI = 174,
|
|
|
|
NUM_SCRIPT_CODES = 175,
|
|
|
|
INVALID = -1
|
|
};
|
|
} // namespace unicode
|
|
} // namespace mozilla
|
|
|
|
#endif
|
|
/*
|
|
* * * * * This file contains MACHINE-GENERATED DATA, do not edit! * * * * *
|
|
*/
|