ruby/utf8.c

3765 строки
71 KiB
C

/**********************************************************************
utf8.c - Oniguruma (regular expression library)
**********************************************************************/
/*-
* Copyright (c) 2002-2006 K.Kosako <sndgk393 AT ybb DOT ne DOT jp>
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include "regenc.h"
#define USE_INVALID_CODE_SCHEME
#ifdef USE_INVALID_CODE_SCHEME
/* virtual codepoint values for invalid encoding byte 0xfe and 0xff */
#define INVALID_CODE_FE 0xfffffffe
#define INVALID_CODE_FF 0xffffffff
#define VALID_CODE_LIMIT 0x7fffffff
#endif
#define utf8_islead(c) ((UChar )((c) & 0xc0) != 0x80)
static const int EncLen_UTF8[] = {
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6, 1, 1
};
static int
utf8_mbc_enc_len(const UChar* p)
{
return EncLen_UTF8[*p];
}
static int
utf8_is_mbc_newline(const UChar* p, const UChar* end)
{
if (p < end) {
if (*p == 0x0a) return 1;
#ifdef USE_UNICODE_ALL_LINE_TERMINATORS
if (*p == 0x0d) return 1;
if (p + 1 < end) {
if (*(p+1) == 0x85 && *p == 0xc2) /* U+0085 */
return 1;
if (p + 2 < end) {
if ((*(p+2) == 0xa8 || *(p+2) == 0xa9)
&& *(p+1) == 0x80 && *p == 0xe2) /* U+2028, U+2029 */
return 1;
}
}
#endif
}
return 0;
}
static OnigCodePoint
utf8_mbc_to_code(const UChar* p, const UChar* end)
{
int c, len;
OnigCodePoint n;
len = enc_len(ONIG_ENCODING_UTF8, p);
c = *p++;
if (len > 1) {
len--;
n = c & ((1 << (6 - len)) - 1);
while (len--) {
c = *p++;
n = (n << 6) | (c & ((1 << 6) - 1));
}
return n;
}
else {
#ifdef USE_INVALID_CODE_SCHEME
if (c > 0xfd) {
return ((c == 0xfe) ? INVALID_CODE_FE : INVALID_CODE_FF);
}
#endif
return (OnigCodePoint )c;
}
}
static int
utf8_code_to_mbclen(OnigCodePoint code)
{
if ((code & 0xffffff80) == 0) return 1;
else if ((code & 0xfffff800) == 0) {
if (code <= 0xff && code >= 0xfe)
return 1;
return 2;
}
else if ((code & 0xffff0000) == 0) return 3;
else if ((code & 0xffe00000) == 0) return 4;
else if ((code & 0xfc000000) == 0) return 5;
else if ((code & 0x80000000) == 0) return 6;
#ifdef USE_INVALID_CODE_SCHEME
else if (code == INVALID_CODE_FE) return 1;
else if (code == INVALID_CODE_FF) return 1;
#endif
else
return ONIGENCERR_TOO_BIG_WIDE_CHAR_VALUE;
}
#if 0
static int
utf8_code_to_mbc_first(OnigCodePoint code)
{
if ((code & 0xffffff80) == 0)
return code;
else {
if ((code & 0xfffff800) == 0)
return ((code>>6)& 0x1f) | 0xc0;
else if ((code & 0xffff0000) == 0)
return ((code>>12) & 0x0f) | 0xe0;
else if ((code & 0xffe00000) == 0)
return ((code>>18) & 0x07) | 0xf0;
else if ((code & 0xfc000000) == 0)
return ((code>>24) & 0x03) | 0xf8;
else if ((code & 0x80000000) == 0)
return ((code>>30) & 0x01) | 0xfc;
else {
return ONIGENCERR_TOO_BIG_WIDE_CHAR_VALUE;
}
}
}
#endif
static int
utf8_code_to_mbc(OnigCodePoint code, UChar *buf)
{
#define UTF8_TRAILS(code, shift) (UChar )((((code) >> (shift)) & 0x3f) | 0x80)
#define UTF8_TRAIL0(code) (UChar )(((code) & 0x3f) | 0x80)
if ((code & 0xffffff80) == 0) {
*buf = (UChar )code;
return 1;
}
else {
UChar *p = buf;
if ((code & 0xfffff800) == 0) {
*p++ = (UChar )(((code>>6)& 0x1f) | 0xc0);
}
else if ((code & 0xffff0000) == 0) {
*p++ = (UChar )(((code>>12) & 0x0f) | 0xe0);
*p++ = UTF8_TRAILS(code, 6);
}
else if ((code & 0xffe00000) == 0) {
*p++ = (UChar )(((code>>18) & 0x07) | 0xf0);
*p++ = UTF8_TRAILS(code, 12);
*p++ = UTF8_TRAILS(code, 6);
}
else if ((code & 0xfc000000) == 0) {
*p++ = (UChar )(((code>>24) & 0x03) | 0xf8);
*p++ = UTF8_TRAILS(code, 18);
*p++ = UTF8_TRAILS(code, 12);
*p++ = UTF8_TRAILS(code, 6);
}
else if ((code & 0x80000000) == 0) {
*p++ = (UChar )(((code>>30) & 0x01) | 0xfc);
*p++ = UTF8_TRAILS(code, 24);
*p++ = UTF8_TRAILS(code, 18);
*p++ = UTF8_TRAILS(code, 12);
*p++ = UTF8_TRAILS(code, 6);
}
#ifdef USE_INVALID_CODE_SCHEME
else if (code == INVALID_CODE_FE) {
*p = 0xfe;
return 1;
}
else if (code == INVALID_CODE_FF) {
*p = 0xff;
return 1;
}
#endif
else {
return ONIGENCERR_TOO_BIG_WIDE_CHAR_VALUE;
}
*p++ = UTF8_TRAIL0(code);
return p - buf;
}
}
static int
utf8_mbc_to_normalize(OnigAmbigType flag, const UChar** pp, const UChar* end, UChar* lower)
{
const UChar* p = *pp;
if (ONIGENC_IS_MBC_ASCII(p)) {
if (end > p + 1 &&
(flag & ONIGENC_AMBIGUOUS_MATCH_COMPOUND) != 0 &&
((*p == 's' && *(p+1) == 's') ||
((flag & ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE) != 0 &&
(*p == 'S' && *(p+1) == 'S')))) {
*lower++ = '\303';
*lower = '\237';
(*pp) += 2;
return 2;
}
if ((flag & ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE) != 0) {
*lower = ONIGENC_ASCII_CODE_TO_LOWER_CASE(*p);
}
else {
*lower = *p;
}
(*pp)++;
return 1; /* return byte length of converted char to lower */
}
else {
int len;
if (*p == 195) { /* 195 == '\303' */
int c = *(p + 1);
if (c >= 128) {
if (c <= (UChar )'\236' && /* upper */
(flag & ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE) != 0) {
if (c != (UChar )'\227') {
*lower++ = *p;
*lower = (UChar )(c + 32);
(*pp) += 2;
return 2;
}
}
#if 0
else if (c == (UChar )'\237' &&
(flag & ONIGENC_AMBIGUOUS_MATCH_COMPOUND) != 0) {
*lower++ = '\303';
*lower = '\237';
(*pp) += 2;
return 2;
}
#endif
}
}
len = enc_len(ONIG_ENCODING_UTF8, p);
if (lower != p) {
int i;
for (i = 0; i < len; i++) {
*lower++ = *p++;
}
}
(*pp) += len;
return len; /* return byte length of converted char to lower */
}
}
static int
utf8_is_mbc_ambiguous(OnigAmbigType flag, const UChar** pp, const UChar* end)
{
const UChar* p = *pp;
if (ONIGENC_IS_MBC_ASCII(p)) {
if (end > p + 1 &&
(flag & ONIGENC_AMBIGUOUS_MATCH_COMPOUND) != 0 &&
((*p == 's' && *(p+1) == 's') ||
((flag & ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE) != 0 &&
(*p == 'S' && *(p+1) == 'S')))) {
(*pp) += 2;
return TRUE;
}
(*pp)++;
if ((flag & ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE) != 0) {
return ONIGENC_IS_ASCII_CODE_CASE_AMBIG(*p);
}
}
else {
(*pp) += enc_len(ONIG_ENCODING_UTF8, p);
if (*p == 195) { /* 195 == '\303' */
int c = *(p + 1);
if (c >= 128) {
if ((flag & ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE) != 0) {
if (c <= (UChar )'\236') { /* upper */
if (c == (UChar )'\227') return FALSE;
return TRUE;
}
else if (c >= (UChar )'\240' && c <= (UChar )'\276') { /* lower */
if (c == (UChar )'\267') return FALSE;
return TRUE;
}
}
else if (c == (UChar )'\237' &&
(flag & ONIGENC_AMBIGUOUS_MATCH_COMPOUND) != 0) {
return TRUE;
}
}
}
}
return FALSE;
}
static const OnigCodePoint EmptyRange[] = { 0 };
static const OnigCodePoint SBAlnum[] = {
3,
0x0030, 0x0039,
0x0041, 0x005a,
0x0061, 0x007a
};
static const OnigCodePoint MBAlnum[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
411,
#else
6,
#endif
0x00aa, 0x00aa,
0x00b5, 0x00b5,
0x00ba, 0x00ba,
0x00c0, 0x00d6,
0x00d8, 0x00f6,
0x00f8, 0x0236
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0250, 0x02c1,
0x02c6, 0x02d1,
0x02e0, 0x02e4,
0x02ee, 0x02ee,
0x0300, 0x0357,
0x035d, 0x036f,
0x037a, 0x037a,
0x0386, 0x0386,
0x0388, 0x038a,
0x038c, 0x038c,
0x038e, 0x03a1,
0x03a3, 0x03ce,
0x03d0, 0x03f5,
0x03f7, 0x03fb,
0x0400, 0x0481,
0x0483, 0x0486,
0x0488, 0x04ce,
0x04d0, 0x04f5,
0x04f8, 0x04f9,
0x0500, 0x050f,
0x0531, 0x0556,
0x0559, 0x0559,
0x0561, 0x0587,
0x0591, 0x05a1,
0x05a3, 0x05b9,
0x05bb, 0x05bd,
0x05bf, 0x05bf,
0x05c1, 0x05c2,
0x05c4, 0x05c4,
0x05d0, 0x05ea,
0x05f0, 0x05f2,
0x0610, 0x0615,
0x0621, 0x063a,
0x0640, 0x0658,
0x0660, 0x0669,
0x066e, 0x06d3,
0x06d5, 0x06dc,
0x06de, 0x06e8,
0x06ea, 0x06fc,
0x06ff, 0x06ff,
0x0710, 0x074a,
0x074d, 0x074f,
0x0780, 0x07b1,
0x0901, 0x0939,
0x093c, 0x094d,
0x0950, 0x0954,
0x0958, 0x0963,
0x0966, 0x096f,
0x0981, 0x0983,
0x0985, 0x098c,
0x098f, 0x0990,
0x0993, 0x09a8,
0x09aa, 0x09b0,
0x09b2, 0x09b2,
0x09b6, 0x09b9,
0x09bc, 0x09c4,
0x09c7, 0x09c8,
0x09cb, 0x09cd,
0x09d7, 0x09d7,
0x09dc, 0x09dd,
0x09df, 0x09e3,
0x09e6, 0x09f1,
0x0a01, 0x0a03,
0x0a05, 0x0a0a,
0x0a0f, 0x0a10,
0x0a13, 0x0a28,
0x0a2a, 0x0a30,
0x0a32, 0x0a33,
0x0a35, 0x0a36,
0x0a38, 0x0a39,
0x0a3c, 0x0a3c,
0x0a3e, 0x0a42,
0x0a47, 0x0a48,
0x0a4b, 0x0a4d,
0x0a59, 0x0a5c,
0x0a5e, 0x0a5e,
0x0a66, 0x0a74,
0x0a81, 0x0a83,
0x0a85, 0x0a8d,
0x0a8f, 0x0a91,
0x0a93, 0x0aa8,
0x0aaa, 0x0ab0,
0x0ab2, 0x0ab3,
0x0ab5, 0x0ab9,
0x0abc, 0x0ac5,
0x0ac7, 0x0ac9,
0x0acb, 0x0acd,
0x0ad0, 0x0ad0,
0x0ae0, 0x0ae3,
0x0ae6, 0x0aef,
0x0b01, 0x0b03,
0x0b05, 0x0b0c,
0x0b0f, 0x0b10,
0x0b13, 0x0b28,
0x0b2a, 0x0b30,
0x0b32, 0x0b33,
0x0b35, 0x0b39,
0x0b3c, 0x0b43,
0x0b47, 0x0b48,
0x0b4b, 0x0b4d,
0x0b56, 0x0b57,
0x0b5c, 0x0b5d,
0x0b5f, 0x0b61,
0x0b66, 0x0b6f,
0x0b71, 0x0b71,
0x0b82, 0x0b83,
0x0b85, 0x0b8a,
0x0b8e, 0x0b90,
0x0b92, 0x0b95,
0x0b99, 0x0b9a,
0x0b9c, 0x0b9c,
0x0b9e, 0x0b9f,
0x0ba3, 0x0ba4,
0x0ba8, 0x0baa,
0x0bae, 0x0bb5,
0x0bb7, 0x0bb9,
0x0bbe, 0x0bc2,
0x0bc6, 0x0bc8,
0x0bca, 0x0bcd,
0x0bd7, 0x0bd7,
0x0be7, 0x0bef,
0x0c01, 0x0c03,
0x0c05, 0x0c0c,
0x0c0e, 0x0c10,
0x0c12, 0x0c28,
0x0c2a, 0x0c33,
0x0c35, 0x0c39,
0x0c3e, 0x0c44,
0x0c46, 0x0c48,
0x0c4a, 0x0c4d,
0x0c55, 0x0c56,
0x0c60, 0x0c61,
0x0c66, 0x0c6f,
0x0c82, 0x0c83,
0x0c85, 0x0c8c,
0x0c8e, 0x0c90,
0x0c92, 0x0ca8,
0x0caa, 0x0cb3,
0x0cb5, 0x0cb9,
0x0cbc, 0x0cc4,
0x0cc6, 0x0cc8,
0x0cca, 0x0ccd,
0x0cd5, 0x0cd6,
0x0cde, 0x0cde,
0x0ce0, 0x0ce1,
0x0ce6, 0x0cef,
0x0d02, 0x0d03,
0x0d05, 0x0d0c,
0x0d0e, 0x0d10,
0x0d12, 0x0d28,
0x0d2a, 0x0d39,
0x0d3e, 0x0d43,
0x0d46, 0x0d48,
0x0d4a, 0x0d4d,
0x0d57, 0x0d57,
0x0d60, 0x0d61,
0x0d66, 0x0d6f,
0x0d82, 0x0d83,
0x0d85, 0x0d96,
0x0d9a, 0x0db1,
0x0db3, 0x0dbb,
0x0dbd, 0x0dbd,
0x0dc0, 0x0dc6,
0x0dca, 0x0dca,
0x0dcf, 0x0dd4,
0x0dd6, 0x0dd6,
0x0dd8, 0x0ddf,
0x0df2, 0x0df3,
0x0e01, 0x0e3a,
0x0e40, 0x0e4e,
0x0e50, 0x0e59,
0x0e81, 0x0e82,
0x0e84, 0x0e84,
0x0e87, 0x0e88,
0x0e8a, 0x0e8a,
0x0e8d, 0x0e8d,
0x0e94, 0x0e97,
0x0e99, 0x0e9f,
0x0ea1, 0x0ea3,
0x0ea5, 0x0ea5,
0x0ea7, 0x0ea7,
0x0eaa, 0x0eab,
0x0ead, 0x0eb9,
0x0ebb, 0x0ebd,
0x0ec0, 0x0ec4,
0x0ec6, 0x0ec6,
0x0ec8, 0x0ecd,
0x0ed0, 0x0ed9,
0x0edc, 0x0edd,
0x0f00, 0x0f00,
0x0f18, 0x0f19,
0x0f20, 0x0f29,
0x0f35, 0x0f35,
0x0f37, 0x0f37,
0x0f39, 0x0f39,
0x0f3e, 0x0f47,
0x0f49, 0x0f6a,
0x0f71, 0x0f84,
0x0f86, 0x0f8b,
0x0f90, 0x0f97,
0x0f99, 0x0fbc,
0x0fc6, 0x0fc6,
0x1000, 0x1021,
0x1023, 0x1027,
0x1029, 0x102a,
0x102c, 0x1032,
0x1036, 0x1039,
0x1040, 0x1049,
0x1050, 0x1059,
0x10a0, 0x10c5,
0x10d0, 0x10f8,
0x1100, 0x1159,
0x115f, 0x11a2,
0x11a8, 0x11f9,
0x1200, 0x1206,
0x1208, 0x1246,
0x1248, 0x1248,
0x124a, 0x124d,
0x1250, 0x1256,
0x1258, 0x1258,
0x125a, 0x125d,
0x1260, 0x1286,
0x1288, 0x1288,
0x128a, 0x128d,
0x1290, 0x12ae,
0x12b0, 0x12b0,
0x12b2, 0x12b5,
0x12b8, 0x12be,
0x12c0, 0x12c0,
0x12c2, 0x12c5,
0x12c8, 0x12ce,
0x12d0, 0x12d6,
0x12d8, 0x12ee,
0x12f0, 0x130e,
0x1310, 0x1310,
0x1312, 0x1315,
0x1318, 0x131e,
0x1320, 0x1346,
0x1348, 0x135a,
0x1369, 0x1371,
0x13a0, 0x13f4,
0x1401, 0x166c,
0x166f, 0x1676,
0x1681, 0x169a,
0x16a0, 0x16ea,
0x1700, 0x170c,
0x170e, 0x1714,
0x1720, 0x1734,
0x1740, 0x1753,
0x1760, 0x176c,
0x176e, 0x1770,
0x1772, 0x1773,
0x1780, 0x17b3,
0x17b6, 0x17d3,
0x17d7, 0x17d7,
0x17dc, 0x17dd,
0x17e0, 0x17e9,
0x180b, 0x180d,
0x1810, 0x1819,
0x1820, 0x1877,
0x1880, 0x18a9,
0x1900, 0x191c,
0x1920, 0x192b,
0x1930, 0x193b,
0x1946, 0x196d,
0x1970, 0x1974,
0x1d00, 0x1d6b,
0x1e00, 0x1e9b,
0x1ea0, 0x1ef9,
0x1f00, 0x1f15,
0x1f18, 0x1f1d,
0x1f20, 0x1f45,
0x1f48, 0x1f4d,
0x1f50, 0x1f57,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f7d,
0x1f80, 0x1fb4,
0x1fb6, 0x1fbc,
0x1fbe, 0x1fbe,
0x1fc2, 0x1fc4,
0x1fc6, 0x1fcc,
0x1fd0, 0x1fd3,
0x1fd6, 0x1fdb,
0x1fe0, 0x1fec,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ffc,
0x2071, 0x2071,
0x207f, 0x207f,
0x20d0, 0x20ea,
0x2102, 0x2102,
0x2107, 0x2107,
0x210a, 0x2113,
0x2115, 0x2115,
0x2119, 0x211d,
0x2124, 0x2124,
0x2126, 0x2126,
0x2128, 0x2128,
0x212a, 0x212d,
0x212f, 0x2131,
0x2133, 0x2139,
0x213d, 0x213f,
0x2145, 0x2149,
0x3005, 0x3006,
0x302a, 0x302f,
0x3031, 0x3035,
0x303b, 0x303c,
0x3041, 0x3096,
0x3099, 0x309a,
0x309d, 0x309f,
0x30a1, 0x30fa,
0x30fc, 0x30ff,
0x3105, 0x312c,
0x3131, 0x318e,
0x31a0, 0x31b7,
0x31f0, 0x31ff,
0x3400, 0x4db5,
0x4e00, 0x9fa5,
0xa000, 0xa48c,
0xac00, 0xd7a3,
0xf900, 0xfa2d,
0xfa30, 0xfa6a,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xfb1d, 0xfb28,
0xfb2a, 0xfb36,
0xfb38, 0xfb3c,
0xfb3e, 0xfb3e,
0xfb40, 0xfb41,
0xfb43, 0xfb44,
0xfb46, 0xfbb1,
0xfbd3, 0xfd3d,
0xfd50, 0xfd8f,
0xfd92, 0xfdc7,
0xfdf0, 0xfdfb,
0xfe00, 0xfe0f,
0xfe20, 0xfe23,
0xfe70, 0xfe74,
0xfe76, 0xfefc,
0xff10, 0xff19,
0xff21, 0xff3a,
0xff41, 0xff5a,
0xff66, 0xffbe,
0xffc2, 0xffc7,
0xffca, 0xffcf,
0xffd2, 0xffd7,
0xffda, 0xffdc,
0x10000, 0x1000b,
0x1000d, 0x10026,
0x10028, 0x1003a,
0x1003c, 0x1003d,
0x1003f, 0x1004d,
0x10050, 0x1005d,
0x10080, 0x100fa,
0x10300, 0x1031e,
0x10330, 0x10349,
0x10380, 0x1039d,
0x10400, 0x1049d,
0x104a0, 0x104a9,
0x10800, 0x10805,
0x10808, 0x10808,
0x1080a, 0x10835,
0x10837, 0x10838,
0x1083c, 0x1083c,
0x1083f, 0x1083f,
0x1d165, 0x1d169,
0x1d16d, 0x1d172,
0x1d17b, 0x1d182,
0x1d185, 0x1d18b,
0x1d1aa, 0x1d1ad,
0x1d400, 0x1d454,
0x1d456, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d51e, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d552, 0x1d6a3,
0x1d6a8, 0x1d6c0,
0x1d6c2, 0x1d6da,
0x1d6dc, 0x1d6fa,
0x1d6fc, 0x1d714,
0x1d716, 0x1d734,
0x1d736, 0x1d74e,
0x1d750, 0x1d76e,
0x1d770, 0x1d788,
0x1d78a, 0x1d7a8,
0x1d7aa, 0x1d7c2,
0x1d7c4, 0x1d7c9,
0x1d7ce, 0x1d7ff,
0x20000, 0x2a6d6,
0x2f800, 0x2fa1d,
0xe0100, 0xe01ef
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBAlnum */
static const OnigCodePoint SBAlpha[] = {
2,
0x0041, 0x005a,
0x0061, 0x007a
};
static const OnigCodePoint MBAlpha[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
394,
#else
6,
#endif
0x00aa, 0x00aa,
0x00b5, 0x00b5,
0x00ba, 0x00ba,
0x00c0, 0x00d6,
0x00d8, 0x00f6,
0x00f8, 0x0236
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0250, 0x02c1,
0x02c6, 0x02d1,
0x02e0, 0x02e4,
0x02ee, 0x02ee,
0x0300, 0x0357,
0x035d, 0x036f,
0x037a, 0x037a,
0x0386, 0x0386,
0x0388, 0x038a,
0x038c, 0x038c,
0x038e, 0x03a1,
0x03a3, 0x03ce,
0x03d0, 0x03f5,
0x03f7, 0x03fb,
0x0400, 0x0481,
0x0483, 0x0486,
0x0488, 0x04ce,
0x04d0, 0x04f5,
0x04f8, 0x04f9,
0x0500, 0x050f,
0x0531, 0x0556,
0x0559, 0x0559,
0x0561, 0x0587,
0x0591, 0x05a1,
0x05a3, 0x05b9,
0x05bb, 0x05bd,
0x05bf, 0x05bf,
0x05c1, 0x05c2,
0x05c4, 0x05c4,
0x05d0, 0x05ea,
0x05f0, 0x05f2,
0x0610, 0x0615,
0x0621, 0x063a,
0x0640, 0x0658,
0x066e, 0x06d3,
0x06d5, 0x06dc,
0x06de, 0x06e8,
0x06ea, 0x06ef,
0x06fa, 0x06fc,
0x06ff, 0x06ff,
0x0710, 0x074a,
0x074d, 0x074f,
0x0780, 0x07b1,
0x0901, 0x0939,
0x093c, 0x094d,
0x0950, 0x0954,
0x0958, 0x0963,
0x0981, 0x0983,
0x0985, 0x098c,
0x098f, 0x0990,
0x0993, 0x09a8,
0x09aa, 0x09b0,
0x09b2, 0x09b2,
0x09b6, 0x09b9,
0x09bc, 0x09c4,
0x09c7, 0x09c8,
0x09cb, 0x09cd,
0x09d7, 0x09d7,
0x09dc, 0x09dd,
0x09df, 0x09e3,
0x09f0, 0x09f1,
0x0a01, 0x0a03,
0x0a05, 0x0a0a,
0x0a0f, 0x0a10,
0x0a13, 0x0a28,
0x0a2a, 0x0a30,
0x0a32, 0x0a33,
0x0a35, 0x0a36,
0x0a38, 0x0a39,
0x0a3c, 0x0a3c,
0x0a3e, 0x0a42,
0x0a47, 0x0a48,
0x0a4b, 0x0a4d,
0x0a59, 0x0a5c,
0x0a5e, 0x0a5e,
0x0a70, 0x0a74,
0x0a81, 0x0a83,
0x0a85, 0x0a8d,
0x0a8f, 0x0a91,
0x0a93, 0x0aa8,
0x0aaa, 0x0ab0,
0x0ab2, 0x0ab3,
0x0ab5, 0x0ab9,
0x0abc, 0x0ac5,
0x0ac7, 0x0ac9,
0x0acb, 0x0acd,
0x0ad0, 0x0ad0,
0x0ae0, 0x0ae3,
0x0b01, 0x0b03,
0x0b05, 0x0b0c,
0x0b0f, 0x0b10,
0x0b13, 0x0b28,
0x0b2a, 0x0b30,
0x0b32, 0x0b33,
0x0b35, 0x0b39,
0x0b3c, 0x0b43,
0x0b47, 0x0b48,
0x0b4b, 0x0b4d,
0x0b56, 0x0b57,
0x0b5c, 0x0b5d,
0x0b5f, 0x0b61,
0x0b71, 0x0b71,
0x0b82, 0x0b83,
0x0b85, 0x0b8a,
0x0b8e, 0x0b90,
0x0b92, 0x0b95,
0x0b99, 0x0b9a,
0x0b9c, 0x0b9c,
0x0b9e, 0x0b9f,
0x0ba3, 0x0ba4,
0x0ba8, 0x0baa,
0x0bae, 0x0bb5,
0x0bb7, 0x0bb9,
0x0bbe, 0x0bc2,
0x0bc6, 0x0bc8,
0x0bca, 0x0bcd,
0x0bd7, 0x0bd7,
0x0c01, 0x0c03,
0x0c05, 0x0c0c,
0x0c0e, 0x0c10,
0x0c12, 0x0c28,
0x0c2a, 0x0c33,
0x0c35, 0x0c39,
0x0c3e, 0x0c44,
0x0c46, 0x0c48,
0x0c4a, 0x0c4d,
0x0c55, 0x0c56,
0x0c60, 0x0c61,
0x0c82, 0x0c83,
0x0c85, 0x0c8c,
0x0c8e, 0x0c90,
0x0c92, 0x0ca8,
0x0caa, 0x0cb3,
0x0cb5, 0x0cb9,
0x0cbc, 0x0cc4,
0x0cc6, 0x0cc8,
0x0cca, 0x0ccd,
0x0cd5, 0x0cd6,
0x0cde, 0x0cde,
0x0ce0, 0x0ce1,
0x0d02, 0x0d03,
0x0d05, 0x0d0c,
0x0d0e, 0x0d10,
0x0d12, 0x0d28,
0x0d2a, 0x0d39,
0x0d3e, 0x0d43,
0x0d46, 0x0d48,
0x0d4a, 0x0d4d,
0x0d57, 0x0d57,
0x0d60, 0x0d61,
0x0d82, 0x0d83,
0x0d85, 0x0d96,
0x0d9a, 0x0db1,
0x0db3, 0x0dbb,
0x0dbd, 0x0dbd,
0x0dc0, 0x0dc6,
0x0dca, 0x0dca,
0x0dcf, 0x0dd4,
0x0dd6, 0x0dd6,
0x0dd8, 0x0ddf,
0x0df2, 0x0df3,
0x0e01, 0x0e3a,
0x0e40, 0x0e4e,
0x0e81, 0x0e82,
0x0e84, 0x0e84,
0x0e87, 0x0e88,
0x0e8a, 0x0e8a,
0x0e8d, 0x0e8d,
0x0e94, 0x0e97,
0x0e99, 0x0e9f,
0x0ea1, 0x0ea3,
0x0ea5, 0x0ea5,
0x0ea7, 0x0ea7,
0x0eaa, 0x0eab,
0x0ead, 0x0eb9,
0x0ebb, 0x0ebd,
0x0ec0, 0x0ec4,
0x0ec6, 0x0ec6,
0x0ec8, 0x0ecd,
0x0edc, 0x0edd,
0x0f00, 0x0f00,
0x0f18, 0x0f19,
0x0f35, 0x0f35,
0x0f37, 0x0f37,
0x0f39, 0x0f39,
0x0f3e, 0x0f47,
0x0f49, 0x0f6a,
0x0f71, 0x0f84,
0x0f86, 0x0f8b,
0x0f90, 0x0f97,
0x0f99, 0x0fbc,
0x0fc6, 0x0fc6,
0x1000, 0x1021,
0x1023, 0x1027,
0x1029, 0x102a,
0x102c, 0x1032,
0x1036, 0x1039,
0x1050, 0x1059,
0x10a0, 0x10c5,
0x10d0, 0x10f8,
0x1100, 0x1159,
0x115f, 0x11a2,
0x11a8, 0x11f9,
0x1200, 0x1206,
0x1208, 0x1246,
0x1248, 0x1248,
0x124a, 0x124d,
0x1250, 0x1256,
0x1258, 0x1258,
0x125a, 0x125d,
0x1260, 0x1286,
0x1288, 0x1288,
0x128a, 0x128d,
0x1290, 0x12ae,
0x12b0, 0x12b0,
0x12b2, 0x12b5,
0x12b8, 0x12be,
0x12c0, 0x12c0,
0x12c2, 0x12c5,
0x12c8, 0x12ce,
0x12d0, 0x12d6,
0x12d8, 0x12ee,
0x12f0, 0x130e,
0x1310, 0x1310,
0x1312, 0x1315,
0x1318, 0x131e,
0x1320, 0x1346,
0x1348, 0x135a,
0x13a0, 0x13f4,
0x1401, 0x166c,
0x166f, 0x1676,
0x1681, 0x169a,
0x16a0, 0x16ea,
0x1700, 0x170c,
0x170e, 0x1714,
0x1720, 0x1734,
0x1740, 0x1753,
0x1760, 0x176c,
0x176e, 0x1770,
0x1772, 0x1773,
0x1780, 0x17b3,
0x17b6, 0x17d3,
0x17d7, 0x17d7,
0x17dc, 0x17dd,
0x180b, 0x180d,
0x1820, 0x1877,
0x1880, 0x18a9,
0x1900, 0x191c,
0x1920, 0x192b,
0x1930, 0x193b,
0x1950, 0x196d,
0x1970, 0x1974,
0x1d00, 0x1d6b,
0x1e00, 0x1e9b,
0x1ea0, 0x1ef9,
0x1f00, 0x1f15,
0x1f18, 0x1f1d,
0x1f20, 0x1f45,
0x1f48, 0x1f4d,
0x1f50, 0x1f57,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f7d,
0x1f80, 0x1fb4,
0x1fb6, 0x1fbc,
0x1fbe, 0x1fbe,
0x1fc2, 0x1fc4,
0x1fc6, 0x1fcc,
0x1fd0, 0x1fd3,
0x1fd6, 0x1fdb,
0x1fe0, 0x1fec,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ffc,
0x2071, 0x2071,
0x207f, 0x207f,
0x20d0, 0x20ea,
0x2102, 0x2102,
0x2107, 0x2107,
0x210a, 0x2113,
0x2115, 0x2115,
0x2119, 0x211d,
0x2124, 0x2124,
0x2126, 0x2126,
0x2128, 0x2128,
0x212a, 0x212d,
0x212f, 0x2131,
0x2133, 0x2139,
0x213d, 0x213f,
0x2145, 0x2149,
0x3005, 0x3006,
0x302a, 0x302f,
0x3031, 0x3035,
0x303b, 0x303c,
0x3041, 0x3096,
0x3099, 0x309a,
0x309d, 0x309f,
0x30a1, 0x30fa,
0x30fc, 0x30ff,
0x3105, 0x312c,
0x3131, 0x318e,
0x31a0, 0x31b7,
0x31f0, 0x31ff,
0x3400, 0x4db5,
0x4e00, 0x9fa5,
0xa000, 0xa48c,
0xac00, 0xd7a3,
0xf900, 0xfa2d,
0xfa30, 0xfa6a,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xfb1d, 0xfb28,
0xfb2a, 0xfb36,
0xfb38, 0xfb3c,
0xfb3e, 0xfb3e,
0xfb40, 0xfb41,
0xfb43, 0xfb44,
0xfb46, 0xfbb1,
0xfbd3, 0xfd3d,
0xfd50, 0xfd8f,
0xfd92, 0xfdc7,
0xfdf0, 0xfdfb,
0xfe00, 0xfe0f,
0xfe20, 0xfe23,
0xfe70, 0xfe74,
0xfe76, 0xfefc,
0xff21, 0xff3a,
0xff41, 0xff5a,
0xff66, 0xffbe,
0xffc2, 0xffc7,
0xffca, 0xffcf,
0xffd2, 0xffd7,
0xffda, 0xffdc,
0x10000, 0x1000b,
0x1000d, 0x10026,
0x10028, 0x1003a,
0x1003c, 0x1003d,
0x1003f, 0x1004d,
0x10050, 0x1005d,
0x10080, 0x100fa,
0x10300, 0x1031e,
0x10330, 0x10349,
0x10380, 0x1039d,
0x10400, 0x1049d,
0x10800, 0x10805,
0x10808, 0x10808,
0x1080a, 0x10835,
0x10837, 0x10838,
0x1083c, 0x1083c,
0x1083f, 0x1083f,
0x1d165, 0x1d169,
0x1d16d, 0x1d172,
0x1d17b, 0x1d182,
0x1d185, 0x1d18b,
0x1d1aa, 0x1d1ad,
0x1d400, 0x1d454,
0x1d456, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d51e, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d552, 0x1d6a3,
0x1d6a8, 0x1d6c0,
0x1d6c2, 0x1d6da,
0x1d6dc, 0x1d6fa,
0x1d6fc, 0x1d714,
0x1d716, 0x1d734,
0x1d736, 0x1d74e,
0x1d750, 0x1d76e,
0x1d770, 0x1d788,
0x1d78a, 0x1d7a8,
0x1d7aa, 0x1d7c2,
0x1d7c4, 0x1d7c9,
0x20000, 0x2a6d6,
0x2f800, 0x2fa1d,
0xe0100, 0xe01ef
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBAlpha */
static const OnigCodePoint SBBlank[] = {
2,
0x0009, 0x0009,
0x0020, 0x0020
};
static const OnigCodePoint MBBlank[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
7,
#else
1,
#endif
0x00a0, 0x00a0
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x1680, 0x1680,
0x180e, 0x180e,
0x2000, 0x200a,
0x202f, 0x202f,
0x205f, 0x205f,
0x3000, 0x3000
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBBlank */
static const OnigCodePoint SBCntrl[] = {
2,
0x0000, 0x001f,
0x007f, 0x007f
};
static const OnigCodePoint MBCntrl[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
18,
#else
2,
#endif
0x0080, 0x009f,
0x00ad, 0x00ad
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0600, 0x0603,
0x06dd, 0x06dd,
0x070f, 0x070f,
0x17b4, 0x17b5,
0x200b, 0x200f,
0x202a, 0x202e,
0x2060, 0x2063,
0x206a, 0x206f,
0xd800, 0xf8ff,
0xfeff, 0xfeff,
0xfff9, 0xfffb,
0x1d173, 0x1d17a,
0xe0001, 0xe0001,
0xe0020, 0xe007f,
0xf0000, 0xffffd,
0x100000, 0x10fffd
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBCntrl */
static const OnigCodePoint SBDigit[] = {
1,
0x0030, 0x0039
};
static const OnigCodePoint MBDigit[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
22,
#else
0
#endif
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
0x0660, 0x0669,
0x06f0, 0x06f9,
0x0966, 0x096f,
0x09e6, 0x09ef,
0x0a66, 0x0a6f,
0x0ae6, 0x0aef,
0x0b66, 0x0b6f,
0x0be7, 0x0bef,
0x0c66, 0x0c6f,
0x0ce6, 0x0cef,
0x0d66, 0x0d6f,
0x0e50, 0x0e59,
0x0ed0, 0x0ed9,
0x0f20, 0x0f29,
0x1040, 0x1049,
0x1369, 0x1371,
0x17e0, 0x17e9,
0x1810, 0x1819,
0x1946, 0x194f,
0xff10, 0xff19,
0x104a0, 0x104a9,
0x1d7ce, 0x1d7ff
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBDigit */
static const OnigCodePoint SBGraph[] = {
1,
0x0021, 0x007e
};
static const OnigCodePoint MBGraph[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
404,
#else
1,
#endif
0x00a1, 0x0236
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0250, 0x0357,
0x035d, 0x036f,
0x0374, 0x0375,
0x037a, 0x037a,
0x037e, 0x037e,
0x0384, 0x038a,
0x038c, 0x038c,
0x038e, 0x03a1,
0x03a3, 0x03ce,
0x03d0, 0x03fb,
0x0400, 0x0486,
0x0488, 0x04ce,
0x04d0, 0x04f5,
0x04f8, 0x04f9,
0x0500, 0x050f,
0x0531, 0x0556,
0x0559, 0x055f,
0x0561, 0x0587,
0x0589, 0x058a,
0x0591, 0x05a1,
0x05a3, 0x05b9,
0x05bb, 0x05c4,
0x05d0, 0x05ea,
0x05f0, 0x05f4,
0x0600, 0x0603,
0x060c, 0x0615,
0x061b, 0x061b,
0x061f, 0x061f,
0x0621, 0x063a,
0x0640, 0x0658,
0x0660, 0x070d,
0x070f, 0x074a,
0x074d, 0x074f,
0x0780, 0x07b1,
0x0901, 0x0939,
0x093c, 0x094d,
0x0950, 0x0954,
0x0958, 0x0970,
0x0981, 0x0983,
0x0985, 0x098c,
0x098f, 0x0990,
0x0993, 0x09a8,
0x09aa, 0x09b0,
0x09b2, 0x09b2,
0x09b6, 0x09b9,
0x09bc, 0x09c4,
0x09c7, 0x09c8,
0x09cb, 0x09cd,
0x09d7, 0x09d7,
0x09dc, 0x09dd,
0x09df, 0x09e3,
0x09e6, 0x09fa,
0x0a01, 0x0a03,
0x0a05, 0x0a0a,
0x0a0f, 0x0a10,
0x0a13, 0x0a28,
0x0a2a, 0x0a30,
0x0a32, 0x0a33,
0x0a35, 0x0a36,
0x0a38, 0x0a39,
0x0a3c, 0x0a3c,
0x0a3e, 0x0a42,
0x0a47, 0x0a48,
0x0a4b, 0x0a4d,
0x0a59, 0x0a5c,
0x0a5e, 0x0a5e,
0x0a66, 0x0a74,
0x0a81, 0x0a83,
0x0a85, 0x0a8d,
0x0a8f, 0x0a91,
0x0a93, 0x0aa8,
0x0aaa, 0x0ab0,
0x0ab2, 0x0ab3,
0x0ab5, 0x0ab9,
0x0abc, 0x0ac5,
0x0ac7, 0x0ac9,
0x0acb, 0x0acd,
0x0ad0, 0x0ad0,
0x0ae0, 0x0ae3,
0x0ae6, 0x0aef,
0x0af1, 0x0af1,
0x0b01, 0x0b03,
0x0b05, 0x0b0c,
0x0b0f, 0x0b10,
0x0b13, 0x0b28,
0x0b2a, 0x0b30,
0x0b32, 0x0b33,
0x0b35, 0x0b39,
0x0b3c, 0x0b43,
0x0b47, 0x0b48,
0x0b4b, 0x0b4d,
0x0b56, 0x0b57,
0x0b5c, 0x0b5d,
0x0b5f, 0x0b61,
0x0b66, 0x0b71,
0x0b82, 0x0b83,
0x0b85, 0x0b8a,
0x0b8e, 0x0b90,
0x0b92, 0x0b95,
0x0b99, 0x0b9a,
0x0b9c, 0x0b9c,
0x0b9e, 0x0b9f,
0x0ba3, 0x0ba4,
0x0ba8, 0x0baa,
0x0bae, 0x0bb5,
0x0bb7, 0x0bb9,
0x0bbe, 0x0bc2,
0x0bc6, 0x0bc8,
0x0bca, 0x0bcd,
0x0bd7, 0x0bd7,
0x0be7, 0x0bfa,
0x0c01, 0x0c03,
0x0c05, 0x0c0c,
0x0c0e, 0x0c10,
0x0c12, 0x0c28,
0x0c2a, 0x0c33,
0x0c35, 0x0c39,
0x0c3e, 0x0c44,
0x0c46, 0x0c48,
0x0c4a, 0x0c4d,
0x0c55, 0x0c56,
0x0c60, 0x0c61,
0x0c66, 0x0c6f,
0x0c82, 0x0c83,
0x0c85, 0x0c8c,
0x0c8e, 0x0c90,
0x0c92, 0x0ca8,
0x0caa, 0x0cb3,
0x0cb5, 0x0cb9,
0x0cbc, 0x0cc4,
0x0cc6, 0x0cc8,
0x0cca, 0x0ccd,
0x0cd5, 0x0cd6,
0x0cde, 0x0cde,
0x0ce0, 0x0ce1,
0x0ce6, 0x0cef,
0x0d02, 0x0d03,
0x0d05, 0x0d0c,
0x0d0e, 0x0d10,
0x0d12, 0x0d28,
0x0d2a, 0x0d39,
0x0d3e, 0x0d43,
0x0d46, 0x0d48,
0x0d4a, 0x0d4d,
0x0d57, 0x0d57,
0x0d60, 0x0d61,
0x0d66, 0x0d6f,
0x0d82, 0x0d83,
0x0d85, 0x0d96,
0x0d9a, 0x0db1,
0x0db3, 0x0dbb,
0x0dbd, 0x0dbd,
0x0dc0, 0x0dc6,
0x0dca, 0x0dca,
0x0dcf, 0x0dd4,
0x0dd6, 0x0dd6,
0x0dd8, 0x0ddf,
0x0df2, 0x0df4,
0x0e01, 0x0e3a,
0x0e3f, 0x0e5b,
0x0e81, 0x0e82,
0x0e84, 0x0e84,
0x0e87, 0x0e88,
0x0e8a, 0x0e8a,
0x0e8d, 0x0e8d,
0x0e94, 0x0e97,
0x0e99, 0x0e9f,
0x0ea1, 0x0ea3,
0x0ea5, 0x0ea5,
0x0ea7, 0x0ea7,
0x0eaa, 0x0eab,
0x0ead, 0x0eb9,
0x0ebb, 0x0ebd,
0x0ec0, 0x0ec4,
0x0ec6, 0x0ec6,
0x0ec8, 0x0ecd,
0x0ed0, 0x0ed9,
0x0edc, 0x0edd,
0x0f00, 0x0f47,
0x0f49, 0x0f6a,
0x0f71, 0x0f8b,
0x0f90, 0x0f97,
0x0f99, 0x0fbc,
0x0fbe, 0x0fcc,
0x0fcf, 0x0fcf,
0x1000, 0x1021,
0x1023, 0x1027,
0x1029, 0x102a,
0x102c, 0x1032,
0x1036, 0x1039,
0x1040, 0x1059,
0x10a0, 0x10c5,
0x10d0, 0x10f8,
0x10fb, 0x10fb,
0x1100, 0x1159,
0x115f, 0x11a2,
0x11a8, 0x11f9,
0x1200, 0x1206,
0x1208, 0x1246,
0x1248, 0x1248,
0x124a, 0x124d,
0x1250, 0x1256,
0x1258, 0x1258,
0x125a, 0x125d,
0x1260, 0x1286,
0x1288, 0x1288,
0x128a, 0x128d,
0x1290, 0x12ae,
0x12b0, 0x12b0,
0x12b2, 0x12b5,
0x12b8, 0x12be,
0x12c0, 0x12c0,
0x12c2, 0x12c5,
0x12c8, 0x12ce,
0x12d0, 0x12d6,
0x12d8, 0x12ee,
0x12f0, 0x130e,
0x1310, 0x1310,
0x1312, 0x1315,
0x1318, 0x131e,
0x1320, 0x1346,
0x1348, 0x135a,
0x1361, 0x137c,
0x13a0, 0x13f4,
0x1401, 0x1676,
0x1681, 0x169c,
0x16a0, 0x16f0,
0x1700, 0x170c,
0x170e, 0x1714,
0x1720, 0x1736,
0x1740, 0x1753,
0x1760, 0x176c,
0x176e, 0x1770,
0x1772, 0x1773,
0x1780, 0x17dd,
0x17e0, 0x17e9,
0x17f0, 0x17f9,
0x1800, 0x180d,
0x1810, 0x1819,
0x1820, 0x1877,
0x1880, 0x18a9,
0x1900, 0x191c,
0x1920, 0x192b,
0x1930, 0x193b,
0x1940, 0x1940,
0x1944, 0x196d,
0x1970, 0x1974,
0x19e0, 0x19ff,
0x1d00, 0x1d6b,
0x1e00, 0x1e9b,
0x1ea0, 0x1ef9,
0x1f00, 0x1f15,
0x1f18, 0x1f1d,
0x1f20, 0x1f45,
0x1f48, 0x1f4d,
0x1f50, 0x1f57,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f7d,
0x1f80, 0x1fb4,
0x1fb6, 0x1fc4,
0x1fc6, 0x1fd3,
0x1fd6, 0x1fdb,
0x1fdd, 0x1fef,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ffe,
0x200b, 0x2027,
0x202a, 0x202e,
0x2030, 0x2054,
0x2057, 0x2057,
0x2060, 0x2063,
0x206a, 0x2071,
0x2074, 0x208e,
0x20a0, 0x20b1,
0x20d0, 0x20ea,
0x2100, 0x213b,
0x213d, 0x214b,
0x2153, 0x2183,
0x2190, 0x23d0,
0x2400, 0x2426,
0x2440, 0x244a,
0x2460, 0x2617,
0x2619, 0x267d,
0x2680, 0x2691,
0x26a0, 0x26a1,
0x2701, 0x2704,
0x2706, 0x2709,
0x270c, 0x2727,
0x2729, 0x274b,
0x274d, 0x274d,
0x274f, 0x2752,
0x2756, 0x2756,
0x2758, 0x275e,
0x2761, 0x2794,
0x2798, 0x27af,
0x27b1, 0x27be,
0x27d0, 0x27eb,
0x27f0, 0x2b0d,
0x2e80, 0x2e99,
0x2e9b, 0x2ef3,
0x2f00, 0x2fd5,
0x2ff0, 0x2ffb,
0x3001, 0x303f,
0x3041, 0x3096,
0x3099, 0x30ff,
0x3105, 0x312c,
0x3131, 0x318e,
0x3190, 0x31b7,
0x31f0, 0x321e,
0x3220, 0x3243,
0x3250, 0x327d,
0x327f, 0x32fe,
0x3300, 0x4db5,
0x4dc0, 0x9fa5,
0xa000, 0xa48c,
0xa490, 0xa4c6,
0xac00, 0xd7a3,
0xe000, 0xfa2d,
0xfa30, 0xfa6a,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xfb1d, 0xfb36,
0xfb38, 0xfb3c,
0xfb3e, 0xfb3e,
0xfb40, 0xfb41,
0xfb43, 0xfb44,
0xfb46, 0xfbb1,
0xfbd3, 0xfd3f,
0xfd50, 0xfd8f,
0xfd92, 0xfdc7,
0xfdf0, 0xfdfd,
0xfe00, 0xfe0f,
0xfe20, 0xfe23,
0xfe30, 0xfe52,
0xfe54, 0xfe66,
0xfe68, 0xfe6b,
0xfe70, 0xfe74,
0xfe76, 0xfefc,
0xfeff, 0xfeff,
0xff01, 0xffbe,
0xffc2, 0xffc7,
0xffca, 0xffcf,
0xffd2, 0xffd7,
0xffda, 0xffdc,
0xffe0, 0xffe6,
0xffe8, 0xffee,
0xfff9, 0xfffd,
0x10000, 0x1000b,
0x1000d, 0x10026,
0x10028, 0x1003a,
0x1003c, 0x1003d,
0x1003f, 0x1004d,
0x10050, 0x1005d,
0x10080, 0x100fa,
0x10100, 0x10102,
0x10107, 0x10133,
0x10137, 0x1013f,
0x10300, 0x1031e,
0x10320, 0x10323,
0x10330, 0x1034a,
0x10380, 0x1039d,
0x1039f, 0x1039f,
0x10400, 0x1049d,
0x104a0, 0x104a9,
0x10800, 0x10805,
0x10808, 0x10808,
0x1080a, 0x10835,
0x10837, 0x10838,
0x1083c, 0x1083c,
0x1083f, 0x1083f,
0x1d000, 0x1d0f5,
0x1d100, 0x1d126,
0x1d12a, 0x1d1dd,
0x1d300, 0x1d356,
0x1d400, 0x1d454,
0x1d456, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d51e, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d552, 0x1d6a3,
0x1d6a8, 0x1d7c9,
0x1d7ce, 0x1d7ff,
0x20000, 0x2a6d6,
0x2f800, 0x2fa1d,
0xe0001, 0xe0001,
0xe0020, 0xe007f,
0xe0100, 0xe01ef,
0xf0000, 0xffffd,
0x100000, 0x10fffd
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBGraph */
static const OnigCodePoint SBLower[] = {
1,
0x0061, 0x007a
};
static const OnigCodePoint MBLower[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
423,
#else
5,
#endif
0x00aa, 0x00aa,
0x00b5, 0x00b5,
0x00ba, 0x00ba,
0x00df, 0x00f6,
0x00f8, 0x00ff
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0101, 0x0101,
0x0103, 0x0103,
0x0105, 0x0105,
0x0107, 0x0107,
0x0109, 0x0109,
0x010b, 0x010b,
0x010d, 0x010d,
0x010f, 0x010f,
0x0111, 0x0111,
0x0113, 0x0113,
0x0115, 0x0115,
0x0117, 0x0117,
0x0119, 0x0119,
0x011b, 0x011b,
0x011d, 0x011d,
0x011f, 0x011f,
0x0121, 0x0121,
0x0123, 0x0123,
0x0125, 0x0125,
0x0127, 0x0127,
0x0129, 0x0129,
0x012b, 0x012b,
0x012d, 0x012d,
0x012f, 0x012f,
0x0131, 0x0131,
0x0133, 0x0133,
0x0135, 0x0135,
0x0137, 0x0138,
0x013a, 0x013a,
0x013c, 0x013c,
0x013e, 0x013e,
0x0140, 0x0140,
0x0142, 0x0142,
0x0144, 0x0144,
0x0146, 0x0146,
0x0148, 0x0149,
0x014b, 0x014b,
0x014d, 0x014d,
0x014f, 0x014f,
0x0151, 0x0151,
0x0153, 0x0153,
0x0155, 0x0155,
0x0157, 0x0157,
0x0159, 0x0159,
0x015b, 0x015b,
0x015d, 0x015d,
0x015f, 0x015f,
0x0161, 0x0161,
0x0163, 0x0163,
0x0165, 0x0165,
0x0167, 0x0167,
0x0169, 0x0169,
0x016b, 0x016b,
0x016d, 0x016d,
0x016f, 0x016f,
0x0171, 0x0171,
0x0173, 0x0173,
0x0175, 0x0175,
0x0177, 0x0177,
0x017a, 0x017a,
0x017c, 0x017c,
0x017e, 0x0180,
0x0183, 0x0183,
0x0185, 0x0185,
0x0188, 0x0188,
0x018c, 0x018d,
0x0192, 0x0192,
0x0195, 0x0195,
0x0199, 0x019b,
0x019e, 0x019e,
0x01a1, 0x01a1,
0x01a3, 0x01a3,
0x01a5, 0x01a5,
0x01a8, 0x01a8,
0x01aa, 0x01ab,
0x01ad, 0x01ad,
0x01b0, 0x01b0,
0x01b4, 0x01b4,
0x01b6, 0x01b6,
0x01b9, 0x01ba,
0x01bd, 0x01bf,
0x01c6, 0x01c6,
0x01c9, 0x01c9,
0x01cc, 0x01cc,
0x01ce, 0x01ce,
0x01d0, 0x01d0,
0x01d2, 0x01d2,
0x01d4, 0x01d4,
0x01d6, 0x01d6,
0x01d8, 0x01d8,
0x01da, 0x01da,
0x01dc, 0x01dd,
0x01df, 0x01df,
0x01e1, 0x01e1,
0x01e3, 0x01e3,
0x01e5, 0x01e5,
0x01e7, 0x01e7,
0x01e9, 0x01e9,
0x01eb, 0x01eb,
0x01ed, 0x01ed,
0x01ef, 0x01f0,
0x01f3, 0x01f3,
0x01f5, 0x01f5,
0x01f9, 0x01f9,
0x01fb, 0x01fb,
0x01fd, 0x01fd,
0x01ff, 0x01ff,
0x0201, 0x0201,
0x0203, 0x0203,
0x0205, 0x0205,
0x0207, 0x0207,
0x0209, 0x0209,
0x020b, 0x020b,
0x020d, 0x020d,
0x020f, 0x020f,
0x0211, 0x0211,
0x0213, 0x0213,
0x0215, 0x0215,
0x0217, 0x0217,
0x0219, 0x0219,
0x021b, 0x021b,
0x021d, 0x021d,
0x021f, 0x021f,
0x0221, 0x0221,
0x0223, 0x0223,
0x0225, 0x0225,
0x0227, 0x0227,
0x0229, 0x0229,
0x022b, 0x022b,
0x022d, 0x022d,
0x022f, 0x022f,
0x0231, 0x0231,
0x0233, 0x0236,
0x0250, 0x02af,
0x0390, 0x0390,
0x03ac, 0x03ce,
0x03d0, 0x03d1,
0x03d5, 0x03d7,
0x03d9, 0x03d9,
0x03db, 0x03db,
0x03dd, 0x03dd,
0x03df, 0x03df,
0x03e1, 0x03e1,
0x03e3, 0x03e3,
0x03e5, 0x03e5,
0x03e7, 0x03e7,
0x03e9, 0x03e9,
0x03eb, 0x03eb,
0x03ed, 0x03ed,
0x03ef, 0x03f3,
0x03f5, 0x03f5,
0x03f8, 0x03f8,
0x03fb, 0x03fb,
0x0430, 0x045f,
0x0461, 0x0461,
0x0463, 0x0463,
0x0465, 0x0465,
0x0467, 0x0467,
0x0469, 0x0469,
0x046b, 0x046b,
0x046d, 0x046d,
0x046f, 0x046f,
0x0471, 0x0471,
0x0473, 0x0473,
0x0475, 0x0475,
0x0477, 0x0477,
0x0479, 0x0479,
0x047b, 0x047b,
0x047d, 0x047d,
0x047f, 0x047f,
0x0481, 0x0481,
0x048b, 0x048b,
0x048d, 0x048d,
0x048f, 0x048f,
0x0491, 0x0491,
0x0493, 0x0493,
0x0495, 0x0495,
0x0497, 0x0497,
0x0499, 0x0499,
0x049b, 0x049b,
0x049d, 0x049d,
0x049f, 0x049f,
0x04a1, 0x04a1,
0x04a3, 0x04a3,
0x04a5, 0x04a5,
0x04a7, 0x04a7,
0x04a9, 0x04a9,
0x04ab, 0x04ab,
0x04ad, 0x04ad,
0x04af, 0x04af,
0x04b1, 0x04b1,
0x04b3, 0x04b3,
0x04b5, 0x04b5,
0x04b7, 0x04b7,
0x04b9, 0x04b9,
0x04bb, 0x04bb,
0x04bd, 0x04bd,
0x04bf, 0x04bf,
0x04c2, 0x04c2,
0x04c4, 0x04c4,
0x04c6, 0x04c6,
0x04c8, 0x04c8,
0x04ca, 0x04ca,
0x04cc, 0x04cc,
0x04ce, 0x04ce,
0x04d1, 0x04d1,
0x04d3, 0x04d3,
0x04d5, 0x04d5,
0x04d7, 0x04d7,
0x04d9, 0x04d9,
0x04db, 0x04db,
0x04dd, 0x04dd,
0x04df, 0x04df,
0x04e1, 0x04e1,
0x04e3, 0x04e3,
0x04e5, 0x04e5,
0x04e7, 0x04e7,
0x04e9, 0x04e9,
0x04eb, 0x04eb,
0x04ed, 0x04ed,
0x04ef, 0x04ef,
0x04f1, 0x04f1,
0x04f3, 0x04f3,
0x04f5, 0x04f5,
0x04f9, 0x04f9,
0x0501, 0x0501,
0x0503, 0x0503,
0x0505, 0x0505,
0x0507, 0x0507,
0x0509, 0x0509,
0x050b, 0x050b,
0x050d, 0x050d,
0x050f, 0x050f,
0x0561, 0x0587,
0x1d00, 0x1d2b,
0x1d62, 0x1d6b,
0x1e01, 0x1e01,
0x1e03, 0x1e03,
0x1e05, 0x1e05,
0x1e07, 0x1e07,
0x1e09, 0x1e09,
0x1e0b, 0x1e0b,
0x1e0d, 0x1e0d,
0x1e0f, 0x1e0f,
0x1e11, 0x1e11,
0x1e13, 0x1e13,
0x1e15, 0x1e15,
0x1e17, 0x1e17,
0x1e19, 0x1e19,
0x1e1b, 0x1e1b,
0x1e1d, 0x1e1d,
0x1e1f, 0x1e1f,
0x1e21, 0x1e21,
0x1e23, 0x1e23,
0x1e25, 0x1e25,
0x1e27, 0x1e27,
0x1e29, 0x1e29,
0x1e2b, 0x1e2b,
0x1e2d, 0x1e2d,
0x1e2f, 0x1e2f,
0x1e31, 0x1e31,
0x1e33, 0x1e33,
0x1e35, 0x1e35,
0x1e37, 0x1e37,
0x1e39, 0x1e39,
0x1e3b, 0x1e3b,
0x1e3d, 0x1e3d,
0x1e3f, 0x1e3f,
0x1e41, 0x1e41,
0x1e43, 0x1e43,
0x1e45, 0x1e45,
0x1e47, 0x1e47,
0x1e49, 0x1e49,
0x1e4b, 0x1e4b,
0x1e4d, 0x1e4d,
0x1e4f, 0x1e4f,
0x1e51, 0x1e51,
0x1e53, 0x1e53,
0x1e55, 0x1e55,
0x1e57, 0x1e57,
0x1e59, 0x1e59,
0x1e5b, 0x1e5b,
0x1e5d, 0x1e5d,
0x1e5f, 0x1e5f,
0x1e61, 0x1e61,
0x1e63, 0x1e63,
0x1e65, 0x1e65,
0x1e67, 0x1e67,
0x1e69, 0x1e69,
0x1e6b, 0x1e6b,
0x1e6d, 0x1e6d,
0x1e6f, 0x1e6f,
0x1e71, 0x1e71,
0x1e73, 0x1e73,
0x1e75, 0x1e75,
0x1e77, 0x1e77,
0x1e79, 0x1e79,
0x1e7b, 0x1e7b,
0x1e7d, 0x1e7d,
0x1e7f, 0x1e7f,
0x1e81, 0x1e81,
0x1e83, 0x1e83,
0x1e85, 0x1e85,
0x1e87, 0x1e87,
0x1e89, 0x1e89,
0x1e8b, 0x1e8b,
0x1e8d, 0x1e8d,
0x1e8f, 0x1e8f,
0x1e91, 0x1e91,
0x1e93, 0x1e93,
0x1e95, 0x1e9b,
0x1ea1, 0x1ea1,
0x1ea3, 0x1ea3,
0x1ea5, 0x1ea5,
0x1ea7, 0x1ea7,
0x1ea9, 0x1ea9,
0x1eab, 0x1eab,
0x1ead, 0x1ead,
0x1eaf, 0x1eaf,
0x1eb1, 0x1eb1,
0x1eb3, 0x1eb3,
0x1eb5, 0x1eb5,
0x1eb7, 0x1eb7,
0x1eb9, 0x1eb9,
0x1ebb, 0x1ebb,
0x1ebd, 0x1ebd,
0x1ebf, 0x1ebf,
0x1ec1, 0x1ec1,
0x1ec3, 0x1ec3,
0x1ec5, 0x1ec5,
0x1ec7, 0x1ec7,
0x1ec9, 0x1ec9,
0x1ecb, 0x1ecb,
0x1ecd, 0x1ecd,
0x1ecf, 0x1ecf,
0x1ed1, 0x1ed1,
0x1ed3, 0x1ed3,
0x1ed5, 0x1ed5,
0x1ed7, 0x1ed7,
0x1ed9, 0x1ed9,
0x1edb, 0x1edb,
0x1edd, 0x1edd,
0x1edf, 0x1edf,
0x1ee1, 0x1ee1,
0x1ee3, 0x1ee3,
0x1ee5, 0x1ee5,
0x1ee7, 0x1ee7,
0x1ee9, 0x1ee9,
0x1eeb, 0x1eeb,
0x1eed, 0x1eed,
0x1eef, 0x1eef,
0x1ef1, 0x1ef1,
0x1ef3, 0x1ef3,
0x1ef5, 0x1ef5,
0x1ef7, 0x1ef7,
0x1ef9, 0x1ef9,
0x1f00, 0x1f07,
0x1f10, 0x1f15,
0x1f20, 0x1f27,
0x1f30, 0x1f37,
0x1f40, 0x1f45,
0x1f50, 0x1f57,
0x1f60, 0x1f67,
0x1f70, 0x1f7d,
0x1f80, 0x1f87,
0x1f90, 0x1f97,
0x1fa0, 0x1fa7,
0x1fb0, 0x1fb4,
0x1fb6, 0x1fb7,
0x1fbe, 0x1fbe,
0x1fc2, 0x1fc4,
0x1fc6, 0x1fc7,
0x1fd0, 0x1fd3,
0x1fd6, 0x1fd7,
0x1fe0, 0x1fe7,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ff7,
0x2071, 0x2071,
0x207f, 0x207f,
0x210a, 0x210a,
0x210e, 0x210f,
0x2113, 0x2113,
0x212f, 0x212f,
0x2134, 0x2134,
0x2139, 0x2139,
0x213d, 0x213d,
0x2146, 0x2149,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xff41, 0xff5a,
0x10428, 0x1044f,
0x1d41a, 0x1d433,
0x1d44e, 0x1d454,
0x1d456, 0x1d467,
0x1d482, 0x1d49b,
0x1d4b6, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d4cf,
0x1d4ea, 0x1d503,
0x1d51e, 0x1d537,
0x1d552, 0x1d56b,
0x1d586, 0x1d59f,
0x1d5ba, 0x1d5d3,
0x1d5ee, 0x1d607,
0x1d622, 0x1d63b,
0x1d656, 0x1d66f,
0x1d68a, 0x1d6a3,
0x1d6c2, 0x1d6da,
0x1d6dc, 0x1d6e1,
0x1d6fc, 0x1d714,
0x1d716, 0x1d71b,
0x1d736, 0x1d74e,
0x1d750, 0x1d755,
0x1d770, 0x1d788,
0x1d78a, 0x1d78f,
0x1d7aa, 0x1d7c2,
0x1d7c4, 0x1d7c9
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBLower */
static const OnigCodePoint SBPrint[] = {
2,
0x0009, 0x000d,
0x0020, 0x007e
};
static const OnigCodePoint MBPrint[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
403,
#else
2,
#endif
0x0085, 0x0085,
0x00a0, 0x0236
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0250, 0x0357,
0x035d, 0x036f,
0x0374, 0x0375,
0x037a, 0x037a,
0x037e, 0x037e,
0x0384, 0x038a,
0x038c, 0x038c,
0x038e, 0x03a1,
0x03a3, 0x03ce,
0x03d0, 0x03fb,
0x0400, 0x0486,
0x0488, 0x04ce,
0x04d0, 0x04f5,
0x04f8, 0x04f9,
0x0500, 0x050f,
0x0531, 0x0556,
0x0559, 0x055f,
0x0561, 0x0587,
0x0589, 0x058a,
0x0591, 0x05a1,
0x05a3, 0x05b9,
0x05bb, 0x05c4,
0x05d0, 0x05ea,
0x05f0, 0x05f4,
0x0600, 0x0603,
0x060c, 0x0615,
0x061b, 0x061b,
0x061f, 0x061f,
0x0621, 0x063a,
0x0640, 0x0658,
0x0660, 0x070d,
0x070f, 0x074a,
0x074d, 0x074f,
0x0780, 0x07b1,
0x0901, 0x0939,
0x093c, 0x094d,
0x0950, 0x0954,
0x0958, 0x0970,
0x0981, 0x0983,
0x0985, 0x098c,
0x098f, 0x0990,
0x0993, 0x09a8,
0x09aa, 0x09b0,
0x09b2, 0x09b2,
0x09b6, 0x09b9,
0x09bc, 0x09c4,
0x09c7, 0x09c8,
0x09cb, 0x09cd,
0x09d7, 0x09d7,
0x09dc, 0x09dd,
0x09df, 0x09e3,
0x09e6, 0x09fa,
0x0a01, 0x0a03,
0x0a05, 0x0a0a,
0x0a0f, 0x0a10,
0x0a13, 0x0a28,
0x0a2a, 0x0a30,
0x0a32, 0x0a33,
0x0a35, 0x0a36,
0x0a38, 0x0a39,
0x0a3c, 0x0a3c,
0x0a3e, 0x0a42,
0x0a47, 0x0a48,
0x0a4b, 0x0a4d,
0x0a59, 0x0a5c,
0x0a5e, 0x0a5e,
0x0a66, 0x0a74,
0x0a81, 0x0a83,
0x0a85, 0x0a8d,
0x0a8f, 0x0a91,
0x0a93, 0x0aa8,
0x0aaa, 0x0ab0,
0x0ab2, 0x0ab3,
0x0ab5, 0x0ab9,
0x0abc, 0x0ac5,
0x0ac7, 0x0ac9,
0x0acb, 0x0acd,
0x0ad0, 0x0ad0,
0x0ae0, 0x0ae3,
0x0ae6, 0x0aef,
0x0af1, 0x0af1,
0x0b01, 0x0b03,
0x0b05, 0x0b0c,
0x0b0f, 0x0b10,
0x0b13, 0x0b28,
0x0b2a, 0x0b30,
0x0b32, 0x0b33,
0x0b35, 0x0b39,
0x0b3c, 0x0b43,
0x0b47, 0x0b48,
0x0b4b, 0x0b4d,
0x0b56, 0x0b57,
0x0b5c, 0x0b5d,
0x0b5f, 0x0b61,
0x0b66, 0x0b71,
0x0b82, 0x0b83,
0x0b85, 0x0b8a,
0x0b8e, 0x0b90,
0x0b92, 0x0b95,
0x0b99, 0x0b9a,
0x0b9c, 0x0b9c,
0x0b9e, 0x0b9f,
0x0ba3, 0x0ba4,
0x0ba8, 0x0baa,
0x0bae, 0x0bb5,
0x0bb7, 0x0bb9,
0x0bbe, 0x0bc2,
0x0bc6, 0x0bc8,
0x0bca, 0x0bcd,
0x0bd7, 0x0bd7,
0x0be7, 0x0bfa,
0x0c01, 0x0c03,
0x0c05, 0x0c0c,
0x0c0e, 0x0c10,
0x0c12, 0x0c28,
0x0c2a, 0x0c33,
0x0c35, 0x0c39,
0x0c3e, 0x0c44,
0x0c46, 0x0c48,
0x0c4a, 0x0c4d,
0x0c55, 0x0c56,
0x0c60, 0x0c61,
0x0c66, 0x0c6f,
0x0c82, 0x0c83,
0x0c85, 0x0c8c,
0x0c8e, 0x0c90,
0x0c92, 0x0ca8,
0x0caa, 0x0cb3,
0x0cb5, 0x0cb9,
0x0cbc, 0x0cc4,
0x0cc6, 0x0cc8,
0x0cca, 0x0ccd,
0x0cd5, 0x0cd6,
0x0cde, 0x0cde,
0x0ce0, 0x0ce1,
0x0ce6, 0x0cef,
0x0d02, 0x0d03,
0x0d05, 0x0d0c,
0x0d0e, 0x0d10,
0x0d12, 0x0d28,
0x0d2a, 0x0d39,
0x0d3e, 0x0d43,
0x0d46, 0x0d48,
0x0d4a, 0x0d4d,
0x0d57, 0x0d57,
0x0d60, 0x0d61,
0x0d66, 0x0d6f,
0x0d82, 0x0d83,
0x0d85, 0x0d96,
0x0d9a, 0x0db1,
0x0db3, 0x0dbb,
0x0dbd, 0x0dbd,
0x0dc0, 0x0dc6,
0x0dca, 0x0dca,
0x0dcf, 0x0dd4,
0x0dd6, 0x0dd6,
0x0dd8, 0x0ddf,
0x0df2, 0x0df4,
0x0e01, 0x0e3a,
0x0e3f, 0x0e5b,
0x0e81, 0x0e82,
0x0e84, 0x0e84,
0x0e87, 0x0e88,
0x0e8a, 0x0e8a,
0x0e8d, 0x0e8d,
0x0e94, 0x0e97,
0x0e99, 0x0e9f,
0x0ea1, 0x0ea3,
0x0ea5, 0x0ea5,
0x0ea7, 0x0ea7,
0x0eaa, 0x0eab,
0x0ead, 0x0eb9,
0x0ebb, 0x0ebd,
0x0ec0, 0x0ec4,
0x0ec6, 0x0ec6,
0x0ec8, 0x0ecd,
0x0ed0, 0x0ed9,
0x0edc, 0x0edd,
0x0f00, 0x0f47,
0x0f49, 0x0f6a,
0x0f71, 0x0f8b,
0x0f90, 0x0f97,
0x0f99, 0x0fbc,
0x0fbe, 0x0fcc,
0x0fcf, 0x0fcf,
0x1000, 0x1021,
0x1023, 0x1027,
0x1029, 0x102a,
0x102c, 0x1032,
0x1036, 0x1039,
0x1040, 0x1059,
0x10a0, 0x10c5,
0x10d0, 0x10f8,
0x10fb, 0x10fb,
0x1100, 0x1159,
0x115f, 0x11a2,
0x11a8, 0x11f9,
0x1200, 0x1206,
0x1208, 0x1246,
0x1248, 0x1248,
0x124a, 0x124d,
0x1250, 0x1256,
0x1258, 0x1258,
0x125a, 0x125d,
0x1260, 0x1286,
0x1288, 0x1288,
0x128a, 0x128d,
0x1290, 0x12ae,
0x12b0, 0x12b0,
0x12b2, 0x12b5,
0x12b8, 0x12be,
0x12c0, 0x12c0,
0x12c2, 0x12c5,
0x12c8, 0x12ce,
0x12d0, 0x12d6,
0x12d8, 0x12ee,
0x12f0, 0x130e,
0x1310, 0x1310,
0x1312, 0x1315,
0x1318, 0x131e,
0x1320, 0x1346,
0x1348, 0x135a,
0x1361, 0x137c,
0x13a0, 0x13f4,
0x1401, 0x1676,
0x1680, 0x169c,
0x16a0, 0x16f0,
0x1700, 0x170c,
0x170e, 0x1714,
0x1720, 0x1736,
0x1740, 0x1753,
0x1760, 0x176c,
0x176e, 0x1770,
0x1772, 0x1773,
0x1780, 0x17dd,
0x17e0, 0x17e9,
0x17f0, 0x17f9,
0x1800, 0x180e,
0x1810, 0x1819,
0x1820, 0x1877,
0x1880, 0x18a9,
0x1900, 0x191c,
0x1920, 0x192b,
0x1930, 0x193b,
0x1940, 0x1940,
0x1944, 0x196d,
0x1970, 0x1974,
0x19e0, 0x19ff,
0x1d00, 0x1d6b,
0x1e00, 0x1e9b,
0x1ea0, 0x1ef9,
0x1f00, 0x1f15,
0x1f18, 0x1f1d,
0x1f20, 0x1f45,
0x1f48, 0x1f4d,
0x1f50, 0x1f57,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f7d,
0x1f80, 0x1fb4,
0x1fb6, 0x1fc4,
0x1fc6, 0x1fd3,
0x1fd6, 0x1fdb,
0x1fdd, 0x1fef,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ffe,
0x2000, 0x2054,
0x2057, 0x2057,
0x205f, 0x2063,
0x206a, 0x2071,
0x2074, 0x208e,
0x20a0, 0x20b1,
0x20d0, 0x20ea,
0x2100, 0x213b,
0x213d, 0x214b,
0x2153, 0x2183,
0x2190, 0x23d0,
0x2400, 0x2426,
0x2440, 0x244a,
0x2460, 0x2617,
0x2619, 0x267d,
0x2680, 0x2691,
0x26a0, 0x26a1,
0x2701, 0x2704,
0x2706, 0x2709,
0x270c, 0x2727,
0x2729, 0x274b,
0x274d, 0x274d,
0x274f, 0x2752,
0x2756, 0x2756,
0x2758, 0x275e,
0x2761, 0x2794,
0x2798, 0x27af,
0x27b1, 0x27be,
0x27d0, 0x27eb,
0x27f0, 0x2b0d,
0x2e80, 0x2e99,
0x2e9b, 0x2ef3,
0x2f00, 0x2fd5,
0x2ff0, 0x2ffb,
0x3000, 0x303f,
0x3041, 0x3096,
0x3099, 0x30ff,
0x3105, 0x312c,
0x3131, 0x318e,
0x3190, 0x31b7,
0x31f0, 0x321e,
0x3220, 0x3243,
0x3250, 0x327d,
0x327f, 0x32fe,
0x3300, 0x4db5,
0x4dc0, 0x9fa5,
0xa000, 0xa48c,
0xa490, 0xa4c6,
0xac00, 0xd7a3,
0xe000, 0xfa2d,
0xfa30, 0xfa6a,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xfb1d, 0xfb36,
0xfb38, 0xfb3c,
0xfb3e, 0xfb3e,
0xfb40, 0xfb41,
0xfb43, 0xfb44,
0xfb46, 0xfbb1,
0xfbd3, 0xfd3f,
0xfd50, 0xfd8f,
0xfd92, 0xfdc7,
0xfdf0, 0xfdfd,
0xfe00, 0xfe0f,
0xfe20, 0xfe23,
0xfe30, 0xfe52,
0xfe54, 0xfe66,
0xfe68, 0xfe6b,
0xfe70, 0xfe74,
0xfe76, 0xfefc,
0xfeff, 0xfeff,
0xff01, 0xffbe,
0xffc2, 0xffc7,
0xffca, 0xffcf,
0xffd2, 0xffd7,
0xffda, 0xffdc,
0xffe0, 0xffe6,
0xffe8, 0xffee,
0xfff9, 0xfffd,
0x10000, 0x1000b,
0x1000d, 0x10026,
0x10028, 0x1003a,
0x1003c, 0x1003d,
0x1003f, 0x1004d,
0x10050, 0x1005d,
0x10080, 0x100fa,
0x10100, 0x10102,
0x10107, 0x10133,
0x10137, 0x1013f,
0x10300, 0x1031e,
0x10320, 0x10323,
0x10330, 0x1034a,
0x10380, 0x1039d,
0x1039f, 0x1039f,
0x10400, 0x1049d,
0x104a0, 0x104a9,
0x10800, 0x10805,
0x10808, 0x10808,
0x1080a, 0x10835,
0x10837, 0x10838,
0x1083c, 0x1083c,
0x1083f, 0x1083f,
0x1d000, 0x1d0f5,
0x1d100, 0x1d126,
0x1d12a, 0x1d1dd,
0x1d300, 0x1d356,
0x1d400, 0x1d454,
0x1d456, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d51e, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d552, 0x1d6a3,
0x1d6a8, 0x1d7c9,
0x1d7ce, 0x1d7ff,
0x20000, 0x2a6d6,
0x2f800, 0x2fa1d,
0xe0001, 0xe0001,
0xe0020, 0xe007f,
0xe0100, 0xe01ef,
0xf0000, 0xffffd,
0x100000, 0x10fffd
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBPrint */
static const OnigCodePoint SBPunct[] = {
9,
0x0021, 0x0023,
0x0025, 0x002a,
0x002c, 0x002f,
0x003a, 0x003b,
0x003f, 0x0040,
0x005b, 0x005d,
0x005f, 0x005f,
0x007b, 0x007b,
0x007d, 0x007d
}; /* end of SBPunct */
static const OnigCodePoint MBPunct[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
77,
#else
5,
#endif
0x00a1, 0x00a1,
0x00ab, 0x00ab,
0x00b7, 0x00b7,
0x00bb, 0x00bb,
0x00bf, 0x00bf
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x037e, 0x037e,
0x0387, 0x0387,
0x055a, 0x055f,
0x0589, 0x058a,
0x05be, 0x05be,
0x05c0, 0x05c0,
0x05c3, 0x05c3,
0x05f3, 0x05f4,
0x060c, 0x060d,
0x061b, 0x061b,
0x061f, 0x061f,
0x066a, 0x066d,
0x06d4, 0x06d4,
0x0700, 0x070d,
0x0964, 0x0965,
0x0970, 0x0970,
0x0df4, 0x0df4,
0x0e4f, 0x0e4f,
0x0e5a, 0x0e5b,
0x0f04, 0x0f12,
0x0f3a, 0x0f3d,
0x0f85, 0x0f85,
0x104a, 0x104f,
0x10fb, 0x10fb,
0x1361, 0x1368,
0x166d, 0x166e,
0x169b, 0x169c,
0x16eb, 0x16ed,
0x1735, 0x1736,
0x17d4, 0x17d6,
0x17d8, 0x17da,
0x1800, 0x180a,
0x1944, 0x1945,
0x2010, 0x2027,
0x2030, 0x2043,
0x2045, 0x2051,
0x2053, 0x2054,
0x2057, 0x2057,
0x207d, 0x207e,
0x208d, 0x208e,
0x2329, 0x232a,
0x23b4, 0x23b6,
0x2768, 0x2775,
0x27e6, 0x27eb,
0x2983, 0x2998,
0x29d8, 0x29db,
0x29fc, 0x29fd,
0x3001, 0x3003,
0x3008, 0x3011,
0x3014, 0x301f,
0x3030, 0x3030,
0x303d, 0x303d,
0x30a0, 0x30a0,
0x30fb, 0x30fb,
0xfd3e, 0xfd3f,
0xfe30, 0xfe52,
0xfe54, 0xfe61,
0xfe63, 0xfe63,
0xfe68, 0xfe68,
0xfe6a, 0xfe6b,
0xff01, 0xff03,
0xff05, 0xff0a,
0xff0c, 0xff0f,
0xff1a, 0xff1b,
0xff1f, 0xff20,
0xff3b, 0xff3d,
0xff3f, 0xff3f,
0xff5b, 0xff5b,
0xff5d, 0xff5d,
0xff5f, 0xff65,
0x10100, 0x10101,
0x1039f, 0x1039f
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBPunct */
static const OnigCodePoint SBSpace[] = {
2,
0x0009, 0x000d,
0x0020, 0x0020
};
static const OnigCodePoint MBSpace[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
9,
#else
2,
#endif
0x0085, 0x0085,
0x00a0, 0x00a0
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x1680, 0x1680,
0x180e, 0x180e,
0x2000, 0x200a,
0x2028, 0x2029,
0x202f, 0x202f,
0x205f, 0x205f,
0x3000, 0x3000
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBSpace */
static const OnigCodePoint SBUpper[] = {
1,
0x0041, 0x005a
};
static const OnigCodePoint MBUpper[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
420,
#else
2,
#endif
0x00c0, 0x00d6,
0x00d8, 0x00de
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
,
0x0100, 0x0100,
0x0102, 0x0102,
0x0104, 0x0104,
0x0106, 0x0106,
0x0108, 0x0108,
0x010a, 0x010a,
0x010c, 0x010c,
0x010e, 0x010e,
0x0110, 0x0110,
0x0112, 0x0112,
0x0114, 0x0114,
0x0116, 0x0116,
0x0118, 0x0118,
0x011a, 0x011a,
0x011c, 0x011c,
0x011e, 0x011e,
0x0120, 0x0120,
0x0122, 0x0122,
0x0124, 0x0124,
0x0126, 0x0126,
0x0128, 0x0128,
0x012a, 0x012a,
0x012c, 0x012c,
0x012e, 0x012e,
0x0130, 0x0130,
0x0132, 0x0132,
0x0134, 0x0134,
0x0136, 0x0136,
0x0139, 0x0139,
0x013b, 0x013b,
0x013d, 0x013d,
0x013f, 0x013f,
0x0141, 0x0141,
0x0143, 0x0143,
0x0145, 0x0145,
0x0147, 0x0147,
0x014a, 0x014a,
0x014c, 0x014c,
0x014e, 0x014e,
0x0150, 0x0150,
0x0152, 0x0152,
0x0154, 0x0154,
0x0156, 0x0156,
0x0158, 0x0158,
0x015a, 0x015a,
0x015c, 0x015c,
0x015e, 0x015e,
0x0160, 0x0160,
0x0162, 0x0162,
0x0164, 0x0164,
0x0166, 0x0166,
0x0168, 0x0168,
0x016a, 0x016a,
0x016c, 0x016c,
0x016e, 0x016e,
0x0170, 0x0170,
0x0172, 0x0172,
0x0174, 0x0174,
0x0176, 0x0176,
0x0178, 0x0179,
0x017b, 0x017b,
0x017d, 0x017d,
0x0181, 0x0182,
0x0184, 0x0184,
0x0186, 0x0187,
0x0189, 0x018b,
0x018e, 0x0191,
0x0193, 0x0194,
0x0196, 0x0198,
0x019c, 0x019d,
0x019f, 0x01a0,
0x01a2, 0x01a2,
0x01a4, 0x01a4,
0x01a6, 0x01a7,
0x01a9, 0x01a9,
0x01ac, 0x01ac,
0x01ae, 0x01af,
0x01b1, 0x01b3,
0x01b5, 0x01b5,
0x01b7, 0x01b8,
0x01bc, 0x01bc,
0x01c4, 0x01c4,
0x01c7, 0x01c7,
0x01ca, 0x01ca,
0x01cd, 0x01cd,
0x01cf, 0x01cf,
0x01d1, 0x01d1,
0x01d3, 0x01d3,
0x01d5, 0x01d5,
0x01d7, 0x01d7,
0x01d9, 0x01d9,
0x01db, 0x01db,
0x01de, 0x01de,
0x01e0, 0x01e0,
0x01e2, 0x01e2,
0x01e4, 0x01e4,
0x01e6, 0x01e6,
0x01e8, 0x01e8,
0x01ea, 0x01ea,
0x01ec, 0x01ec,
0x01ee, 0x01ee,
0x01f1, 0x01f1,
0x01f4, 0x01f4,
0x01f6, 0x01f8,
0x01fa, 0x01fa,
0x01fc, 0x01fc,
0x01fe, 0x01fe,
0x0200, 0x0200,
0x0202, 0x0202,
0x0204, 0x0204,
0x0206, 0x0206,
0x0208, 0x0208,
0x020a, 0x020a,
0x020c, 0x020c,
0x020e, 0x020e,
0x0210, 0x0210,
0x0212, 0x0212,
0x0214, 0x0214,
0x0216, 0x0216,
0x0218, 0x0218,
0x021a, 0x021a,
0x021c, 0x021c,
0x021e, 0x021e,
0x0220, 0x0220,
0x0222, 0x0222,
0x0224, 0x0224,
0x0226, 0x0226,
0x0228, 0x0228,
0x022a, 0x022a,
0x022c, 0x022c,
0x022e, 0x022e,
0x0230, 0x0230,
0x0232, 0x0232,
0x0386, 0x0386,
0x0388, 0x038a,
0x038c, 0x038c,
0x038e, 0x038f,
0x0391, 0x03a1,
0x03a3, 0x03ab,
0x03d2, 0x03d4,
0x03d8, 0x03d8,
0x03da, 0x03da,
0x03dc, 0x03dc,
0x03de, 0x03de,
0x03e0, 0x03e0,
0x03e2, 0x03e2,
0x03e4, 0x03e4,
0x03e6, 0x03e6,
0x03e8, 0x03e8,
0x03ea, 0x03ea,
0x03ec, 0x03ec,
0x03ee, 0x03ee,
0x03f4, 0x03f4,
0x03f7, 0x03f7,
0x03f9, 0x03fa,
0x0400, 0x042f,
0x0460, 0x0460,
0x0462, 0x0462,
0x0464, 0x0464,
0x0466, 0x0466,
0x0468, 0x0468,
0x046a, 0x046a,
0x046c, 0x046c,
0x046e, 0x046e,
0x0470, 0x0470,
0x0472, 0x0472,
0x0474, 0x0474,
0x0476, 0x0476,
0x0478, 0x0478,
0x047a, 0x047a,
0x047c, 0x047c,
0x047e, 0x047e,
0x0480, 0x0480,
0x048a, 0x048a,
0x048c, 0x048c,
0x048e, 0x048e,
0x0490, 0x0490,
0x0492, 0x0492,
0x0494, 0x0494,
0x0496, 0x0496,
0x0498, 0x0498,
0x049a, 0x049a,
0x049c, 0x049c,
0x049e, 0x049e,
0x04a0, 0x04a0,
0x04a2, 0x04a2,
0x04a4, 0x04a4,
0x04a6, 0x04a6,
0x04a8, 0x04a8,
0x04aa, 0x04aa,
0x04ac, 0x04ac,
0x04ae, 0x04ae,
0x04b0, 0x04b0,
0x04b2, 0x04b2,
0x04b4, 0x04b4,
0x04b6, 0x04b6,
0x04b8, 0x04b8,
0x04ba, 0x04ba,
0x04bc, 0x04bc,
0x04be, 0x04be,
0x04c0, 0x04c1,
0x04c3, 0x04c3,
0x04c5, 0x04c5,
0x04c7, 0x04c7,
0x04c9, 0x04c9,
0x04cb, 0x04cb,
0x04cd, 0x04cd,
0x04d0, 0x04d0,
0x04d2, 0x04d2,
0x04d4, 0x04d4,
0x04d6, 0x04d6,
0x04d8, 0x04d8,
0x04da, 0x04da,
0x04dc, 0x04dc,
0x04de, 0x04de,
0x04e0, 0x04e0,
0x04e2, 0x04e2,
0x04e4, 0x04e4,
0x04e6, 0x04e6,
0x04e8, 0x04e8,
0x04ea, 0x04ea,
0x04ec, 0x04ec,
0x04ee, 0x04ee,
0x04f0, 0x04f0,
0x04f2, 0x04f2,
0x04f4, 0x04f4,
0x04f8, 0x04f8,
0x0500, 0x0500,
0x0502, 0x0502,
0x0504, 0x0504,
0x0506, 0x0506,
0x0508, 0x0508,
0x050a, 0x050a,
0x050c, 0x050c,
0x050e, 0x050e,
0x0531, 0x0556,
0x10a0, 0x10c5,
0x1e00, 0x1e00,
0x1e02, 0x1e02,
0x1e04, 0x1e04,
0x1e06, 0x1e06,
0x1e08, 0x1e08,
0x1e0a, 0x1e0a,
0x1e0c, 0x1e0c,
0x1e0e, 0x1e0e,
0x1e10, 0x1e10,
0x1e12, 0x1e12,
0x1e14, 0x1e14,
0x1e16, 0x1e16,
0x1e18, 0x1e18,
0x1e1a, 0x1e1a,
0x1e1c, 0x1e1c,
0x1e1e, 0x1e1e,
0x1e20, 0x1e20,
0x1e22, 0x1e22,
0x1e24, 0x1e24,
0x1e26, 0x1e26,
0x1e28, 0x1e28,
0x1e2a, 0x1e2a,
0x1e2c, 0x1e2c,
0x1e2e, 0x1e2e,
0x1e30, 0x1e30,
0x1e32, 0x1e32,
0x1e34, 0x1e34,
0x1e36, 0x1e36,
0x1e38, 0x1e38,
0x1e3a, 0x1e3a,
0x1e3c, 0x1e3c,
0x1e3e, 0x1e3e,
0x1e40, 0x1e40,
0x1e42, 0x1e42,
0x1e44, 0x1e44,
0x1e46, 0x1e46,
0x1e48, 0x1e48,
0x1e4a, 0x1e4a,
0x1e4c, 0x1e4c,
0x1e4e, 0x1e4e,
0x1e50, 0x1e50,
0x1e52, 0x1e52,
0x1e54, 0x1e54,
0x1e56, 0x1e56,
0x1e58, 0x1e58,
0x1e5a, 0x1e5a,
0x1e5c, 0x1e5c,
0x1e5e, 0x1e5e,
0x1e60, 0x1e60,
0x1e62, 0x1e62,
0x1e64, 0x1e64,
0x1e66, 0x1e66,
0x1e68, 0x1e68,
0x1e6a, 0x1e6a,
0x1e6c, 0x1e6c,
0x1e6e, 0x1e6e,
0x1e70, 0x1e70,
0x1e72, 0x1e72,
0x1e74, 0x1e74,
0x1e76, 0x1e76,
0x1e78, 0x1e78,
0x1e7a, 0x1e7a,
0x1e7c, 0x1e7c,
0x1e7e, 0x1e7e,
0x1e80, 0x1e80,
0x1e82, 0x1e82,
0x1e84, 0x1e84,
0x1e86, 0x1e86,
0x1e88, 0x1e88,
0x1e8a, 0x1e8a,
0x1e8c, 0x1e8c,
0x1e8e, 0x1e8e,
0x1e90, 0x1e90,
0x1e92, 0x1e92,
0x1e94, 0x1e94,
0x1ea0, 0x1ea0,
0x1ea2, 0x1ea2,
0x1ea4, 0x1ea4,
0x1ea6, 0x1ea6,
0x1ea8, 0x1ea8,
0x1eaa, 0x1eaa,
0x1eac, 0x1eac,
0x1eae, 0x1eae,
0x1eb0, 0x1eb0,
0x1eb2, 0x1eb2,
0x1eb4, 0x1eb4,
0x1eb6, 0x1eb6,
0x1eb8, 0x1eb8,
0x1eba, 0x1eba,
0x1ebc, 0x1ebc,
0x1ebe, 0x1ebe,
0x1ec0, 0x1ec0,
0x1ec2, 0x1ec2,
0x1ec4, 0x1ec4,
0x1ec6, 0x1ec6,
0x1ec8, 0x1ec8,
0x1eca, 0x1eca,
0x1ecc, 0x1ecc,
0x1ece, 0x1ece,
0x1ed0, 0x1ed0,
0x1ed2, 0x1ed2,
0x1ed4, 0x1ed4,
0x1ed6, 0x1ed6,
0x1ed8, 0x1ed8,
0x1eda, 0x1eda,
0x1edc, 0x1edc,
0x1ede, 0x1ede,
0x1ee0, 0x1ee0,
0x1ee2, 0x1ee2,
0x1ee4, 0x1ee4,
0x1ee6, 0x1ee6,
0x1ee8, 0x1ee8,
0x1eea, 0x1eea,
0x1eec, 0x1eec,
0x1eee, 0x1eee,
0x1ef0, 0x1ef0,
0x1ef2, 0x1ef2,
0x1ef4, 0x1ef4,
0x1ef6, 0x1ef6,
0x1ef8, 0x1ef8,
0x1f08, 0x1f0f,
0x1f18, 0x1f1d,
0x1f28, 0x1f2f,
0x1f38, 0x1f3f,
0x1f48, 0x1f4d,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f5f,
0x1f68, 0x1f6f,
0x1fb8, 0x1fbb,
0x1fc8, 0x1fcb,
0x1fd8, 0x1fdb,
0x1fe8, 0x1fec,
0x1ff8, 0x1ffb,
0x2102, 0x2102,
0x2107, 0x2107,
0x210b, 0x210d,
0x2110, 0x2112,
0x2115, 0x2115,
0x2119, 0x211d,
0x2124, 0x2124,
0x2126, 0x2126,
0x2128, 0x2128,
0x212a, 0x212d,
0x2130, 0x2131,
0x2133, 0x2133,
0x213e, 0x213f,
0x2145, 0x2145,
0xff21, 0xff3a,
0x10400, 0x10427,
0x1d400, 0x1d419,
0x1d434, 0x1d44d,
0x1d468, 0x1d481,
0x1d49c, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b5,
0x1d4d0, 0x1d4e9,
0x1d504, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d538, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d56c, 0x1d585,
0x1d5a0, 0x1d5b9,
0x1d5d4, 0x1d5ed,
0x1d608, 0x1d621,
0x1d63c, 0x1d655,
0x1d670, 0x1d689,
0x1d6a8, 0x1d6c0,
0x1d6e2, 0x1d6fa,
0x1d71c, 0x1d734,
0x1d756, 0x1d76e,
0x1d790, 0x1d7a8
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBUpper */
static const OnigCodePoint SBXDigit[] = {
3,
0x0030, 0x0039,
0x0041, 0x0046,
0x0061, 0x0066
};
static const OnigCodePoint SBASCII[] = {
1,
0x0000, 0x007f
};
static const OnigCodePoint SBWord[] = {
4,
0x0030, 0x0039,
0x0041, 0x005a,
0x005f, 0x005f,
0x0061, 0x007a
};
static const OnigCodePoint MBWord[] = {
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
432,
#else
8,
#endif
0x00aa, 0x00aa,
0x00b2, 0x00b3,
0x00b5, 0x00b5,
0x00b9, 0x00ba,
0x00bc, 0x00be,
0x00c0, 0x00d6,
0x00d8, 0x00f6,
#ifndef USE_UNICODE_FULL_RANGE_CTYPE
0x00f8, 0x7fffffff
#else /* not USE_UNICODE_FULL_RANGE_CTYPE */
0x00f8, 0x0236,
0x0250, 0x02c1,
0x02c6, 0x02d1,
0x02e0, 0x02e4,
0x02ee, 0x02ee,
0x0300, 0x0357,
0x035d, 0x036f,
0x037a, 0x037a,
0x0386, 0x0386,
0x0388, 0x038a,
0x038c, 0x038c,
0x038e, 0x03a1,
0x03a3, 0x03ce,
0x03d0, 0x03f5,
0x03f7, 0x03fb,
0x0400, 0x0481,
0x0483, 0x0486,
0x0488, 0x04ce,
0x04d0, 0x04f5,
0x04f8, 0x04f9,
0x0500, 0x050f,
0x0531, 0x0556,
0x0559, 0x0559,
0x0561, 0x0587,
0x0591, 0x05a1,
0x05a3, 0x05b9,
0x05bb, 0x05bd,
0x05bf, 0x05bf,
0x05c1, 0x05c2,
0x05c4, 0x05c4,
0x05d0, 0x05ea,
0x05f0, 0x05f2,
0x0610, 0x0615,
0x0621, 0x063a,
0x0640, 0x0658,
0x0660, 0x0669,
0x066e, 0x06d3,
0x06d5, 0x06dc,
0x06de, 0x06e8,
0x06ea, 0x06fc,
0x06ff, 0x06ff,
0x0710, 0x074a,
0x074d, 0x074f,
0x0780, 0x07b1,
0x0901, 0x0939,
0x093c, 0x094d,
0x0950, 0x0954,
0x0958, 0x0963,
0x0966, 0x096f,
0x0981, 0x0983,
0x0985, 0x098c,
0x098f, 0x0990,
0x0993, 0x09a8,
0x09aa, 0x09b0,
0x09b2, 0x09b2,
0x09b6, 0x09b9,
0x09bc, 0x09c4,
0x09c7, 0x09c8,
0x09cb, 0x09cd,
0x09d7, 0x09d7,
0x09dc, 0x09dd,
0x09df, 0x09e3,
0x09e6, 0x09f1,
0x09f4, 0x09f9,
0x0a01, 0x0a03,
0x0a05, 0x0a0a,
0x0a0f, 0x0a10,
0x0a13, 0x0a28,
0x0a2a, 0x0a30,
0x0a32, 0x0a33,
0x0a35, 0x0a36,
0x0a38, 0x0a39,
0x0a3c, 0x0a3c,
0x0a3e, 0x0a42,
0x0a47, 0x0a48,
0x0a4b, 0x0a4d,
0x0a59, 0x0a5c,
0x0a5e, 0x0a5e,
0x0a66, 0x0a74,
0x0a81, 0x0a83,
0x0a85, 0x0a8d,
0x0a8f, 0x0a91,
0x0a93, 0x0aa8,
0x0aaa, 0x0ab0,
0x0ab2, 0x0ab3,
0x0ab5, 0x0ab9,
0x0abc, 0x0ac5,
0x0ac7, 0x0ac9,
0x0acb, 0x0acd,
0x0ad0, 0x0ad0,
0x0ae0, 0x0ae3,
0x0ae6, 0x0aef,
0x0b01, 0x0b03,
0x0b05, 0x0b0c,
0x0b0f, 0x0b10,
0x0b13, 0x0b28,
0x0b2a, 0x0b30,
0x0b32, 0x0b33,
0x0b35, 0x0b39,
0x0b3c, 0x0b43,
0x0b47, 0x0b48,
0x0b4b, 0x0b4d,
0x0b56, 0x0b57,
0x0b5c, 0x0b5d,
0x0b5f, 0x0b61,
0x0b66, 0x0b6f,
0x0b71, 0x0b71,
0x0b82, 0x0b83,
0x0b85, 0x0b8a,
0x0b8e, 0x0b90,
0x0b92, 0x0b95,
0x0b99, 0x0b9a,
0x0b9c, 0x0b9c,
0x0b9e, 0x0b9f,
0x0ba3, 0x0ba4,
0x0ba8, 0x0baa,
0x0bae, 0x0bb5,
0x0bb7, 0x0bb9,
0x0bbe, 0x0bc2,
0x0bc6, 0x0bc8,
0x0bca, 0x0bcd,
0x0bd7, 0x0bd7,
0x0be7, 0x0bf2,
0x0c01, 0x0c03,
0x0c05, 0x0c0c,
0x0c0e, 0x0c10,
0x0c12, 0x0c28,
0x0c2a, 0x0c33,
0x0c35, 0x0c39,
0x0c3e, 0x0c44,
0x0c46, 0x0c48,
0x0c4a, 0x0c4d,
0x0c55, 0x0c56,
0x0c60, 0x0c61,
0x0c66, 0x0c6f,
0x0c82, 0x0c83,
0x0c85, 0x0c8c,
0x0c8e, 0x0c90,
0x0c92, 0x0ca8,
0x0caa, 0x0cb3,
0x0cb5, 0x0cb9,
0x0cbc, 0x0cc4,
0x0cc6, 0x0cc8,
0x0cca, 0x0ccd,
0x0cd5, 0x0cd6,
0x0cde, 0x0cde,
0x0ce0, 0x0ce1,
0x0ce6, 0x0cef,
0x0d02, 0x0d03,
0x0d05, 0x0d0c,
0x0d0e, 0x0d10,
0x0d12, 0x0d28,
0x0d2a, 0x0d39,
0x0d3e, 0x0d43,
0x0d46, 0x0d48,
0x0d4a, 0x0d4d,
0x0d57, 0x0d57,
0x0d60, 0x0d61,
0x0d66, 0x0d6f,
0x0d82, 0x0d83,
0x0d85, 0x0d96,
0x0d9a, 0x0db1,
0x0db3, 0x0dbb,
0x0dbd, 0x0dbd,
0x0dc0, 0x0dc6,
0x0dca, 0x0dca,
0x0dcf, 0x0dd4,
0x0dd6, 0x0dd6,
0x0dd8, 0x0ddf,
0x0df2, 0x0df3,
0x0e01, 0x0e3a,
0x0e40, 0x0e4e,
0x0e50, 0x0e59,
0x0e81, 0x0e82,
0x0e84, 0x0e84,
0x0e87, 0x0e88,
0x0e8a, 0x0e8a,
0x0e8d, 0x0e8d,
0x0e94, 0x0e97,
0x0e99, 0x0e9f,
0x0ea1, 0x0ea3,
0x0ea5, 0x0ea5,
0x0ea7, 0x0ea7,
0x0eaa, 0x0eab,
0x0ead, 0x0eb9,
0x0ebb, 0x0ebd,
0x0ec0, 0x0ec4,
0x0ec6, 0x0ec6,
0x0ec8, 0x0ecd,
0x0ed0, 0x0ed9,
0x0edc, 0x0edd,
0x0f00, 0x0f00,
0x0f18, 0x0f19,
0x0f20, 0x0f33,
0x0f35, 0x0f35,
0x0f37, 0x0f37,
0x0f39, 0x0f39,
0x0f3e, 0x0f47,
0x0f49, 0x0f6a,
0x0f71, 0x0f84,
0x0f86, 0x0f8b,
0x0f90, 0x0f97,
0x0f99, 0x0fbc,
0x0fc6, 0x0fc6,
0x1000, 0x1021,
0x1023, 0x1027,
0x1029, 0x102a,
0x102c, 0x1032,
0x1036, 0x1039,
0x1040, 0x1049,
0x1050, 0x1059,
0x10a0, 0x10c5,
0x10d0, 0x10f8,
0x1100, 0x1159,
0x115f, 0x11a2,
0x11a8, 0x11f9,
0x1200, 0x1206,
0x1208, 0x1246,
0x1248, 0x1248,
0x124a, 0x124d,
0x1250, 0x1256,
0x1258, 0x1258,
0x125a, 0x125d,
0x1260, 0x1286,
0x1288, 0x1288,
0x128a, 0x128d,
0x1290, 0x12ae,
0x12b0, 0x12b0,
0x12b2, 0x12b5,
0x12b8, 0x12be,
0x12c0, 0x12c0,
0x12c2, 0x12c5,
0x12c8, 0x12ce,
0x12d0, 0x12d6,
0x12d8, 0x12ee,
0x12f0, 0x130e,
0x1310, 0x1310,
0x1312, 0x1315,
0x1318, 0x131e,
0x1320, 0x1346,
0x1348, 0x135a,
0x1369, 0x137c,
0x13a0, 0x13f4,
0x1401, 0x166c,
0x166f, 0x1676,
0x1681, 0x169a,
0x16a0, 0x16ea,
0x16ee, 0x16f0,
0x1700, 0x170c,
0x170e, 0x1714,
0x1720, 0x1734,
0x1740, 0x1753,
0x1760, 0x176c,
0x176e, 0x1770,
0x1772, 0x1773,
0x1780, 0x17b3,
0x17b6, 0x17d3,
0x17d7, 0x17d7,
0x17dc, 0x17dd,
0x17e0, 0x17e9,
0x17f0, 0x17f9,
0x180b, 0x180d,
0x1810, 0x1819,
0x1820, 0x1877,
0x1880, 0x18a9,
0x1900, 0x191c,
0x1920, 0x192b,
0x1930, 0x193b,
0x1946, 0x196d,
0x1970, 0x1974,
0x1d00, 0x1d6b,
0x1e00, 0x1e9b,
0x1ea0, 0x1ef9,
0x1f00, 0x1f15,
0x1f18, 0x1f1d,
0x1f20, 0x1f45,
0x1f48, 0x1f4d,
0x1f50, 0x1f57,
0x1f59, 0x1f59,
0x1f5b, 0x1f5b,
0x1f5d, 0x1f5d,
0x1f5f, 0x1f7d,
0x1f80, 0x1fb4,
0x1fb6, 0x1fbc,
0x1fbe, 0x1fbe,
0x1fc2, 0x1fc4,
0x1fc6, 0x1fcc,
0x1fd0, 0x1fd3,
0x1fd6, 0x1fdb,
0x1fe0, 0x1fec,
0x1ff2, 0x1ff4,
0x1ff6, 0x1ffc,
0x203f, 0x2040,
0x2054, 0x2054,
0x2070, 0x2071,
0x2074, 0x2079,
0x207f, 0x2089,
0x20d0, 0x20ea,
0x2102, 0x2102,
0x2107, 0x2107,
0x210a, 0x2113,
0x2115, 0x2115,
0x2119, 0x211d,
0x2124, 0x2124,
0x2126, 0x2126,
0x2128, 0x2128,
0x212a, 0x212d,
0x212f, 0x2131,
0x2133, 0x2139,
0x213d, 0x213f,
0x2145, 0x2149,
0x2153, 0x2183,
0x2460, 0x249b,
0x24ea, 0x24ff,
0x2776, 0x2793,
0x3005, 0x3007,
0x3021, 0x302f,
0x3031, 0x3035,
0x3038, 0x303c,
0x3041, 0x3096,
0x3099, 0x309a,
0x309d, 0x309f,
0x30a1, 0x30ff,
0x3105, 0x312c,
0x3131, 0x318e,
0x3192, 0x3195,
0x31a0, 0x31b7,
0x31f0, 0x31ff,
0x3220, 0x3229,
0x3251, 0x325f,
0x3280, 0x3289,
0x32b1, 0x32bf,
0x3400, 0x4db5,
0x4e00, 0x9fa5,
0xa000, 0xa48c,
0xac00, 0xd7a3,
0xf900, 0xfa2d,
0xfa30, 0xfa6a,
0xfb00, 0xfb06,
0xfb13, 0xfb17,
0xfb1d, 0xfb28,
0xfb2a, 0xfb36,
0xfb38, 0xfb3c,
0xfb3e, 0xfb3e,
0xfb40, 0xfb41,
0xfb43, 0xfb44,
0xfb46, 0xfbb1,
0xfbd3, 0xfd3d,
0xfd50, 0xfd8f,
0xfd92, 0xfdc7,
0xfdf0, 0xfdfb,
0xfe00, 0xfe0f,
0xfe20, 0xfe23,
0xfe33, 0xfe34,
0xfe4d, 0xfe4f,
0xfe70, 0xfe74,
0xfe76, 0xfefc,
0xff10, 0xff19,
0xff21, 0xff3a,
0xff3f, 0xff3f,
0xff41, 0xff5a,
0xff65, 0xffbe,
0xffc2, 0xffc7,
0xffca, 0xffcf,
0xffd2, 0xffd7,
0xffda, 0xffdc,
0x10000, 0x1000b,
0x1000d, 0x10026,
0x10028, 0x1003a,
0x1003c, 0x1003d,
0x1003f, 0x1004d,
0x10050, 0x1005d,
0x10080, 0x100fa,
0x10107, 0x10133,
0x10300, 0x1031e,
0x10320, 0x10323,
0x10330, 0x1034a,
0x10380, 0x1039d,
0x10400, 0x1049d,
0x104a0, 0x104a9,
0x10800, 0x10805,
0x10808, 0x10808,
0x1080a, 0x10835,
0x10837, 0x10838,
0x1083c, 0x1083c,
0x1083f, 0x1083f,
0x1d165, 0x1d169,
0x1d16d, 0x1d172,
0x1d17b, 0x1d182,
0x1d185, 0x1d18b,
0x1d1aa, 0x1d1ad,
0x1d400, 0x1d454,
0x1d456, 0x1d49c,
0x1d49e, 0x1d49f,
0x1d4a2, 0x1d4a2,
0x1d4a5, 0x1d4a6,
0x1d4a9, 0x1d4ac,
0x1d4ae, 0x1d4b9,
0x1d4bb, 0x1d4bb,
0x1d4bd, 0x1d4c3,
0x1d4c5, 0x1d505,
0x1d507, 0x1d50a,
0x1d50d, 0x1d514,
0x1d516, 0x1d51c,
0x1d51e, 0x1d539,
0x1d53b, 0x1d53e,
0x1d540, 0x1d544,
0x1d546, 0x1d546,
0x1d54a, 0x1d550,
0x1d552, 0x1d6a3,
0x1d6a8, 0x1d6c0,
0x1d6c2, 0x1d6da,
0x1d6dc, 0x1d6fa,
0x1d6fc, 0x1d714,
0x1d716, 0x1d734,
0x1d736, 0x1d74e,
0x1d750, 0x1d76e,
0x1d770, 0x1d788,
0x1d78a, 0x1d7a8,
0x1d7aa, 0x1d7c2,
0x1d7c4, 0x1d7c9,
0x1d7ce, 0x1d7ff,
0x20000, 0x2a6d6,
0x2f800, 0x2fa1d,
0xe0100, 0xe01ef
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
}; /* end of MBWord */
static int
utf8_get_ctype_code_range(int ctype,
const OnigCodePoint* sbr[], const OnigCodePoint* mbr[])
{
#define CR_SET(sbl,mbl) do { \
*sbr = sbl; \
*mbr = mbl; \
} while (0)
#define CR_SB_SET(sbl) do { \
*sbr = sbl; \
*mbr = EmptyRange; \
} while (0)
switch (ctype) {
case ONIGENC_CTYPE_ALPHA:
CR_SET(SBAlpha, MBAlpha);
break;
case ONIGENC_CTYPE_BLANK:
CR_SET(SBBlank, MBBlank);
break;
case ONIGENC_CTYPE_CNTRL:
CR_SET(SBCntrl, MBCntrl);
break;
case ONIGENC_CTYPE_DIGIT:
CR_SET(SBDigit, MBDigit);
break;
case ONIGENC_CTYPE_GRAPH:
CR_SET(SBGraph, MBGraph);
break;
case ONIGENC_CTYPE_LOWER:
CR_SET(SBLower, MBLower);
break;
case ONIGENC_CTYPE_PRINT:
CR_SET(SBPrint, MBPrint);
break;
case ONIGENC_CTYPE_PUNCT:
CR_SET(SBPunct, MBPunct);
break;
case ONIGENC_CTYPE_SPACE:
CR_SET(SBSpace, MBSpace);
break;
case ONIGENC_CTYPE_UPPER:
CR_SET(SBUpper, MBUpper);
break;
case ONIGENC_CTYPE_XDIGIT:
CR_SB_SET(SBXDigit);
break;
case ONIGENC_CTYPE_WORD:
CR_SET(SBWord, MBWord);
break;
case ONIGENC_CTYPE_ASCII:
CR_SB_SET(SBASCII);
break;
case ONIGENC_CTYPE_ALNUM:
CR_SET(SBAlnum, MBAlnum);
break;
default:
return ONIGENCERR_TYPE_BUG;
break;
}
return 0;
}
static int
utf8_is_code_ctype(OnigCodePoint code, unsigned int ctype)
{
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
const OnigCodePoint *range;
#endif
if (code < 256) {
return ONIGENC_IS_UNICODE_ISO_8859_1_CTYPE(code, ctype);
}
#ifdef USE_UNICODE_FULL_RANGE_CTYPE
switch (ctype) {
case ONIGENC_CTYPE_ALPHA:
range = MBAlpha;
break;
case ONIGENC_CTYPE_BLANK:
range = MBBlank;
break;
case ONIGENC_CTYPE_CNTRL:
range = MBCntrl;
break;
case ONIGENC_CTYPE_DIGIT:
range = MBDigit;
break;
case ONIGENC_CTYPE_GRAPH:
range = MBGraph;
break;
case ONIGENC_CTYPE_LOWER:
range = MBLower;
break;
case ONIGENC_CTYPE_PRINT:
range = MBPrint;
break;
case ONIGENC_CTYPE_PUNCT:
range = MBPunct;
break;
case ONIGENC_CTYPE_SPACE:
range = MBSpace;
break;
case ONIGENC_CTYPE_UPPER:
range = MBUpper;
break;
case ONIGENC_CTYPE_XDIGIT:
return FALSE;
break;
case ONIGENC_CTYPE_WORD:
range = MBWord;
break;
case ONIGENC_CTYPE_ASCII:
return FALSE;
break;
case ONIGENC_CTYPE_ALNUM:
range = MBAlnum;
break;
case ONIGENC_CTYPE_NEWLINE:
return FALSE;
break;
default:
return ONIGENCERR_TYPE_BUG;
break;
}
return onig_is_in_code_range((UChar* )range, code);
#else
if ((ctype & ONIGENC_CTYPE_WORD) != 0) {
#ifdef USE_INVALID_CODE_SCHEME
if (code <= VALID_CODE_LIMIT)
#endif
return TRUE;
}
#endif /* USE_UNICODE_FULL_RANGE_CTYPE */
return FALSE;
}
static UChar*
utf8_left_adjust_char_head(const UChar* start, const UChar* s)
{
const UChar *p;
if (s <= start) return (UChar* )s;
p = s;
while (!utf8_islead(*p) && p > start) p--;
return (UChar* )p;
}
OnigEncodingType OnigEncodingUTF8 = {
utf8_mbc_enc_len,
"UTF-8", /* name */
6, /* max byte length */
1, /* min byte length */
(ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE |
ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE |
ONIGENC_AMBIGUOUS_MATCH_COMPOUND),
{
(OnigCodePoint )'\\' /* esc */
, (OnigCodePoint )ONIG_INEFFECTIVE_META_CHAR /* anychar '.' */
, (OnigCodePoint )ONIG_INEFFECTIVE_META_CHAR /* anytime '*' */
, (OnigCodePoint )ONIG_INEFFECTIVE_META_CHAR /* zero or one time '?' */
, (OnigCodePoint )ONIG_INEFFECTIVE_META_CHAR /* one or more time '+' */
, (OnigCodePoint )ONIG_INEFFECTIVE_META_CHAR /* anychar anytime */
},
utf8_is_mbc_newline,
utf8_mbc_to_code,
utf8_code_to_mbclen,
utf8_code_to_mbc,
utf8_mbc_to_normalize,
utf8_is_mbc_ambiguous,
onigenc_iso_8859_1_get_all_pair_ambig_codes,
onigenc_ess_tsett_get_all_comp_ambig_codes,
utf8_is_code_ctype,
utf8_get_ctype_code_range,
utf8_left_adjust_char_head,
onigenc_always_true_is_allowed_reverse_match
};