зеркало из https://github.com/github/ruby.git
[DOC] Regexp doc (#7923)
This commit is contained in:
Родитель
6be402e172
Коммит
932dd9f10e
|
@ -6,3 +6,5 @@ NEWS
|
|||
syntax
|
||||
optparse
|
||||
rdoc
|
||||
regexp/methods.rdoc
|
||||
regexp/unicode_properties.rdoc
|
||||
|
|
1785
doc/regexp.rdoc
1785
doc/regexp.rdoc
Разница между файлами не показана из-за своего большого размера
Загрузить разницу
|
@ -0,0 +1,41 @@
|
|||
== \Regexp Methods
|
||||
|
||||
Each of these Ruby core methods can accept a regexp as an argument:
|
||||
|
||||
- Enumerable#all?
|
||||
- Enumerable#any?
|
||||
- Enumerable#grep
|
||||
- Enumerable#grep_v
|
||||
- Enumerable#none?
|
||||
- Enumerable#one?
|
||||
- Enumerable#slice_after
|
||||
- Enumerable#slice_before
|
||||
- Regexp#=~
|
||||
- Regexp#match
|
||||
- Regexp#match?
|
||||
- Regexp.new
|
||||
- Regexp.union
|
||||
- String#=~
|
||||
- String#[]=
|
||||
- String#byteindex
|
||||
- String#byterindex
|
||||
- String#gsub
|
||||
- String#gsub!
|
||||
- String#index
|
||||
- String#match
|
||||
- String#match?
|
||||
- String#partition
|
||||
- String#rindex
|
||||
- String#rpartition
|
||||
- String#scan
|
||||
- String#slice
|
||||
- String#slice!
|
||||
- String#split
|
||||
- String#start_with?
|
||||
- String#sub
|
||||
- String#sub!
|
||||
- Symbol#=~
|
||||
- Symbol#match
|
||||
- Symbol#match?
|
||||
- Symbol#slice
|
||||
- Symbol#start_with?
|
|
@ -0,0 +1,863 @@
|
|||
== \Regexps Based on Unicode Properties
|
||||
|
||||
The properties shown here are those currently supported in Ruby.
|
||||
Older versions may not support all of these;
|
||||
newer versions may support additional properties.
|
||||
|
||||
=== POSIX brackets
|
||||
|
||||
- <tt>/\p{Alpha}/</tt>
|
||||
- <tt>/\p{Blank}/</tt>
|
||||
- <tt>/\p{Cntrl}/</tt>
|
||||
- <tt>/\p{Digit}/</tt>
|
||||
- <tt>/\p{Graph}/</tt>
|
||||
- <tt>/\p{Lower}/</tt>
|
||||
- <tt>/\p{Print}/</tt>
|
||||
- <tt>/\p{Punct}/</tt>
|
||||
- <tt>/\p{Space}/</tt>
|
||||
- <tt>/\p{Upper}/</tt>
|
||||
- <tt>/\p{XDigit}/</tt>
|
||||
- <tt>/\p{Word}/</tt>
|
||||
- <tt>/\p{Alnum}/</tt>
|
||||
- <tt>/\p{ASCII}/</tt>
|
||||
- <tt>/\p{XPosixPunct}/</tt>
|
||||
|
||||
=== Special
|
||||
|
||||
- <tt>/\p{Any}/</tt>
|
||||
- <tt>/\p{Assigned}/</tt>
|
||||
|
||||
=== Major and General Categories
|
||||
|
||||
- <tt>/\p{C}/</tt>
|
||||
- <tt>/\p{Cc}/</tt>
|
||||
- <tt>/\p{Cf}/</tt>
|
||||
- <tt>/\p{Cn}/</tt>
|
||||
- <tt>/\p{Co}/</tt>
|
||||
- <tt>/\p{Cs}/</tt>
|
||||
- <tt>/\p{L}/</tt>
|
||||
- <tt>/\p{LC}/</tt>
|
||||
- <tt>/\p{Ll}/</tt>
|
||||
- <tt>/\p{Lm}/</tt>
|
||||
- <tt>/\p{Lo}/</tt>
|
||||
- <tt>/\p{Lt}/</tt>
|
||||
- <tt>/\p{Lu}/</tt>
|
||||
- <tt>/\p{M}/</tt>
|
||||
- <tt>/\p{Mc}/</tt>
|
||||
- <tt>/\p{Me}/</tt>
|
||||
- <tt>/\p{Mn}/</tt>
|
||||
- <tt>/\p{N}/</tt>
|
||||
- <tt>/\p{Nd}/</tt>
|
||||
- <tt>/\p{Nl}/</tt>
|
||||
- <tt>/\p{No}/</tt>
|
||||
- <tt>/\p{P}/</tt>
|
||||
- <tt>/\p{Pc}/</tt>
|
||||
- <tt>/\p{Pd}/</tt>
|
||||
- <tt>/\p{Pe}/</tt>
|
||||
- <tt>/\p{Pf}/</tt>
|
||||
- <tt>/\p{Pi}/</tt>
|
||||
- <tt>/\p{Po}/</tt>
|
||||
- <tt>/\p{Ps}/</tt>
|
||||
- <tt>/\p{S}/</tt>
|
||||
- <tt>/\p{Sc}/</tt>
|
||||
- <tt>/\p{Sk}/</tt>
|
||||
- <tt>/\p{Sm}/</tt>
|
||||
- <tt>/\p{So}/</tt>
|
||||
- <tt>/\p{Z}/</tt>
|
||||
- <tt>/\p{Zl}/</tt>
|
||||
- <tt>/\p{Zp}/</tt>
|
||||
- <tt>/\p{Zs}/</tt>
|
||||
|
||||
=== Scripts
|
||||
|
||||
- <tt>/\p{Adlam}/</tt>
|
||||
- <tt>/\p{Ahom}/</tt>
|
||||
- <tt>/\p{Anatolian_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{Arabic}/</tt>
|
||||
- <tt>/\p{Armenian}/</tt>
|
||||
- <tt>/\p{Avestan}/</tt>
|
||||
- <tt>/\p{Balinese}/</tt>
|
||||
- <tt>/\p{Bamum}/</tt>
|
||||
- <tt>/\p{Bassa_Vah}/</tt>
|
||||
- <tt>/\p{Batak}/</tt>
|
||||
- <tt>/\p{Bengali}/</tt>
|
||||
- <tt>/\p{Bhaiksuki}/</tt>
|
||||
- <tt>/\p{Bopomofo}/</tt>
|
||||
- <tt>/\p{Brahmi}/</tt>
|
||||
- <tt>/\p{Braille}/</tt>
|
||||
- <tt>/\p{Buginese}/</tt>
|
||||
- <tt>/\p{Buhid}/</tt>
|
||||
- <tt>/\p{Canadian_Aboriginal}/</tt>
|
||||
- <tt>/\p{Carian}/</tt>
|
||||
- <tt>/\p{Caucasian_Albanian}/</tt>
|
||||
- <tt>/\p{Chakma}/</tt>
|
||||
- <tt>/\p{Cham}/</tt>
|
||||
- <tt>/\p{Cherokee}/</tt>
|
||||
- <tt>/\p{Common}/</tt>
|
||||
- <tt>/\p{Coptic}/</tt>
|
||||
- <tt>/\p{Cuneiform}/</tt>
|
||||
- <tt>/\p{Cypriot}/</tt>
|
||||
- <tt>/\p{Cyrillic}/</tt>
|
||||
- <tt>/\p{Deseret}/</tt>
|
||||
- <tt>/\p{Devanagari}/</tt>
|
||||
- <tt>/\p{Dogra}/</tt>
|
||||
- <tt>/\p{Duployan}/</tt>
|
||||
- <tt>/\p{Egyptian_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{Elbasan}/</tt>
|
||||
- <tt>/\p{Elymaic}/</tt>
|
||||
- <tt>/\p{Ethiopic}/</tt>
|
||||
- <tt>/\p{Georgian}/</tt>
|
||||
- <tt>/\p{Glagolitic}/</tt>
|
||||
- <tt>/\p{Gothic}/</tt>
|
||||
- <tt>/\p{Grantha}/</tt>
|
||||
- <tt>/\p{Greek}/</tt>
|
||||
- <tt>/\p{Gujarati}/</tt>
|
||||
- <tt>/\p{Gunjala_Gondi}/</tt>
|
||||
- <tt>/\p{Gurmukhi}/</tt>
|
||||
- <tt>/\p{Han}/</tt>
|
||||
- <tt>/\p{Hangul}/</tt>
|
||||
- <tt>/\p{Hanifi_Rohingya}/</tt>
|
||||
- <tt>/\p{Hanunoo}/</tt>
|
||||
- <tt>/\p{Hatran}/</tt>
|
||||
- <tt>/\p{Hebrew}/</tt>
|
||||
- <tt>/\p{Hiragana}/</tt>
|
||||
- <tt>/\p{Imperial_Aramaic}/</tt>
|
||||
- <tt>/\p{Inherited}/</tt>
|
||||
- <tt>/\p{Inscriptional_Pahlavi}/</tt>
|
||||
- <tt>/\p{Inscriptional_Parthian}/</tt>
|
||||
- <tt>/\p{Javanese}/</tt>
|
||||
- <tt>/\p{Kaithi}/</tt>
|
||||
- <tt>/\p{Kannada}/</tt>
|
||||
- <tt>/\p{Katakana}/</tt>
|
||||
- <tt>/\p{Kayah_Li}/</tt>
|
||||
- <tt>/\p{Kharoshthi}/</tt>
|
||||
- <tt>/\p{Khmer}/</tt>
|
||||
- <tt>/\p{Khojki}/</tt>
|
||||
- <tt>/\p{Khudawadi}/</tt>
|
||||
- <tt>/\p{Lao}/</tt>
|
||||
- <tt>/\p{Latin}/</tt>
|
||||
- <tt>/\p{Lepcha}/</tt>
|
||||
- <tt>/\p{Limbu}/</tt>
|
||||
- <tt>/\p{Linear_A}/</tt>
|
||||
- <tt>/\p{Linear_B}/</tt>
|
||||
- <tt>/\p{Lisu}/</tt>
|
||||
- <tt>/\p{Lycian}/</tt>
|
||||
- <tt>/\p{Lydian}/</tt>
|
||||
- <tt>/\p{Mahajani}/</tt>
|
||||
- <tt>/\p{Makasar}/</tt>
|
||||
- <tt>/\p{Malayalam}/</tt>
|
||||
- <tt>/\p{Mandaic}/</tt>
|
||||
- <tt>/\p{Manichaean}/</tt>
|
||||
- <tt>/\p{Marchen}/</tt>
|
||||
- <tt>/\p{Masaram_Gondi}/</tt>
|
||||
- <tt>/\p{Medefaidrin}/</tt>
|
||||
- <tt>/\p{Meetei_Mayek}/</tt>
|
||||
- <tt>/\p{Mende_Kikakui}/</tt>
|
||||
- <tt>/\p{Meroitic_Cursive}/</tt>
|
||||
- <tt>/\p{Meroitic_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{Miao}/</tt>
|
||||
- <tt>/\p{Modi}/</tt>
|
||||
- <tt>/\p{Mongolian}/</tt>
|
||||
- <tt>/\p{Mro}/</tt>
|
||||
- <tt>/\p{Multani}/</tt>
|
||||
- <tt>/\p{Myanmar}/</tt>
|
||||
- <tt>/\p{Nabataean}/</tt>
|
||||
- <tt>/\p{Nandinagari}/</tt>
|
||||
- <tt>/\p{New_Tai_Lue}/</tt>
|
||||
- <tt>/\p{Newa}/</tt>
|
||||
- <tt>/\p{Nko}/</tt>
|
||||
- <tt>/\p{Nushu}/</tt>
|
||||
- <tt>/\p{Nyiakeng_Puachue_Hmong}/</tt>
|
||||
- <tt>/\p{Ogham}/</tt>
|
||||
- <tt>/\p{Ol_Chiki}/</tt>
|
||||
- <tt>/\p{Old_Hungarian}/</tt>
|
||||
- <tt>/\p{Old_Italic}/</tt>
|
||||
- <tt>/\p{Old_North_Arabian}/</tt>
|
||||
- <tt>/\p{Old_Permic}/</tt>
|
||||
- <tt>/\p{Old_Persian}/</tt>
|
||||
- <tt>/\p{Old_Sogdian}/</tt>
|
||||
- <tt>/\p{Old_South_Arabian}/</tt>
|
||||
- <tt>/\p{Old_Turkic}/</tt>
|
||||
- <tt>/\p{Oriya}/</tt>
|
||||
- <tt>/\p{Osage}/</tt>
|
||||
- <tt>/\p{Osmanya}/</tt>
|
||||
- <tt>/\p{Pahawh_Hmong}/</tt>
|
||||
- <tt>/\p{Palmyrene}/</tt>
|
||||
- <tt>/\p{Pau_Cin_Hau}/</tt>
|
||||
- <tt>/\p{Phags_Pa}/</tt>
|
||||
- <tt>/\p{Phoenician}/</tt>
|
||||
- <tt>/\p{Psalter_Pahlavi}/</tt>
|
||||
- <tt>/\p{Rejang}/</tt>
|
||||
- <tt>/\p{Runic}/</tt>
|
||||
- <tt>/\p{Samaritan}/</tt>
|
||||
- <tt>/\p{Saurashtra}/</tt>
|
||||
- <tt>/\p{Sharada}/</tt>
|
||||
- <tt>/\p{Shavian}/</tt>
|
||||
- <tt>/\p{Siddham}/</tt>
|
||||
- <tt>/\p{SignWriting}/</tt>
|
||||
- <tt>/\p{Sinhala}/</tt>
|
||||
- <tt>/\p{Sogdian}/</tt>
|
||||
- <tt>/\p{Sora_Sompeng}/</tt>
|
||||
- <tt>/\p{Soyombo}/</tt>
|
||||
- <tt>/\p{Sundanese}/</tt>
|
||||
- <tt>/\p{Syloti_Nagri}/</tt>
|
||||
- <tt>/\p{Syriac}/</tt>
|
||||
- <tt>/\p{Tagalog}/</tt>
|
||||
- <tt>/\p{Tagbanwa}/</tt>
|
||||
- <tt>/\p{Tai_Le}/</tt>
|
||||
- <tt>/\p{Tai_Tham}/</tt>
|
||||
- <tt>/\p{Tai_Viet}/</tt>
|
||||
- <tt>/\p{Takri}/</tt>
|
||||
- <tt>/\p{Tamil}/</tt>
|
||||
- <tt>/\p{Tangut}/</tt>
|
||||
- <tt>/\p{Telugu}/</tt>
|
||||
- <tt>/\p{Thaana}/</tt>
|
||||
- <tt>/\p{Thai}/</tt>
|
||||
- <tt>/\p{Tibetan}/</tt>
|
||||
- <tt>/\p{Tifinagh}/</tt>
|
||||
- <tt>/\p{Tirhuta}/</tt>
|
||||
- <tt>/\p{Ugaritic}/</tt>
|
||||
- <tt>/\p{Unknown}/</tt>
|
||||
- <tt>/\p{Vai}/</tt>
|
||||
- <tt>/\p{Wancho}/</tt>
|
||||
- <tt>/\p{Warang_Citi}/</tt>
|
||||
- <tt>/\p{Yi}/</tt>
|
||||
- <tt>/\p{Zanabazar_Square}/</tt>
|
||||
|
||||
=== Derived Core Properties
|
||||
|
||||
- <tt>/\p{Alphabetic}/</tt>
|
||||
- <tt>/\p{Case_Ignorable}/</tt>
|
||||
- <tt>/\p{Cased}/</tt>
|
||||
- <tt>/\p{Changes_When_Casefolded}/</tt>
|
||||
- <tt>/\p{Changes_When_Casemapped}/</tt>
|
||||
- <tt>/\p{Changes_When_Lowercased}/</tt>
|
||||
- <tt>/\p{Changes_When_Titlecased}/</tt>
|
||||
- <tt>/\p{Changes_When_Uppercased}/</tt>
|
||||
- <tt>/\p{Default_Ignorable_Code_Point}/</tt>
|
||||
- <tt>/\p{Grapheme_Base}/</tt>
|
||||
- <tt>/\p{Grapheme_Extend}/</tt>
|
||||
- <tt>/\p{Grapheme_Link}/</tt>
|
||||
- <tt>/\p{ID_Continue}/</tt>
|
||||
- <tt>/\p{ID_Start}/</tt>
|
||||
- <tt>/\p{Lowercase}/</tt>
|
||||
- <tt>/\p{Math}/</tt>
|
||||
- <tt>/\p{Uppercase}/</tt>
|
||||
- <tt>/\p{XID_Continue}/</tt>
|
||||
- <tt>/\p{XID_Start}/</tt>
|
||||
|
||||
=== Prop List
|
||||
|
||||
- <tt>/\p{ASCII_Hex_Digit}/</tt>
|
||||
- <tt>/\p{Bidi_Control}/</tt>
|
||||
- <tt>/\p{Dash}/</tt>
|
||||
- <tt>/\p{Deprecated}/</tt>
|
||||
- <tt>/\p{Diacritic}/</tt>
|
||||
- <tt>/\p{Extender}/</tt>
|
||||
- <tt>/\p{Hex_Digit}/</tt>
|
||||
- <tt>/\p{Hyphen}/</tt>
|
||||
- <tt>/\p{IDS_Binary_Operator}/</tt>
|
||||
- <tt>/\p{IDS_Trinary_Operator}/</tt>
|
||||
- <tt>/\p{Ideographic}/</tt>
|
||||
- <tt>/\p{Join_Control}/</tt>
|
||||
- <tt>/\p{Logical_Order_Exception}/</tt>
|
||||
- <tt>/\p{Noncharacter_Code_Point}/</tt>
|
||||
- <tt>/\p{Other_Alphabetic}/</tt>
|
||||
- <tt>/\p{Other_Default_Ignorable_Code_Point}/</tt>
|
||||
- <tt>/\p{Other_Grapheme_Extend}/</tt>
|
||||
- <tt>/\p{Other_ID_Continue}/</tt>
|
||||
- <tt>/\p{Other_ID_Start}/</tt>
|
||||
- <tt>/\p{Other_Lowercase}/</tt>
|
||||
- <tt>/\p{Other_Math}/</tt>
|
||||
- <tt>/\p{Other_Uppercase}/</tt>
|
||||
- <tt>/\p{Pattern_Syntax}/</tt>
|
||||
- <tt>/\p{Pattern_White_Space}/</tt>
|
||||
- <tt>/\p{Prepended_Concatenation_Mark}/</tt>
|
||||
- <tt>/\p{Quotation_Mark}/</tt>
|
||||
- <tt>/\p{Radical}/</tt>
|
||||
- <tt>/\p{Regional_Indicator}/</tt>
|
||||
- <tt>/\p{Sentence_Terminal}/</tt>
|
||||
- <tt>/\p{Soft_Dotted}/</tt>
|
||||
- <tt>/\p{Terminal_Punctuation}/</tt>
|
||||
- <tt>/\p{Unified_Ideograph}/</tt>
|
||||
- <tt>/\p{Variation_Selector}/</tt>
|
||||
- <tt>/\p{White_Space}/</tt>
|
||||
|
||||
=== Emoji
|
||||
|
||||
- <tt>/\p{Emoji}/</tt>
|
||||
- <tt>/\p{Emoji_Component}/</tt>
|
||||
- <tt>/\p{Emoji_Modifier}/</tt>
|
||||
- <tt>/\p{Emoji_Modifier_Base}/</tt>
|
||||
- <tt>/\p{Emoji_Presentation}/</tt>
|
||||
|
||||
=== Property Aliases
|
||||
|
||||
- <tt>/\p{AHex}/</tt>
|
||||
- <tt>/\p{Bidi_C}/</tt>
|
||||
- <tt>/\p{CI}/</tt>
|
||||
- <tt>/\p{CWCF}/</tt>
|
||||
- <tt>/\p{CWCM}/</tt>
|
||||
- <tt>/\p{CWL}/</tt>
|
||||
- <tt>/\p{CWT}/</tt>
|
||||
- <tt>/\p{CWU}/</tt>
|
||||
- <tt>/\p{DI}/</tt>
|
||||
- <tt>/\p{Dep}/</tt>
|
||||
- <tt>/\p{Dia}/</tt>
|
||||
- <tt>/\p{Ext}/</tt>
|
||||
- <tt>/\p{Gr_Base}/</tt>
|
||||
- <tt>/\p{Gr_Ext}/</tt>
|
||||
- <tt>/\p{Gr_Link}/</tt>
|
||||
- <tt>/\p{Hex}/</tt>
|
||||
- <tt>/\p{IDC}/</tt>
|
||||
- <tt>/\p{IDS}/</tt>
|
||||
- <tt>/\p{IDSB}/</tt>
|
||||
- <tt>/\p{IDST}/</tt>
|
||||
- <tt>/\p{Ideo}/</tt>
|
||||
- <tt>/\p{Join_C}/</tt>
|
||||
- <tt>/\p{LOE}/</tt>
|
||||
- <tt>/\p{NChar}/</tt>
|
||||
- <tt>/\p{OAlpha}/</tt>
|
||||
- <tt>/\p{ODI}/</tt>
|
||||
- <tt>/\p{OGr_Ext}/</tt>
|
||||
- <tt>/\p{OIDC}/</tt>
|
||||
- <tt>/\p{OIDS}/</tt>
|
||||
- <tt>/\p{OLower}/</tt>
|
||||
- <tt>/\p{OMath}/</tt>
|
||||
- <tt>/\p{OUpper}/</tt>
|
||||
- <tt>/\p{PCM}/</tt>
|
||||
- <tt>/\p{Pat_Syn}/</tt>
|
||||
- <tt>/\p{Pat_WS}/</tt>
|
||||
- <tt>/\p{QMark}/</tt>
|
||||
- <tt>/\p{RI}/</tt>
|
||||
- <tt>/\p{SD}/</tt>
|
||||
- <tt>/\p{STerm}/</tt>
|
||||
- <tt>/\p{Term}/</tt>
|
||||
- <tt>/\p{UIdeo}/</tt>
|
||||
- <tt>/\p{VS}/</tt>
|
||||
- <tt>/\p{WSpace}/</tt>
|
||||
- <tt>/\p{XIDC}/</tt>
|
||||
- <tt>/\p{XIDS}/</tt>
|
||||
|
||||
=== Property Value Aliases (General Category)
|
||||
|
||||
- <tt>/\p{Other}/</tt>
|
||||
- <tt>/\p{Control}/</tt>
|
||||
- <tt>/\p{Format}/</tt>
|
||||
- <tt>/\p{Unassigned}/</tt>
|
||||
- <tt>/\p{Private_Use}/</tt>
|
||||
- <tt>/\p{Surrogate}/</tt>
|
||||
- <tt>/\p{Letter}/</tt>
|
||||
- <tt>/\p{Cased_Letter}/</tt>
|
||||
- <tt>/\p{Lowercase_Letter}/</tt>
|
||||
- <tt>/\p{Modifier_Letter}/</tt>
|
||||
- <tt>/\p{Other_Letter}/</tt>
|
||||
- <tt>/\p{Titlecase_Letter}/</tt>
|
||||
- <tt>/\p{Uppercase_Letter}/</tt>
|
||||
- <tt>/\p{Mark}/</tt>
|
||||
- <tt>/\p{Combining_Mark}/</tt>
|
||||
- <tt>/\p{Spacing_Mark}/</tt>
|
||||
- <tt>/\p{Enclosing_Mark}/</tt>
|
||||
- <tt>/\p{Nonspacing_Mark}/</tt>
|
||||
- <tt>/\p{Number}/</tt>
|
||||
- <tt>/\p{Decimal_Number}/</tt>
|
||||
- <tt>/\p{Letter_Number}/</tt>
|
||||
- <tt>/\p{Other_Number}/</tt>
|
||||
- <tt>/\p{Punctuation}/</tt>
|
||||
- <tt>/\p{Connector_Punctuation}/</tt>
|
||||
- <tt>/\p{Dash_Punctuation}/</tt>
|
||||
- <tt>/\p{Close_Punctuation}/</tt>
|
||||
- <tt>/\p{Final_Punctuation}/</tt>
|
||||
- <tt>/\p{Initial_Punctuation}/</tt>
|
||||
- <tt>/\p{Other_Punctuation}/</tt>
|
||||
- <tt>/\p{Open_Punctuation}/</tt>
|
||||
- <tt>/\p{Symbol}/</tt>
|
||||
- <tt>/\p{Currency_Symbol}/</tt>
|
||||
- <tt>/\p{Modifier_Symbol}/</tt>
|
||||
- <tt>/\p{Math_Symbol}/</tt>
|
||||
- <tt>/\p{Other_Symbol}/</tt>
|
||||
- <tt>/\p{Separator}/</tt>
|
||||
- <tt>/\p{Line_Separator}/</tt>
|
||||
- <tt>/\p{Paragraph_Separator}/</tt>
|
||||
- <tt>/\p{Space_Separator}/</tt>
|
||||
|
||||
=== Property Value Aliases (Script)
|
||||
|
||||
- <tt>/\p{Adlm}/</tt>
|
||||
- <tt>/\p{Aghb}/</tt>
|
||||
- <tt>/\p{Arab}/</tt>
|
||||
- <tt>/\p{Armi}/</tt>
|
||||
- <tt>/\p{Armn}/</tt>
|
||||
- <tt>/\p{Avst}/</tt>
|
||||
- <tt>/\p{Bali}/</tt>
|
||||
- <tt>/\p{Bamu}/</tt>
|
||||
- <tt>/\p{Bass}/</tt>
|
||||
- <tt>/\p{Batk}/</tt>
|
||||
- <tt>/\p{Beng}/</tt>
|
||||
- <tt>/\p{Bhks}/</tt>
|
||||
- <tt>/\p{Bopo}/</tt>
|
||||
- <tt>/\p{Brah}/</tt>
|
||||
- <tt>/\p{Brai}/</tt>
|
||||
- <tt>/\p{Bugi}/</tt>
|
||||
- <tt>/\p{Buhd}/</tt>
|
||||
- <tt>/\p{Cakm}/</tt>
|
||||
- <tt>/\p{Cans}/</tt>
|
||||
- <tt>/\p{Cari}/</tt>
|
||||
- <tt>/\p{Cher}/</tt>
|
||||
- <tt>/\p{Copt}/</tt>
|
||||
- <tt>/\p{Qaac}/</tt>
|
||||
- <tt>/\p{Cprt}/</tt>
|
||||
- <tt>/\p{Cyrl}/</tt>
|
||||
- <tt>/\p{Deva}/</tt>
|
||||
- <tt>/\p{Dogr}/</tt>
|
||||
- <tt>/\p{Dsrt}/</tt>
|
||||
- <tt>/\p{Dupl}/</tt>
|
||||
- <tt>/\p{Egyp}/</tt>
|
||||
- <tt>/\p{Elba}/</tt>
|
||||
- <tt>/\p{Elym}/</tt>
|
||||
- <tt>/\p{Ethi}/</tt>
|
||||
- <tt>/\p{Geor}/</tt>
|
||||
- <tt>/\p{Glag}/</tt>
|
||||
- <tt>/\p{Gong}/</tt>
|
||||
- <tt>/\p{Gonm}/</tt>
|
||||
- <tt>/\p{Goth}/</tt>
|
||||
- <tt>/\p{Gran}/</tt>
|
||||
- <tt>/\p{Grek}/</tt>
|
||||
- <tt>/\p{Gujr}/</tt>
|
||||
- <tt>/\p{Guru}/</tt>
|
||||
- <tt>/\p{Hang}/</tt>
|
||||
- <tt>/\p{Hani}/</tt>
|
||||
- <tt>/\p{Hano}/</tt>
|
||||
- <tt>/\p{Hatr}/</tt>
|
||||
- <tt>/\p{Hebr}/</tt>
|
||||
- <tt>/\p{Hira}/</tt>
|
||||
- <tt>/\p{Hluw}/</tt>
|
||||
- <tt>/\p{Hmng}/</tt>
|
||||
- <tt>/\p{Hmnp}/</tt>
|
||||
- <tt>/\p{Hung}/</tt>
|
||||
- <tt>/\p{Ital}/</tt>
|
||||
- <tt>/\p{Java}/</tt>
|
||||
- <tt>/\p{Kali}/</tt>
|
||||
- <tt>/\p{Kana}/</tt>
|
||||
- <tt>/\p{Khar}/</tt>
|
||||
- <tt>/\p{Khmr}/</tt>
|
||||
- <tt>/\p{Khoj}/</tt>
|
||||
- <tt>/\p{Knda}/</tt>
|
||||
- <tt>/\p{Kthi}/</tt>
|
||||
- <tt>/\p{Lana}/</tt>
|
||||
- <tt>/\p{Laoo}/</tt>
|
||||
- <tt>/\p{Latn}/</tt>
|
||||
- <tt>/\p{Lepc}/</tt>
|
||||
- <tt>/\p{Limb}/</tt>
|
||||
- <tt>/\p{Lina}/</tt>
|
||||
- <tt>/\p{Linb}/</tt>
|
||||
- <tt>/\p{Lyci}/</tt>
|
||||
- <tt>/\p{Lydi}/</tt>
|
||||
- <tt>/\p{Mahj}/</tt>
|
||||
- <tt>/\p{Maka}/</tt>
|
||||
- <tt>/\p{Mand}/</tt>
|
||||
- <tt>/\p{Mani}/</tt>
|
||||
- <tt>/\p{Marc}/</tt>
|
||||
- <tt>/\p{Medf}/</tt>
|
||||
- <tt>/\p{Mend}/</tt>
|
||||
- <tt>/\p{Merc}/</tt>
|
||||
- <tt>/\p{Mero}/</tt>
|
||||
- <tt>/\p{Mlym}/</tt>
|
||||
- <tt>/\p{Mong}/</tt>
|
||||
- <tt>/\p{Mroo}/</tt>
|
||||
- <tt>/\p{Mtei}/</tt>
|
||||
- <tt>/\p{Mult}/</tt>
|
||||
- <tt>/\p{Mymr}/</tt>
|
||||
- <tt>/\p{Nand}/</tt>
|
||||
- <tt>/\p{Narb}/</tt>
|
||||
- <tt>/\p{Nbat}/</tt>
|
||||
- <tt>/\p{Nkoo}/</tt>
|
||||
- <tt>/\p{Nshu}/</tt>
|
||||
- <tt>/\p{Ogam}/</tt>
|
||||
- <tt>/\p{Olck}/</tt>
|
||||
- <tt>/\p{Orkh}/</tt>
|
||||
- <tt>/\p{Orya}/</tt>
|
||||
- <tt>/\p{Osge}/</tt>
|
||||
- <tt>/\p{Osma}/</tt>
|
||||
- <tt>/\p{Palm}/</tt>
|
||||
- <tt>/\p{Pauc}/</tt>
|
||||
- <tt>/\p{Perm}/</tt>
|
||||
- <tt>/\p{Phag}/</tt>
|
||||
- <tt>/\p{Phli}/</tt>
|
||||
- <tt>/\p{Phlp}/</tt>
|
||||
- <tt>/\p{Phnx}/</tt>
|
||||
- <tt>/\p{Plrd}/</tt>
|
||||
- <tt>/\p{Prti}/</tt>
|
||||
- <tt>/\p{Rjng}/</tt>
|
||||
- <tt>/\p{Rohg}/</tt>
|
||||
- <tt>/\p{Runr}/</tt>
|
||||
- <tt>/\p{Samr}/</tt>
|
||||
- <tt>/\p{Sarb}/</tt>
|
||||
- <tt>/\p{Saur}/</tt>
|
||||
- <tt>/\p{Sgnw}/</tt>
|
||||
- <tt>/\p{Shaw}/</tt>
|
||||
- <tt>/\p{Shrd}/</tt>
|
||||
- <tt>/\p{Sidd}/</tt>
|
||||
- <tt>/\p{Sind}/</tt>
|
||||
- <tt>/\p{Sinh}/</tt>
|
||||
- <tt>/\p{Sogd}/</tt>
|
||||
- <tt>/\p{Sogo}/</tt>
|
||||
- <tt>/\p{Sora}/</tt>
|
||||
- <tt>/\p{Soyo}/</tt>
|
||||
- <tt>/\p{Sund}/</tt>
|
||||
- <tt>/\p{Sylo}/</tt>
|
||||
- <tt>/\p{Syrc}/</tt>
|
||||
- <tt>/\p{Tagb}/</tt>
|
||||
- <tt>/\p{Takr}/</tt>
|
||||
- <tt>/\p{Tale}/</tt>
|
||||
- <tt>/\p{Talu}/</tt>
|
||||
- <tt>/\p{Taml}/</tt>
|
||||
- <tt>/\p{Tang}/</tt>
|
||||
- <tt>/\p{Tavt}/</tt>
|
||||
- <tt>/\p{Telu}/</tt>
|
||||
- <tt>/\p{Tfng}/</tt>
|
||||
- <tt>/\p{Tglg}/</tt>
|
||||
- <tt>/\p{Thaa}/</tt>
|
||||
- <tt>/\p{Tibt}/</tt>
|
||||
- <tt>/\p{Tirh}/</tt>
|
||||
- <tt>/\p{Ugar}/</tt>
|
||||
- <tt>/\p{Vaii}/</tt>
|
||||
- <tt>/\p{Wara}/</tt>
|
||||
- <tt>/\p{Wcho}/</tt>
|
||||
- <tt>/\p{Xpeo}/</tt>
|
||||
- <tt>/\p{Xsux}/</tt>
|
||||
- <tt>/\p{Yiii}/</tt>
|
||||
- <tt>/\p{Zanb}/</tt>
|
||||
- <tt>/\p{Zinh}/</tt>
|
||||
- <tt>/\p{Qaai}/</tt>
|
||||
- <tt>/\p{Zyyy}/</tt>
|
||||
- <tt>/\p{Zzzz}/</tt>
|
||||
|
||||
=== Derived Ages
|
||||
|
||||
- <tt>/\p{Age=1.1}/</tt>
|
||||
- <tt>/\p{Age=10.0}/</tt>
|
||||
- <tt>/\p{Age=11.0}/</tt>
|
||||
- <tt>/\p{Age=12.0}/</tt>
|
||||
- <tt>/\p{Age=12.1}/</tt>
|
||||
- <tt>/\p{Age=2.0}/</tt>
|
||||
- <tt>/\p{Age=2.1}/</tt>
|
||||
- <tt>/\p{Age=3.0}/</tt>
|
||||
- <tt>/\p{Age=3.1}/</tt>
|
||||
- <tt>/\p{Age=3.2}/</tt>
|
||||
- <tt>/\p{Age=4.0}/</tt>
|
||||
- <tt>/\p{Age=4.1}/</tt>
|
||||
- <tt>/\p{Age=5.0}/</tt>
|
||||
- <tt>/\p{Age=5.1}/</tt>
|
||||
- <tt>/\p{Age=5.2}/</tt>
|
||||
- <tt>/\p{Age=6.0}/</tt>
|
||||
- <tt>/\p{Age=6.1}/</tt>
|
||||
- <tt>/\p{Age=6.2}/</tt>
|
||||
- <tt>/\p{Age=6.3}/</tt>
|
||||
- <tt>/\p{Age=7.0}/</tt>
|
||||
- <tt>/\p{Age=8.0}/</tt>
|
||||
- <tt>/\p{Age=9.0}/</tt>
|
||||
|
||||
=== Blocks
|
||||
|
||||
- <tt>/\p{In_Basic_Latin}/</tt>
|
||||
- <tt>/\p{In_Latin_1_Supplement}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_B}/</tt>
|
||||
- <tt>/\p{In_IPA_Extensions}/</tt>
|
||||
- <tt>/\p{In_Spacing_Modifier_Letters}/</tt>
|
||||
- <tt>/\p{In_Combining_Diacritical_Marks}/</tt>
|
||||
- <tt>/\p{In_Greek_and_Coptic}/</tt>
|
||||
- <tt>/\p{In_Cyrillic}/</tt>
|
||||
- <tt>/\p{In_Cyrillic_Supplement}/</tt>
|
||||
- <tt>/\p{In_Armenian}/</tt>
|
||||
- <tt>/\p{In_Hebrew}/</tt>
|
||||
- <tt>/\p{In_Arabic}/</tt>
|
||||
- <tt>/\p{In_Syriac}/</tt>
|
||||
- <tt>/\p{In_Arabic_Supplement}/</tt>
|
||||
- <tt>/\p{In_Thaana}/</tt>
|
||||
- <tt>/\p{In_NKo}/</tt>
|
||||
- <tt>/\p{In_Samaritan}/</tt>
|
||||
- <tt>/\p{In_Mandaic}/</tt>
|
||||
- <tt>/\p{In_Syriac_Supplement}/</tt>
|
||||
- <tt>/\p{In_Arabic_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Devanagari}/</tt>
|
||||
- <tt>/\p{In_Bengali}/</tt>
|
||||
- <tt>/\p{In_Gurmukhi}/</tt>
|
||||
- <tt>/\p{In_Gujarati}/</tt>
|
||||
- <tt>/\p{In_Oriya}/</tt>
|
||||
- <tt>/\p{In_Tamil}/</tt>
|
||||
- <tt>/\p{In_Telugu}/</tt>
|
||||
- <tt>/\p{In_Kannada}/</tt>
|
||||
- <tt>/\p{In_Malayalam}/</tt>
|
||||
- <tt>/\p{In_Sinhala}/</tt>
|
||||
- <tt>/\p{In_Thai}/</tt>
|
||||
- <tt>/\p{In_Lao}/</tt>
|
||||
- <tt>/\p{In_Tibetan}/</tt>
|
||||
- <tt>/\p{In_Myanmar}/</tt>
|
||||
- <tt>/\p{In_Georgian}/</tt>
|
||||
- <tt>/\p{In_Hangul_Jamo}/</tt>
|
||||
- <tt>/\p{In_Ethiopic}/</tt>
|
||||
- <tt>/\p{In_Ethiopic_Supplement}/</tt>
|
||||
- <tt>/\p{In_Cherokee}/</tt>
|
||||
- <tt>/\p{In_Unified_Canadian_Aboriginal_Syllabics}/</tt>
|
||||
- <tt>/\p{In_Ogham}/</tt>
|
||||
- <tt>/\p{In_Runic}/</tt>
|
||||
- <tt>/\p{In_Tagalog}/</tt>
|
||||
- <tt>/\p{In_Hanunoo}/</tt>
|
||||
- <tt>/\p{In_Buhid}/</tt>
|
||||
- <tt>/\p{In_Tagbanwa}/</tt>
|
||||
- <tt>/\p{In_Khmer}/</tt>
|
||||
- <tt>/\p{In_Mongolian}/</tt>
|
||||
- <tt>/\p{In_Unified_Canadian_Aboriginal_Syllabics_Extended}/</tt>
|
||||
- <tt>/\p{In_Limbu}/</tt>
|
||||
- <tt>/\p{In_Tai_Le}/</tt>
|
||||
- <tt>/\p{In_New_Tai_Lue}/</tt>
|
||||
- <tt>/\p{In_Khmer_Symbols}/</tt>
|
||||
- <tt>/\p{In_Buginese}/</tt>
|
||||
- <tt>/\p{In_Tai_Tham}/</tt>
|
||||
- <tt>/\p{In_Combining_Diacritical_Marks_Extended}/</tt>
|
||||
- <tt>/\p{In_Balinese}/</tt>
|
||||
- <tt>/\p{In_Sundanese}/</tt>
|
||||
- <tt>/\p{In_Batak}/</tt>
|
||||
- <tt>/\p{In_Lepcha}/</tt>
|
||||
- <tt>/\p{In_Ol_Chiki}/</tt>
|
||||
- <tt>/\p{In_Cyrillic_Extended_C}/</tt>
|
||||
- <tt>/\p{In_Georgian_Extended}/</tt>
|
||||
- <tt>/\p{In_Sundanese_Supplement}/</tt>
|
||||
- <tt>/\p{In_Vedic_Extensions}/</tt>
|
||||
- <tt>/\p{In_Phonetic_Extensions}/</tt>
|
||||
- <tt>/\p{In_Phonetic_Extensions_Supplement}/</tt>
|
||||
- <tt>/\p{In_Combining_Diacritical_Marks_Supplement}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_Additional}/</tt>
|
||||
- <tt>/\p{In_Greek_Extended}/</tt>
|
||||
- <tt>/\p{In_General_Punctuation}/</tt>
|
||||
- <tt>/\p{In_Superscripts_and_Subscripts}/</tt>
|
||||
- <tt>/\p{In_Currency_Symbols}/</tt>
|
||||
- <tt>/\p{In_Combining_Diacritical_Marks_for_Symbols}/</tt>
|
||||
- <tt>/\p{In_Letterlike_Symbols}/</tt>
|
||||
- <tt>/\p{In_Number_Forms}/</tt>
|
||||
- <tt>/\p{In_Arrows}/</tt>
|
||||
- <tt>/\p{In_Mathematical_Operators}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Technical}/</tt>
|
||||
- <tt>/\p{In_Control_Pictures}/</tt>
|
||||
- <tt>/\p{In_Optical_Character_Recognition}/</tt>
|
||||
- <tt>/\p{In_Enclosed_Alphanumerics}/</tt>
|
||||
- <tt>/\p{In_Box_Drawing}/</tt>
|
||||
- <tt>/\p{In_Block_Elements}/</tt>
|
||||
- <tt>/\p{In_Geometric_Shapes}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Symbols}/</tt>
|
||||
- <tt>/\p{In_Dingbats}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Mathematical_Symbols_A}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Arrows_A}/</tt>
|
||||
- <tt>/\p{In_Braille_Patterns}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Arrows_B}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Mathematical_Symbols_B}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Mathematical_Operators}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Symbols_and_Arrows}/</tt>
|
||||
- <tt>/\p{In_Glagolitic}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_C}/</tt>
|
||||
- <tt>/\p{In_Coptic}/</tt>
|
||||
- <tt>/\p{In_Georgian_Supplement}/</tt>
|
||||
- <tt>/\p{In_Tifinagh}/</tt>
|
||||
- <tt>/\p{In_Ethiopic_Extended}/</tt>
|
||||
- <tt>/\p{In_Cyrillic_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Punctuation}/</tt>
|
||||
- <tt>/\p{In_CJK_Radicals_Supplement}/</tt>
|
||||
- <tt>/\p{In_Kangxi_Radicals}/</tt>
|
||||
- <tt>/\p{In_Ideographic_Description_Characters}/</tt>
|
||||
- <tt>/\p{In_CJK_Symbols_and_Punctuation}/</tt>
|
||||
- <tt>/\p{In_Hiragana}/</tt>
|
||||
- <tt>/\p{In_Katakana}/</tt>
|
||||
- <tt>/\p{In_Bopomofo}/</tt>
|
||||
- <tt>/\p{In_Hangul_Compatibility_Jamo}/</tt>
|
||||
- <tt>/\p{In_Kanbun}/</tt>
|
||||
- <tt>/\p{In_Bopomofo_Extended}/</tt>
|
||||
- <tt>/\p{In_CJK_Strokes}/</tt>
|
||||
- <tt>/\p{In_Katakana_Phonetic_Extensions}/</tt>
|
||||
- <tt>/\p{In_Enclosed_CJK_Letters_and_Months}/</tt>
|
||||
- <tt>/\p{In_CJK_Compatibility}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_A}/</tt>
|
||||
- <tt>/\p{In_Yijing_Hexagram_Symbols}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs}/</tt>
|
||||
- <tt>/\p{In_Yi_Syllables}/</tt>
|
||||
- <tt>/\p{In_Yi_Radicals}/</tt>
|
||||
- <tt>/\p{In_Lisu}/</tt>
|
||||
- <tt>/\p{In_Vai}/</tt>
|
||||
- <tt>/\p{In_Cyrillic_Extended_B}/</tt>
|
||||
- <tt>/\p{In_Bamum}/</tt>
|
||||
- <tt>/\p{In_Modifier_Tone_Letters}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_D}/</tt>
|
||||
- <tt>/\p{In_Syloti_Nagri}/</tt>
|
||||
- <tt>/\p{In_Common_Indic_Number_Forms}/</tt>
|
||||
- <tt>/\p{In_Phags_pa}/</tt>
|
||||
- <tt>/\p{In_Saurashtra}/</tt>
|
||||
- <tt>/\p{In_Devanagari_Extended}/</tt>
|
||||
- <tt>/\p{In_Kayah_Li}/</tt>
|
||||
- <tt>/\p{In_Rejang}/</tt>
|
||||
- <tt>/\p{In_Hangul_Jamo_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Javanese}/</tt>
|
||||
- <tt>/\p{In_Myanmar_Extended_B}/</tt>
|
||||
- <tt>/\p{In_Cham}/</tt>
|
||||
- <tt>/\p{In_Myanmar_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Tai_Viet}/</tt>
|
||||
- <tt>/\p{In_Meetei_Mayek_Extensions}/</tt>
|
||||
- <tt>/\p{In_Ethiopic_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Latin_Extended_E}/</tt>
|
||||
- <tt>/\p{In_Cherokee_Supplement}/</tt>
|
||||
- <tt>/\p{In_Meetei_Mayek}/</tt>
|
||||
- <tt>/\p{In_Hangul_Syllables}/</tt>
|
||||
- <tt>/\p{In_Hangul_Jamo_Extended_B}/</tt>
|
||||
- <tt>/\p{In_High_Surrogates}/</tt>
|
||||
- <tt>/\p{In_High_Private_Use_Surrogates}/</tt>
|
||||
- <tt>/\p{In_Low_Surrogates}/</tt>
|
||||
- <tt>/\p{In_Private_Use_Area}/</tt>
|
||||
- <tt>/\p{In_CJK_Compatibility_Ideographs}/</tt>
|
||||
- <tt>/\p{In_Alphabetic_Presentation_Forms}/</tt>
|
||||
- <tt>/\p{In_Arabic_Presentation_Forms_A}/</tt>
|
||||
- <tt>/\p{In_Variation_Selectors}/</tt>
|
||||
- <tt>/\p{In_Vertical_Forms}/</tt>
|
||||
- <tt>/\p{In_Combining_Half_Marks}/</tt>
|
||||
- <tt>/\p{In_CJK_Compatibility_Forms}/</tt>
|
||||
- <tt>/\p{In_Small_Form_Variants}/</tt>
|
||||
- <tt>/\p{In_Arabic_Presentation_Forms_B}/</tt>
|
||||
- <tt>/\p{In_Halfwidth_and_Fullwidth_Forms}/</tt>
|
||||
- <tt>/\p{In_Specials}/</tt>
|
||||
- <tt>/\p{In_Linear_B_Syllabary}/</tt>
|
||||
- <tt>/\p{In_Linear_B_Ideograms}/</tt>
|
||||
- <tt>/\p{In_Aegean_Numbers}/</tt>
|
||||
- <tt>/\p{In_Ancient_Greek_Numbers}/</tt>
|
||||
- <tt>/\p{In_Ancient_Symbols}/</tt>
|
||||
- <tt>/\p{In_Phaistos_Disc}/</tt>
|
||||
- <tt>/\p{In_Lycian}/</tt>
|
||||
- <tt>/\p{In_Carian}/</tt>
|
||||
- <tt>/\p{In_Coptic_Epact_Numbers}/</tt>
|
||||
- <tt>/\p{In_Old_Italic}/</tt>
|
||||
- <tt>/\p{In_Gothic}/</tt>
|
||||
- <tt>/\p{In_Old_Permic}/</tt>
|
||||
- <tt>/\p{In_Ugaritic}/</tt>
|
||||
- <tt>/\p{In_Old_Persian}/</tt>
|
||||
- <tt>/\p{In_Deseret}/</tt>
|
||||
- <tt>/\p{In_Shavian}/</tt>
|
||||
- <tt>/\p{In_Osmanya}/</tt>
|
||||
- <tt>/\p{In_Osage}/</tt>
|
||||
- <tt>/\p{In_Elbasan}/</tt>
|
||||
- <tt>/\p{In_Caucasian_Albanian}/</tt>
|
||||
- <tt>/\p{In_Linear_A}/</tt>
|
||||
- <tt>/\p{In_Cypriot_Syllabary}/</tt>
|
||||
- <tt>/\p{In_Imperial_Aramaic}/</tt>
|
||||
- <tt>/\p{In_Palmyrene}/</tt>
|
||||
- <tt>/\p{In_Nabataean}/</tt>
|
||||
- <tt>/\p{In_Hatran}/</tt>
|
||||
- <tt>/\p{In_Phoenician}/</tt>
|
||||
- <tt>/\p{In_Lydian}/</tt>
|
||||
- <tt>/\p{In_Meroitic_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{In_Meroitic_Cursive}/</tt>
|
||||
- <tt>/\p{In_Kharoshthi}/</tt>
|
||||
- <tt>/\p{In_Old_South_Arabian}/</tt>
|
||||
- <tt>/\p{In_Old_North_Arabian}/</tt>
|
||||
- <tt>/\p{In_Manichaean}/</tt>
|
||||
- <tt>/\p{In_Avestan}/</tt>
|
||||
- <tt>/\p{In_Inscriptional_Parthian}/</tt>
|
||||
- <tt>/\p{In_Inscriptional_Pahlavi}/</tt>
|
||||
- <tt>/\p{In_Psalter_Pahlavi}/</tt>
|
||||
- <tt>/\p{In_Old_Turkic}/</tt>
|
||||
- <tt>/\p{In_Old_Hungarian}/</tt>
|
||||
- <tt>/\p{In_Hanifi_Rohingya}/</tt>
|
||||
- <tt>/\p{In_Rumi_Numeral_Symbols}/</tt>
|
||||
- <tt>/\p{In_Old_Sogdian}/</tt>
|
||||
- <tt>/\p{In_Sogdian}/</tt>
|
||||
- <tt>/\p{In_Elymaic}/</tt>
|
||||
- <tt>/\p{In_Brahmi}/</tt>
|
||||
- <tt>/\p{In_Kaithi}/</tt>
|
||||
- <tt>/\p{In_Sora_Sompeng}/</tt>
|
||||
- <tt>/\p{In_Chakma}/</tt>
|
||||
- <tt>/\p{In_Mahajani}/</tt>
|
||||
- <tt>/\p{In_Sharada}/</tt>
|
||||
- <tt>/\p{In_Sinhala_Archaic_Numbers}/</tt>
|
||||
- <tt>/\p{In_Khojki}/</tt>
|
||||
- <tt>/\p{In_Multani}/</tt>
|
||||
- <tt>/\p{In_Khudawadi}/</tt>
|
||||
- <tt>/\p{In_Grantha}/</tt>
|
||||
- <tt>/\p{In_Newa}/</tt>
|
||||
- <tt>/\p{In_Tirhuta}/</tt>
|
||||
- <tt>/\p{In_Siddham}/</tt>
|
||||
- <tt>/\p{In_Modi}/</tt>
|
||||
- <tt>/\p{In_Mongolian_Supplement}/</tt>
|
||||
- <tt>/\p{In_Takri}/</tt>
|
||||
- <tt>/\p{In_Ahom}/</tt>
|
||||
- <tt>/\p{In_Dogra}/</tt>
|
||||
- <tt>/\p{In_Warang_Citi}/</tt>
|
||||
- <tt>/\p{In_Nandinagari}/</tt>
|
||||
- <tt>/\p{In_Zanabazar_Square}/</tt>
|
||||
- <tt>/\p{In_Soyombo}/</tt>
|
||||
- <tt>/\p{In_Pau_Cin_Hau}/</tt>
|
||||
- <tt>/\p{In_Bhaiksuki}/</tt>
|
||||
- <tt>/\p{In_Marchen}/</tt>
|
||||
- <tt>/\p{In_Masaram_Gondi}/</tt>
|
||||
- <tt>/\p{In_Gunjala_Gondi}/</tt>
|
||||
- <tt>/\p{In_Makasar}/</tt>
|
||||
- <tt>/\p{In_Tamil_Supplement}/</tt>
|
||||
- <tt>/\p{In_Cuneiform}/</tt>
|
||||
- <tt>/\p{In_Cuneiform_Numbers_and_Punctuation}/</tt>
|
||||
- <tt>/\p{In_Early_Dynastic_Cuneiform}/</tt>
|
||||
- <tt>/\p{In_Egyptian_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{In_Egyptian_Hieroglyph_Format_Controls}/</tt>
|
||||
- <tt>/\p{In_Anatolian_Hieroglyphs}/</tt>
|
||||
- <tt>/\p{In_Bamum_Supplement}/</tt>
|
||||
- <tt>/\p{In_Mro}/</tt>
|
||||
- <tt>/\p{In_Bassa_Vah}/</tt>
|
||||
- <tt>/\p{In_Pahawh_Hmong}/</tt>
|
||||
- <tt>/\p{In_Medefaidrin}/</tt>
|
||||
- <tt>/\p{In_Miao}/</tt>
|
||||
- <tt>/\p{In_Ideographic_Symbols_and_Punctuation}/</tt>
|
||||
- <tt>/\p{In_Tangut}/</tt>
|
||||
- <tt>/\p{In_Tangut_Components}/</tt>
|
||||
- <tt>/\p{In_Kana_Supplement}/</tt>
|
||||
- <tt>/\p{In_Kana_Extended_A}/</tt>
|
||||
- <tt>/\p{In_Small_Kana_Extension}/</tt>
|
||||
- <tt>/\p{In_Nushu}/</tt>
|
||||
- <tt>/\p{In_Duployan}/</tt>
|
||||
- <tt>/\p{In_Shorthand_Format_Controls}/</tt>
|
||||
- <tt>/\p{In_Byzantine_Musical_Symbols}/</tt>
|
||||
- <tt>/\p{In_Musical_Symbols}/</tt>
|
||||
- <tt>/\p{In_Ancient_Greek_Musical_Notation}/</tt>
|
||||
- <tt>/\p{In_Mayan_Numerals}/</tt>
|
||||
- <tt>/\p{In_Tai_Xuan_Jing_Symbols}/</tt>
|
||||
- <tt>/\p{In_Counting_Rod_Numerals}/</tt>
|
||||
- <tt>/\p{In_Mathematical_Alphanumeric_Symbols}/</tt>
|
||||
- <tt>/\p{In_Sutton_SignWriting}/</tt>
|
||||
- <tt>/\p{In_Glagolitic_Supplement}/</tt>
|
||||
- <tt>/\p{In_Nyiakeng_Puachue_Hmong}/</tt>
|
||||
- <tt>/\p{In_Wancho}/</tt>
|
||||
- <tt>/\p{In_Mende_Kikakui}/</tt>
|
||||
- <tt>/\p{In_Adlam}/</tt>
|
||||
- <tt>/\p{In_Indic_Siyaq_Numbers}/</tt>
|
||||
- <tt>/\p{In_Ottoman_Siyaq_Numbers}/</tt>
|
||||
- <tt>/\p{In_Arabic_Mathematical_Alphabetic_Symbols}/</tt>
|
||||
- <tt>/\p{In_Mahjong_Tiles}/</tt>
|
||||
- <tt>/\p{In_Domino_Tiles}/</tt>
|
||||
- <tt>/\p{In_Playing_Cards}/</tt>
|
||||
- <tt>/\p{In_Enclosed_Alphanumeric_Supplement}/</tt>
|
||||
- <tt>/\p{In_Enclosed_Ideographic_Supplement}/</tt>
|
||||
- <tt>/\p{In_Miscellaneous_Symbols_and_Pictographs}/</tt>
|
||||
- <tt>/\p{In_Emoticons}/</tt>
|
||||
- <tt>/\p{In_Ornamental_Dingbats}/</tt>
|
||||
- <tt>/\p{In_Transport_and_Map_Symbols}/</tt>
|
||||
- <tt>/\p{In_Alchemical_Symbols}/</tt>
|
||||
- <tt>/\p{In_Geometric_Shapes_Extended}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Arrows_C}/</tt>
|
||||
- <tt>/\p{In_Supplemental_Symbols_and_Pictographs}/</tt>
|
||||
- <tt>/\p{In_Chess_Symbols}/</tt>
|
||||
- <tt>/\p{In_Symbols_and_Pictographs_Extended_A}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_B}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_C}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_D}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_E}/</tt>
|
||||
- <tt>/\p{In_CJK_Unified_Ideographs_Extension_F}/</tt>
|
||||
- <tt>/\p{In_CJK_Compatibility_Ideographs_Supplement}/</tt>
|
||||
- <tt>/\p{In_Tags}/</tt>
|
||||
- <tt>/\p{In_Variation_Selectors_Supplement}/</tt>
|
||||
- <tt>/\p{In_Supplementary_Private_Use_Area_A}/</tt>
|
||||
- <tt>/\p{In_Supplementary_Private_Use_Area_B}/</tt>
|
||||
- <tt>/\p{In_No_Block}/</tt>
|
|
@ -414,9 +414,9 @@ slash (<tt>'/'</tt>) characters:
|
|||
re = /foo/ # => /foo/
|
||||
re.class # => Regexp
|
||||
|
||||
The trailing slash may be followed by one or more _flag_ characters
|
||||
that modify the behavior.
|
||||
See {Regexp options}[rdoc-ref:Regexp@Options] for details.
|
||||
The trailing slash may be followed by one or more modifier characters
|
||||
that set modes for the regexp.
|
||||
See {Regexp modes}[rdoc-ref:Regexp@Modes] for details.
|
||||
|
||||
Interpolation may be used inside regular expressions along with escaped
|
||||
characters. Note that a regular expression may require additional escaped
|
||||
|
@ -523,9 +523,9 @@ A few "symmetrical" character pairs may be used as delimiters:
|
|||
%r(foo) # => /foo/
|
||||
%r<foo> # => /foo/
|
||||
|
||||
The trailing delimiter may be followed by one or more _flag_ characters
|
||||
that modify the behavior.
|
||||
See {Regexp options}[rdoc-ref:Regexp@Options] for details.
|
||||
The trailing delimiter may be followed by one or more modifier characters
|
||||
that set modes for the regexp.
|
||||
See {Regexp modes}[rdoc-ref:Regexp@Modes] for details.
|
||||
|
||||
=== <tt>%x</tt>: Backtick Literals
|
||||
|
||||
|
|
8
re.c
8
re.c
|
@ -538,7 +538,7 @@ static VALUE rb_reg_str_with_term(VALUE re, int term);
|
|||
*
|
||||
* The returned string may be used as an argument to Regexp.new,
|
||||
* or as interpolated text for a
|
||||
* {Regexp literal}[rdoc-ref:regexp.rdoc@Regexp+Literal]:
|
||||
* {Regexp interpolation}[rdoc-ref:regexp.rdoc@Interpolation+Mode]:
|
||||
*
|
||||
* r1 = Regexp.new(s0) # => /(?ix-m:ab+c)/
|
||||
* r2 = /#{s0}/ # => /(?ix-m:ab+c)/
|
||||
|
@ -3568,7 +3568,7 @@ reg_match_pos(VALUE re, VALUE *strp, long pos, VALUE* set_match)
|
|||
* Returns the integer index (in characters) of the first match
|
||||
* for +self+ and +string+, or +nil+ if none;
|
||||
* also sets the
|
||||
* {rdoc-ref:Regexp Global Variables}[rdoc-ref:Regexp@Regexp+Global+Variables]:
|
||||
* {Regexp global variables}[rdoc-ref:Regexp@Global+Variables]:
|
||||
*
|
||||
* /at/ =~ 'input data' # => 7
|
||||
* $~ # => #<MatchData "at">
|
||||
|
@ -3581,7 +3581,7 @@ reg_match_pos(VALUE re, VALUE *strp, long pos, VALUE* set_match)
|
|||
* - Is a regexp literal;
|
||||
* see {Regexp Literals}[rdoc-ref:literals.rdoc@Regexp+Literals].
|
||||
* - Does not contain interpolations;
|
||||
* see {Regexp Interpolation}[rdoc-ref:Regexp@Regexp+Interpolation].
|
||||
* see {Regexp interpolation}[rdoc-ref:Regexp@Interpolation+Mode].
|
||||
* - Is at the left of the expression.
|
||||
*
|
||||
* Example:
|
||||
|
@ -4559,7 +4559,7 @@ match_setter(VALUE val, ID _x, VALUE *_y)
|
|||
*
|
||||
* With no argument, returns the value of <tt>$~</tt>,
|
||||
* which is the result of the most recent pattern match
|
||||
* (see {Regexp Global Variables}[rdoc-ref:Regexp@Regexp+Global+Variables]):
|
||||
* (see {Regexp global variables}[rdoc-ref:Regexp@Global+Variables]):
|
||||
*
|
||||
* /c(.)t/ =~ 'cat' # => 0
|
||||
* Regexp.last_match # => #<MatchData "cat" 1:"a">
|
||||
|
|
6
string.c
6
string.c
|
@ -4348,7 +4348,7 @@ rb_str_byterindex_m(int argc, VALUE *argv, VALUE str)
|
|||
* 'foo' =~ /o/ # => 1
|
||||
* 'foo' =~ /x/ # => nil
|
||||
*
|
||||
* Note: also updates Regexp@Special+global+variables.
|
||||
* Note: also updates Regexp@Global+Variables.
|
||||
*
|
||||
* If the given +object+ is not a \Regexp, returns the value
|
||||
* returned by <tt>object =~ self</tt>.
|
||||
|
@ -4390,7 +4390,7 @@ static VALUE get_pat(VALUE);
|
|||
*
|
||||
* Returns a \MatchData object (or +nil+) based on +self+ and the given +pattern+.
|
||||
*
|
||||
* Note: also updates Regexp@Special+global+variables.
|
||||
* Note: also updates Regexp@Global+Variables.
|
||||
*
|
||||
* - Computes +regexp+ by converting +pattern+ (if not already a \Regexp).
|
||||
* regexp = Regexp.new(pattern)
|
||||
|
@ -4439,7 +4439,7 @@ rb_str_match_m(int argc, VALUE *argv, VALUE str)
|
|||
*
|
||||
* Returns +true+ or +false+ based on whether a match is found for +self+ and +pattern+.
|
||||
*
|
||||
* Note: does not update Regexp@Special+global+variables.
|
||||
* Note: does not update Regexp@Global+Variables.
|
||||
*
|
||||
* Computes +regexp+ by converting +pattern+ (if not already a \Regexp).
|
||||
* regexp = Regexp.new(pattern)
|
||||
|
|
|
@ -278,7 +278,7 @@
|
|||
# If argument +capture+ is given and not <tt>0</tt>,
|
||||
# it should be either a capture group index (integer)
|
||||
# or a capture group name (string or symbol);
|
||||
# the slice is the specified capture (see Regexp@Capturing):
|
||||
# the slice is the specified capture (see Regexp@Groups+and+Captures):
|
||||
#
|
||||
# s = 'hello there'
|
||||
# s[/[aeiou](.)\1/, 1] # => "l"
|
||||
|
|
Загрузка…
Ссылка в новой задаче