diff options
author | Janosch Müller <[email protected]> | 2023-07-01 16:22:17 +0200 |
---|---|---|
committer | <[email protected]> | 2023-07-01 23:22:17 +0900 |
commit | 08b3fb11524e6cde453476f24ac80fd60457dfef () | |
tree | 58390c5ff62bcd0116b6aa857c228818a5b465b4 | |
parent | 3fd1968d6f10579a36f77eb3838f6c62a3e9f205 (diff) |
[Bug #19728] Auto-generate unicode property docs
https://bugs.ruby-lang.org/issues/19728
Notes: Merged: https://github.com/ruby/ruby/pull/7944 Merged-By: nobu <[email protected]>
-rw-r--r-- | common.mk | 16 | ||||
-rw-r--r-- | doc/regexp/unicode_properties.rdoc | 1485 | ||||
-rw-r--r-- | enc/unicode/15.0.0/name2ctype.h | 2 | ||||
-rwxr-xr-x | template/unicode_properties.rdoc.tmpl | 59 | ||||
-rwxr-xr-x | tool/enc-unicode.rb | 15 |
5 files changed, 722 insertions, 855 deletions
@@ -430,7 +430,7 @@ ruby.imp: $(COMMONOBJS) sort -u -o $@ install: install-$(INSTALLDOC) -docs: $(DOCTARGETS) pkgconfig-data: $(ruby_pc) $(ruby_pc): $(srcdir)/template/ruby.pc.in config.status @@ -624,15 +624,15 @@ do-install-dbg: $(PROGRAM) pre-install-dbg post-install-dbg:: @$(NULLCMD) -rdoc: PHONY main @echo Generating RDoc documentation $(Q) $(RDOC) --ri --op "$(RDOCOUT)" $(RDOC_GEN_OPTS) $(RDOCFLAGS) "$(srcdir)" -html: PHONY main @echo Generating RDoc HTML files $(Q) $(RDOC) --op "$(HTMLOUT)" $(RDOC_GEN_OPTS) $(RDOCFLAGS) "$(srcdir)" -rdoc-coverage: PHONY main @echo Generating RDoc coverage report $(Q) $(RDOC) --quiet -C $(RDOCFLAGS) "$(srcdir)" @@ -1142,7 +1142,7 @@ common-srcs: $(srcs_vpath)parse.c $(srcs_vpath)lex.c $(srcs_vpath)enc/trans/newl missing-srcs: $(srcdir)/missing/des_tables.c -srcs: common-srcs missing-srcs srcs-enc RIPPER_SRCS = $(srcdir)/ext/ripper/ripper.c \ $(srcdir)/ext/ripper/ripper_init.c \ @@ -1730,6 +1730,12 @@ $(UNICODE_HDR_DIR)/name2ctype.h: $(UNICODE_SRC_DATA_DIR) $(UNICODE_SRC_EMOJI_DATA_DIR) > [email protected] $(MV) [email protected] $@ # the next non-comment line was: # $(UNICODE_HDR_DIR)/casefold.h: $(tooldir)/enc-case-folding.rb \ # but was changed to make sure CI works on systems that don't have gperf @@ -1,863 +1,678 @@ == \Regexps Based on Unicode Properties The properties shown here are those currently supported in Ruby. -Older versions may not support all of these; -newer versions may support additional properties. 
=== POSIX brackets -- <tt>/\p{Alpha}/</tt> -- <tt>/\p{Blank}/</tt> -- <tt>/\p{Cntrl}/</tt> -- <tt>/\p{Digit}/</tt> -- <tt>/\p{Graph}/</tt> -- <tt>/\p{Lower}/</tt> -- <tt>/\p{Print}/</tt> -- <tt>/\p{Punct}/</tt> -- <tt>/\p{Space}/</tt> -- <tt>/\p{Upper}/</tt> -- <tt>/\p{XDigit}/</tt> -- <tt>/\p{Word}/</tt> -- <tt>/\p{Alnum}/</tt> -- <tt>/\p{ASCII}/</tt> -- <tt>/\p{XPosixPunct}/</tt> === Special -- <tt>/\p{Any}/</tt> -- <tt>/\p{Assigned}/</tt> === Major and General Categories -- <tt>/\p{C}/</tt> -- <tt>/\p{Cc}/</tt> -- <tt>/\p{Cf}/</tt> -- <tt>/\p{Cn}/</tt> -- <tt>/\p{Co}/</tt> -- <tt>/\p{Cs}/</tt> -- <tt>/\p{L}/</tt> -- <tt>/\p{LC}/</tt> -- <tt>/\p{Ll}/</tt> -- <tt>/\p{Lm}/</tt> -- <tt>/\p{Lo}/</tt> -- <tt>/\p{Lt}/</tt> -- <tt>/\p{Lu}/</tt> -- <tt>/\p{M}/</tt> -- <tt>/\p{Mc}/</tt> -- <tt>/\p{Me}/</tt> -- <tt>/\p{Mn}/</tt> -- <tt>/\p{N}/</tt> -- <tt>/\p{Nd}/</tt> -- <tt>/\p{Nl}/</tt> -- <tt>/\p{No}/</tt> -- <tt>/\p{P}/</tt> -- <tt>/\p{Pc}/</tt> -- <tt>/\p{Pd}/</tt> -- <tt>/\p{Pe}/</tt> -- <tt>/\p{Pf}/</tt> -- <tt>/\p{Pi}/</tt> -- <tt>/\p{Po}/</tt> -- <tt>/\p{Ps}/</tt> -- <tt>/\p{S}/</tt> -- <tt>/\p{Sc}/</tt> -- <tt>/\p{Sk}/</tt> -- <tt>/\p{Sm}/</tt> -- <tt>/\p{So}/</tt> -- <tt>/\p{Z}/</tt> -- <tt>/\p{Zl}/</tt> -- <tt>/\p{Zp}/</tt> -- <tt>/\p{Zs}/</tt> -=== Scripts -- <tt>/\p{Adlam}/</tt> -- <tt>/\p{Ahom}/</tt> -- <tt>/\p{Anatolian_Hieroglyphs}/</tt> -- <tt>/\p{Arabic}/</tt> -- <tt>/\p{Armenian}/</tt> -- <tt>/\p{Avestan}/</tt> -- <tt>/\p{Balinese}/</tt> -- <tt>/\p{Bamum}/</tt> -- <tt>/\p{Bassa_Vah}/</tt> -- <tt>/\p{Batak}/</tt> -- <tt>/\p{Bengali}/</tt> -- <tt>/\p{Bhaiksuki}/</tt> -- <tt>/\p{Bopomofo}/</tt> -- <tt>/\p{Brahmi}/</tt> -- <tt>/\p{Braille}/</tt> -- <tt>/\p{Buginese}/</tt> -- <tt>/\p{Buhid}/</tt> -- <tt>/\p{Canadian_Aboriginal}/</tt> -- <tt>/\p{Carian}/</tt> -- <tt>/\p{Caucasian_Albanian}/</tt> -- <tt>/\p{Chakma}/</tt> -- <tt>/\p{Cham}/</tt> -- <tt>/\p{Cherokee}/</tt> -- <tt>/\p{Common}/</tt> -- <tt>/\p{Coptic}/</tt> -- <tt>/\p{Cuneiform}/</tt> -- 
<tt>/\p{Cypriot}/</tt> -- <tt>/\p{Cyrillic}/</tt> -- <tt>/\p{Deseret}/</tt> -- <tt>/\p{Devanagari}/</tt> -- <tt>/\p{Dogra}/</tt> -- <tt>/\p{Duployan}/</tt> -- <tt>/\p{Egyptian_Hieroglyphs}/</tt> -- <tt>/\p{Elbasan}/</tt> -- <tt>/\p{Elymaic}/</tt> -- <tt>/\p{Ethiopic}/</tt> -- <tt>/\p{Georgian}/</tt> -- <tt>/\p{Glagolitic}/</tt> -- <tt>/\p{Gothic}/</tt> -- <tt>/\p{Grantha}/</tt> -- <tt>/\p{Greek}/</tt> -- <tt>/\p{Gujarati}/</tt> -- <tt>/\p{Gunjala_Gondi}/</tt> -- <tt>/\p{Gurmukhi}/</tt> -- <tt>/\p{Han}/</tt> -- <tt>/\p{Hangul}/</tt> -- <tt>/\p{Hanifi_Rohingya}/</tt> -- <tt>/\p{Hanunoo}/</tt> -- <tt>/\p{Hatran}/</tt> -- <tt>/\p{Hebrew}/</tt> -- <tt>/\p{Hiragana}/</tt> -- <tt>/\p{Imperial_Aramaic}/</tt> -- <tt>/\p{Inherited}/</tt> -- <tt>/\p{Inscriptional_Pahlavi}/</tt> -- <tt>/\p{Inscriptional_Parthian}/</tt> -- <tt>/\p{Javanese}/</tt> -- <tt>/\p{Kaithi}/</tt> -- <tt>/\p{Kannada}/</tt> -- <tt>/\p{Katakana}/</tt> -- <tt>/\p{Kayah_Li}/</tt> -- <tt>/\p{Kharoshthi}/</tt> -- <tt>/\p{Khmer}/</tt> -- <tt>/\p{Khojki}/</tt> -- <tt>/\p{Khudawadi}/</tt> -- <tt>/\p{Lao}/</tt> -- <tt>/\p{Latin}/</tt> -- <tt>/\p{Lepcha}/</tt> -- <tt>/\p{Limbu}/</tt> -- <tt>/\p{Linear_A}/</tt> -- <tt>/\p{Linear_B}/</tt> -- <tt>/\p{Lisu}/</tt> -- <tt>/\p{Lycian}/</tt> -- <tt>/\p{Lydian}/</tt> -- <tt>/\p{Mahajani}/</tt> -- <tt>/\p{Makasar}/</tt> -- <tt>/\p{Malayalam}/</tt> -- <tt>/\p{Mandaic}/</tt> -- <tt>/\p{Manichaean}/</tt> -- <tt>/\p{Marchen}/</tt> -- <tt>/\p{Masaram_Gondi}/</tt> -- <tt>/\p{Medefaidrin}/</tt> -- <tt>/\p{Meetei_Mayek}/</tt> -- <tt>/\p{Mende_Kikakui}/</tt> -- <tt>/\p{Meroitic_Cursive}/</tt> -- <tt>/\p{Meroitic_Hieroglyphs}/</tt> -- <tt>/\p{Miao}/</tt> -- <tt>/\p{Modi}/</tt> -- <tt>/\p{Mongolian}/</tt> -- <tt>/\p{Mro}/</tt> -- <tt>/\p{Multani}/</tt> -- <tt>/\p{Myanmar}/</tt> -- <tt>/\p{Nabataean}/</tt> -- <tt>/\p{Nandinagari}/</tt> -- <tt>/\p{New_Tai_Lue}/</tt> -- <tt>/\p{Newa}/</tt> -- <tt>/\p{Nko}/</tt> -- <tt>/\p{Nushu}/</tt> -- <tt>/\p{Nyiakeng_Puachue_Hmong}/</tt> -- 
<tt>/\p{Ogham}/</tt> -- <tt>/\p{Ol_Chiki}/</tt> -- <tt>/\p{Old_Hungarian}/</tt> -- <tt>/\p{Old_Italic}/</tt> -- <tt>/\p{Old_North_Arabian}/</tt> -- <tt>/\p{Old_Permic}/</tt> -- <tt>/\p{Old_Persian}/</tt> -- <tt>/\p{Old_Sogdian}/</tt> -- <tt>/\p{Old_South_Arabian}/</tt> -- <tt>/\p{Old_Turkic}/</tt> -- <tt>/\p{Oriya}/</tt> -- <tt>/\p{Osage}/</tt> -- <tt>/\p{Osmanya}/</tt> -- <tt>/\p{Pahawh_Hmong}/</tt> -- <tt>/\p{Palmyrene}/</tt> -- <tt>/\p{Pau_Cin_Hau}/</tt> -- <tt>/\p{Phags_Pa}/</tt> -- <tt>/\p{Phoenician}/</tt> -- <tt>/\p{Psalter_Pahlavi}/</tt> -- <tt>/\p{Rejang}/</tt> -- <tt>/\p{Runic}/</tt> -- <tt>/\p{Samaritan}/</tt> -- <tt>/\p{Saurashtra}/</tt> -- <tt>/\p{Sharada}/</tt> -- <tt>/\p{Shavian}/</tt> -- <tt>/\p{Siddham}/</tt> -- <tt>/\p{SignWriting}/</tt> -- <tt>/\p{Sinhala}/</tt> -- <tt>/\p{Sogdian}/</tt> -- <tt>/\p{Sora_Sompeng}/</tt> -- <tt>/\p{Soyombo}/</tt> -- <tt>/\p{Sundanese}/</tt> -- <tt>/\p{Syloti_Nagri}/</tt> -- <tt>/\p{Syriac}/</tt> -- <tt>/\p{Tagalog}/</tt> -- <tt>/\p{Tagbanwa}/</tt> -- <tt>/\p{Tai_Le}/</tt> -- <tt>/\p{Tai_Tham}/</tt> -- <tt>/\p{Tai_Viet}/</tt> -- <tt>/\p{Takri}/</tt> -- <tt>/\p{Tamil}/</tt> -- <tt>/\p{Tangut}/</tt> -- <tt>/\p{Telugu}/</tt> -- <tt>/\p{Thaana}/</tt> -- <tt>/\p{Thai}/</tt> -- <tt>/\p{Tibetan}/</tt> -- <tt>/\p{Tifinagh}/</tt> -- <tt>/\p{Tirhuta}/</tt> -- <tt>/\p{Ugaritic}/</tt> -- <tt>/\p{Unknown}/</tt> -- <tt>/\p{Vai}/</tt> -- <tt>/\p{Wancho}/</tt> -- <tt>/\p{Warang_Citi}/</tt> -- <tt>/\p{Yi}/</tt> -- <tt>/\p{Zanabazar_Square}/</tt> === Derived Core Properties -- <tt>/\p{Alphabetic}/</tt> -- <tt>/\p{Case_Ignorable}/</tt> -- <tt>/\p{Cased}/</tt> -- <tt>/\p{Changes_When_Casefolded}/</tt> -- <tt>/\p{Changes_When_Casemapped}/</tt> -- <tt>/\p{Changes_When_Lowercased}/</tt> -- <tt>/\p{Changes_When_Titlecased}/</tt> -- <tt>/\p{Changes_When_Uppercased}/</tt> -- <tt>/\p{Default_Ignorable_Code_Point}/</tt> -- <tt>/\p{Grapheme_Base}/</tt> -- <tt>/\p{Grapheme_Extend}/</tt> -- <tt>/\p{Grapheme_Link}/</tt> -- 
<tt>/\p{ID_Continue}/</tt> -- <tt>/\p{ID_Start}/</tt> -- <tt>/\p{Lowercase}/</tt> -- <tt>/\p{Math}/</tt> -- <tt>/\p{Uppercase}/</tt> -- <tt>/\p{XID_Continue}/</tt> -- <tt>/\p{XID_Start}/</tt> - -=== Prop List - -- <tt>/\p{ASCII_Hex_Digit}/</tt> -- <tt>/\p{Bidi_Control}/</tt> -- <tt>/\p{Dash}/</tt> -- <tt>/\p{Deprecated}/</tt> -- <tt>/\p{Diacritic}/</tt> -- <tt>/\p{Extender}/</tt> -- <tt>/\p{Hex_Digit}/</tt> -- <tt>/\p{Hyphen}/</tt> -- <tt>/\p{IDS_Binary_Operator}/</tt> -- <tt>/\p{IDS_Trinary_Operator}/</tt> -- <tt>/\p{Ideographic}/</tt> -- <tt>/\p{Join_Control}/</tt> -- <tt>/\p{Logical_Order_Exception}/</tt> -- <tt>/\p{Noncharacter_Code_Point}/</tt> -- <tt>/\p{Other_Alphabetic}/</tt> -- <tt>/\p{Other_Default_Ignorable_Code_Point}/</tt> -- <tt>/\p{Other_Grapheme_Extend}/</tt> -- <tt>/\p{Other_ID_Continue}/</tt> -- <tt>/\p{Other_ID_Start}/</tt> -- <tt>/\p{Other_Lowercase}/</tt> -- <tt>/\p{Other_Math}/</tt> -- <tt>/\p{Other_Uppercase}/</tt> -- <tt>/\p{Pattern_Syntax}/</tt> -- <tt>/\p{Pattern_White_Space}/</tt> -- <tt>/\p{Prepended_Concatenation_Mark}/</tt> -- <tt>/\p{Quotation_Mark}/</tt> -- <tt>/\p{Radical}/</tt> -- <tt>/\p{Regional_Indicator}/</tt> -- <tt>/\p{Sentence_Terminal}/</tt> -- <tt>/\p{Soft_Dotted}/</tt> -- <tt>/\p{Terminal_Punctuation}/</tt> -- <tt>/\p{Unified_Ideograph}/</tt> -- <tt>/\p{Variation_Selector}/</tt> -- <tt>/\p{White_Space}/</tt> -=== Emoji -- <tt>/\p{Emoji}/</tt> -- <tt>/\p{Emoji_Component}/</tt> -- <tt>/\p{Emoji_Modifier}/</tt> -- <tt>/\p{Emoji_Modifier_Base}/</tt> -- <tt>/\p{Emoji_Presentation}/</tt> -=== Property Aliases -- <tt>/\p{AHex}/</tt> -- <tt>/\p{Bidi_C}/</tt> -- <tt>/\p{CI}/</tt> -- <tt>/\p{CWCF}/</tt> -- <tt>/\p{CWCM}/</tt> -- <tt>/\p{CWL}/</tt> -- <tt>/\p{CWT}/</tt> -- <tt>/\p{CWU}/</tt> -- <tt>/\p{DI}/</tt> -- <tt>/\p{Dep}/</tt> -- <tt>/\p{Dia}/</tt> -- <tt>/\p{Ext}/</tt> -- <tt>/\p{Gr_Base}/</tt> -- <tt>/\p{Gr_Ext}/</tt> -- <tt>/\p{Gr_Link}/</tt> -- <tt>/\p{Hex}/</tt> -- <tt>/\p{IDC}/</tt> -- <tt>/\p{IDS}/</tt> -- 
<tt>/\p{IDSB}/</tt> -- <tt>/\p{IDST}/</tt> -- <tt>/\p{Ideo}/</tt> -- <tt>/\p{Join_C}/</tt> -- <tt>/\p{LOE}/</tt> -- <tt>/\p{NChar}/</tt> -- <tt>/\p{OAlpha}/</tt> -- <tt>/\p{ODI}/</tt> -- <tt>/\p{OGr_Ext}/</tt> -- <tt>/\p{OIDC}/</tt> -- <tt>/\p{OIDS}/</tt> -- <tt>/\p{OLower}/</tt> -- <tt>/\p{OMath}/</tt> -- <tt>/\p{OUpper}/</tt> -- <tt>/\p{PCM}/</tt> -- <tt>/\p{Pat_Syn}/</tt> -- <tt>/\p{Pat_WS}/</tt> -- <tt>/\p{QMark}/</tt> -- <tt>/\p{RI}/</tt> -- <tt>/\p{SD}/</tt> -- <tt>/\p{STerm}/</tt> -- <tt>/\p{Term}/</tt> -- <tt>/\p{UIdeo}/</tt> -- <tt>/\p{VS}/</tt> -- <tt>/\p{WSpace}/</tt> -- <tt>/\p{XIDC}/</tt> -- <tt>/\p{XIDS}/</tt> -=== Property Value Aliases (General Category) -- <tt>/\p{Other}/</tt> -- <tt>/\p{Control}/</tt> -- <tt>/\p{Format}/</tt> -- <tt>/\p{Unassigned}/</tt> -- <tt>/\p{Private_Use}/</tt> -- <tt>/\p{Surrogate}/</tt> -- <tt>/\p{Letter}/</tt> -- <tt>/\p{Cased_Letter}/</tt> -- <tt>/\p{Lowercase_Letter}/</tt> -- <tt>/\p{Modifier_Letter}/</tt> -- <tt>/\p{Other_Letter}/</tt> -- <tt>/\p{Titlecase_Letter}/</tt> -- <tt>/\p{Uppercase_Letter}/</tt> -- <tt>/\p{Mark}/</tt> -- <tt>/\p{Combining_Mark}/</tt> -- <tt>/\p{Spacing_Mark}/</tt> -- <tt>/\p{Enclosing_Mark}/</tt> -- <tt>/\p{Nonspacing_Mark}/</tt> -- <tt>/\p{Number}/</tt> -- <tt>/\p{Decimal_Number}/</tt> -- <tt>/\p{Letter_Number}/</tt> -- <tt>/\p{Other_Number}/</tt> -- <tt>/\p{Punctuation}/</tt> -- <tt>/\p{Connector_Punctuation}/</tt> -- <tt>/\p{Dash_Punctuation}/</tt> -- <tt>/\p{Close_Punctuation}/</tt> -- <tt>/\p{Final_Punctuation}/</tt> -- <tt>/\p{Initial_Punctuation}/</tt> -- <tt>/\p{Other_Punctuation}/</tt> -- <tt>/\p{Open_Punctuation}/</tt> -- <tt>/\p{Symbol}/</tt> -- <tt>/\p{Currency_Symbol}/</tt> -- <tt>/\p{Modifier_Symbol}/</tt> -- <tt>/\p{Math_Symbol}/</tt> -- <tt>/\p{Other_Symbol}/</tt> -- <tt>/\p{Separator}/</tt> -- <tt>/\p{Line_Separator}/</tt> -- <tt>/\p{Paragraph_Separator}/</tt> -- <tt>/\p{Space_Separator}/</tt> -=== Property Value Aliases (Script) -- <tt>/\p{Adlm}/</tt> -- <tt>/\p{Aghb}/</tt> 
-- <tt>/\p{Arab}/</tt> -- <tt>/\p{Armi}/</tt> -- <tt>/\p{Armn}/</tt> -- <tt>/\p{Avst}/</tt> -- <tt>/\p{Bali}/</tt> -- <tt>/\p{Bamu}/</tt> -- <tt>/\p{Bass}/</tt> -- <tt>/\p{Batk}/</tt> -- <tt>/\p{Beng}/</tt> -- <tt>/\p{Bhks}/</tt> -- <tt>/\p{Bopo}/</tt> -- <tt>/\p{Brah}/</tt> -- <tt>/\p{Brai}/</tt> -- <tt>/\p{Bugi}/</tt> -- <tt>/\p{Buhd}/</tt> -- <tt>/\p{Cakm}/</tt> -- <tt>/\p{Cans}/</tt> -- <tt>/\p{Cari}/</tt> -- <tt>/\p{Cher}/</tt> -- <tt>/\p{Copt}/</tt> -- <tt>/\p{Qaac}/</tt> -- <tt>/\p{Cprt}/</tt> -- <tt>/\p{Cyrl}/</tt> -- <tt>/\p{Deva}/</tt> -- <tt>/\p{Dogr}/</tt> -- <tt>/\p{Dsrt}/</tt> -- <tt>/\p{Dupl}/</tt> -- <tt>/\p{Egyp}/</tt> -- <tt>/\p{Elba}/</tt> -- <tt>/\p{Elym}/</tt> -- <tt>/\p{Ethi}/</tt> -- <tt>/\p{Geor}/</tt> -- <tt>/\p{Glag}/</tt> -- <tt>/\p{Gong}/</tt> -- <tt>/\p{Gonm}/</tt> -- <tt>/\p{Goth}/</tt> -- <tt>/\p{Gran}/</tt> -- <tt>/\p{Grek}/</tt> -- <tt>/\p{Gujr}/</tt> -- <tt>/\p{Guru}/</tt> -- <tt>/\p{Hang}/</tt> -- <tt>/\p{Hani}/</tt> -- <tt>/\p{Hano}/</tt> -- <tt>/\p{Hatr}/</tt> -- <tt>/\p{Hebr}/</tt> -- <tt>/\p{Hira}/</tt> -- <tt>/\p{Hluw}/</tt> -- <tt>/\p{Hmng}/</tt> -- <tt>/\p{Hmnp}/</tt> -- <tt>/\p{Hung}/</tt> -- <tt>/\p{Ital}/</tt> -- <tt>/\p{Java}/</tt> -- <tt>/\p{Kali}/</tt> -- <tt>/\p{Kana}/</tt> -- <tt>/\p{Khar}/</tt> -- <tt>/\p{Khmr}/</tt> -- <tt>/\p{Khoj}/</tt> -- <tt>/\p{Knda}/</tt> -- <tt>/\p{Kthi}/</tt> -- <tt>/\p{Lana}/</tt> -- <tt>/\p{Laoo}/</tt> -- <tt>/\p{Latn}/</tt> -- <tt>/\p{Lepc}/</tt> -- <tt>/\p{Limb}/</tt> -- <tt>/\p{Lina}/</tt> -- <tt>/\p{Linb}/</tt> -- <tt>/\p{Lyci}/</tt> -- <tt>/\p{Lydi}/</tt> -- <tt>/\p{Mahj}/</tt> -- <tt>/\p{Maka}/</tt> -- <tt>/\p{Mand}/</tt> -- <tt>/\p{Mani}/</tt> -- <tt>/\p{Marc}/</tt> -- <tt>/\p{Medf}/</tt> -- <tt>/\p{Mend}/</tt> -- <tt>/\p{Merc}/</tt> -- <tt>/\p{Mero}/</tt> -- <tt>/\p{Mlym}/</tt> -- <tt>/\p{Mong}/</tt> -- <tt>/\p{Mroo}/</tt> -- <tt>/\p{Mtei}/</tt> -- <tt>/\p{Mult}/</tt> -- <tt>/\p{Mymr}/</tt> -- <tt>/\p{Nand}/</tt> -- <tt>/\p{Narb}/</tt> -- <tt>/\p{Nbat}/</tt> -- 
<tt>/\p{Nkoo}/</tt> -- <tt>/\p{Nshu}/</tt> -- <tt>/\p{Ogam}/</tt> -- <tt>/\p{Olck}/</tt> -- <tt>/\p{Orkh}/</tt> -- <tt>/\p{Orya}/</tt> -- <tt>/\p{Osge}/</tt> -- <tt>/\p{Osma}/</tt> -- <tt>/\p{Palm}/</tt> -- <tt>/\p{Pauc}/</tt> -- <tt>/\p{Perm}/</tt> -- <tt>/\p{Phag}/</tt> -- <tt>/\p{Phli}/</tt> -- <tt>/\p{Phlp}/</tt> -- <tt>/\p{Phnx}/</tt> -- <tt>/\p{Plrd}/</tt> -- <tt>/\p{Prti}/</tt> -- <tt>/\p{Rjng}/</tt> -- <tt>/\p{Rohg}/</tt> -- <tt>/\p{Runr}/</tt> -- <tt>/\p{Samr}/</tt> -- <tt>/\p{Sarb}/</tt> -- <tt>/\p{Saur}/</tt> -- <tt>/\p{Sgnw}/</tt> -- <tt>/\p{Shaw}/</tt> -- <tt>/\p{Shrd}/</tt> -- <tt>/\p{Sidd}/</tt> -- <tt>/\p{Sind}/</tt> -- <tt>/\p{Sinh}/</tt> -- <tt>/\p{Sogd}/</tt> -- <tt>/\p{Sogo}/</tt> -- <tt>/\p{Sora}/</tt> -- <tt>/\p{Soyo}/</tt> -- <tt>/\p{Sund}/</tt> -- <tt>/\p{Sylo}/</tt> -- <tt>/\p{Syrc}/</tt> -- <tt>/\p{Tagb}/</tt> -- <tt>/\p{Takr}/</tt> -- <tt>/\p{Tale}/</tt> -- <tt>/\p{Talu}/</tt> -- <tt>/\p{Taml}/</tt> -- <tt>/\p{Tang}/</tt> -- <tt>/\p{Tavt}/</tt> -- <tt>/\p{Telu}/</tt> -- <tt>/\p{Tfng}/</tt> -- <tt>/\p{Tglg}/</tt> -- <tt>/\p{Thaa}/</tt> -- <tt>/\p{Tibt}/</tt> -- <tt>/\p{Tirh}/</tt> -- <tt>/\p{Ugar}/</tt> -- <tt>/\p{Vaii}/</tt> -- <tt>/\p{Wara}/</tt> -- <tt>/\p{Wcho}/</tt> -- <tt>/\p{Xpeo}/</tt> -- <tt>/\p{Xsux}/</tt> -- <tt>/\p{Yiii}/</tt> -- <tt>/\p{Zanb}/</tt> -- <tt>/\p{Zinh}/</tt> -- <tt>/\p{Qaai}/</tt> -- <tt>/\p{Zyyy}/</tt> -- <tt>/\p{Zzzz}/</tt> === Derived Ages -- <tt>/\p{Age=1.1}/</tt> -- <tt>/\p{Age=10.0}/</tt> -- <tt>/\p{Age=11.0}/</tt> -- <tt>/\p{Age=12.0}/</tt> -- <tt>/\p{Age=12.1}/</tt> -- <tt>/\p{Age=2.0}/</tt> -- <tt>/\p{Age=2.1}/</tt> -- <tt>/\p{Age=3.0}/</tt> -- <tt>/\p{Age=3.1}/</tt> -- <tt>/\p{Age=3.2}/</tt> -- <tt>/\p{Age=4.0}/</tt> -- <tt>/\p{Age=4.1}/</tt> -- <tt>/\p{Age=5.0}/</tt> -- <tt>/\p{Age=5.1}/</tt> -- <tt>/\p{Age=5.2}/</tt> -- <tt>/\p{Age=6.0}/</tt> -- <tt>/\p{Age=6.1}/</tt> -- <tt>/\p{Age=6.2}/</tt> -- <tt>/\p{Age=6.3}/</tt> -- <tt>/\p{Age=7.0}/</tt> -- <tt>/\p{Age=8.0}/</tt> -- <tt>/\p{Age=9.0}/</tt> - -=== 
Blocks - -- <tt>/\p{In_Basic_Latin}/</tt> -- <tt>/\p{In_Latin_1_Supplement}/</tt> -- <tt>/\p{In_Latin_Extended_A}/</tt> -- <tt>/\p{In_Latin_Extended_B}/</tt> -- <tt>/\p{In_IPA_Extensions}/</tt> -- <tt>/\p{In_Spacing_Modifier_Letters}/</tt> -- <tt>/\p{In_Combining_Diacritical_Marks}/</tt> -- <tt>/\p{In_Greek_and_Coptic}/</tt> -- <tt>/\p{In_Cyrillic}/</tt> -- <tt>/\p{In_Cyrillic_Supplement}/</tt> -- <tt>/\p{In_Armenian}/</tt> -- <tt>/\p{In_Hebrew}/</tt> -- <tt>/\p{In_Arabic}/</tt> -- <tt>/\p{In_Syriac}/</tt> -- <tt>/\p{In_Arabic_Supplement}/</tt> -- <tt>/\p{In_Thaana}/</tt> -- <tt>/\p{In_NKo}/</tt> -- <tt>/\p{In_Samaritan}/</tt> -- <tt>/\p{In_Mandaic}/</tt> -- <tt>/\p{In_Syriac_Supplement}/</tt> -- <tt>/\p{In_Arabic_Extended_A}/</tt> -- <tt>/\p{In_Devanagari}/</tt> -- <tt>/\p{In_Bengali}/</tt> -- <tt>/\p{In_Gurmukhi}/</tt> -- <tt>/\p{In_Gujarati}/</tt> -- <tt>/\p{In_Oriya}/</tt> -- <tt>/\p{In_Tamil}/</tt> -- <tt>/\p{In_Telugu}/</tt> -- <tt>/\p{In_Kannada}/</tt> -- <tt>/\p{In_Malayalam}/</tt> -- <tt>/\p{In_Sinhala}/</tt> -- <tt>/\p{In_Thai}/</tt> -- <tt>/\p{In_Lao}/</tt> -- <tt>/\p{In_Tibetan}/</tt> -- <tt>/\p{In_Myanmar}/</tt> -- <tt>/\p{In_Georgian}/</tt> -- <tt>/\p{In_Hangul_Jamo}/</tt> -- <tt>/\p{In_Ethiopic}/</tt> -- <tt>/\p{In_Ethiopic_Supplement}/</tt> -- <tt>/\p{In_Cherokee}/</tt> -- <tt>/\p{In_Unified_Canadian_Aboriginal_Syllabics}/</tt> -- <tt>/\p{In_Ogham}/</tt> -- <tt>/\p{In_Runic}/</tt> -- <tt>/\p{In_Tagalog}/</tt> -- <tt>/\p{In_Hanunoo}/</tt> -- <tt>/\p{In_Buhid}/</tt> -- <tt>/\p{In_Tagbanwa}/</tt> -- <tt>/\p{In_Khmer}/</tt> -- <tt>/\p{In_Mongolian}/</tt> -- <tt>/\p{In_Unified_Canadian_Aboriginal_Syllabics_Extended}/</tt> -- <tt>/\p{In_Limbu}/</tt> -- <tt>/\p{In_Tai_Le}/</tt> -- <tt>/\p{In_New_Tai_Lue}/</tt> -- <tt>/\p{In_Khmer_Symbols}/</tt> -- <tt>/\p{In_Buginese}/</tt> -- <tt>/\p{In_Tai_Tham}/</tt> -- <tt>/\p{In_Combining_Diacritical_Marks_Extended}/</tt> -- <tt>/\p{In_Balinese}/</tt> -- <tt>/\p{In_Sundanese}/</tt> -- <tt>/\p{In_Batak}/</tt> -- 
<tt>/\p{In_Lepcha}/</tt> -- <tt>/\p{In_Ol_Chiki}/</tt> -- <tt>/\p{In_Cyrillic_Extended_C}/</tt> -- <tt>/\p{In_Georgian_Extended}/</tt> -- <tt>/\p{In_Sundanese_Supplement}/</tt> -- <tt>/\p{In_Vedic_Extensions}/</tt> -- <tt>/\p{In_Phonetic_Extensions}/</tt> -- <tt>/\p{In_Phonetic_Extensions_Supplement}/</tt> -- <tt>/\p{In_Combining_Diacritical_Marks_Supplement}/</tt> -- <tt>/\p{In_Latin_Extended_Additional}/</tt> -- <tt>/\p{In_Greek_Extended}/</tt> -- <tt>/\p{In_General_Punctuation}/</tt> -- <tt>/\p{In_Superscripts_and_Subscripts}/</tt> -- <tt>/\p{In_Currency_Symbols}/</tt> -- <tt>/\p{In_Combining_Diacritical_Marks_for_Symbols}/</tt> -- <tt>/\p{In_Letterlike_Symbols}/</tt> -- <tt>/\p{In_Number_Forms}/</tt> -- <tt>/\p{In_Arrows}/</tt> -- <tt>/\p{In_Mathematical_Operators}/</tt> -- <tt>/\p{In_Miscellaneous_Technical}/</tt> -- <tt>/\p{In_Control_Pictures}/</tt> -- <tt>/\p{In_Optical_Character_Recognition}/</tt> -- <tt>/\p{In_Enclosed_Alphanumerics}/</tt> -- <tt>/\p{In_Box_Drawing}/</tt> -- <tt>/\p{In_Block_Elements}/</tt> -- <tt>/\p{In_Geometric_Shapes}/</tt> -- <tt>/\p{In_Miscellaneous_Symbols}/</tt> -- <tt>/\p{In_Dingbats}/</tt> -- <tt>/\p{In_Miscellaneous_Mathematical_Symbols_A}/</tt> -- <tt>/\p{In_Supplemental_Arrows_A}/</tt> -- <tt>/\p{In_Braille_Patterns}/</tt> -- <tt>/\p{In_Supplemental_Arrows_B}/</tt> -- <tt>/\p{In_Miscellaneous_Mathematical_Symbols_B}/</tt> -- <tt>/\p{In_Supplemental_Mathematical_Operators}/</tt> -- <tt>/\p{In_Miscellaneous_Symbols_and_Arrows}/</tt> -- <tt>/\p{In_Glagolitic}/</tt> -- <tt>/\p{In_Latin_Extended_C}/</tt> -- <tt>/\p{In_Coptic}/</tt> -- <tt>/\p{In_Georgian_Supplement}/</tt> -- <tt>/\p{In_Tifinagh}/</tt> -- <tt>/\p{In_Ethiopic_Extended}/</tt> -- <tt>/\p{In_Cyrillic_Extended_A}/</tt> -- <tt>/\p{In_Supplemental_Punctuation}/</tt> -- <tt>/\p{In_CJK_Radicals_Supplement}/</tt> -- <tt>/\p{In_Kangxi_Radicals}/</tt> -- <tt>/\p{In_Ideographic_Description_Characters}/</tt> -- <tt>/\p{In_CJK_Symbols_and_Punctuation}/</tt> -- 
<tt>/\p{In_Hiragana}/</tt> -- <tt>/\p{In_Katakana}/</tt> -- <tt>/\p{In_Bopomofo}/</tt> -- <tt>/\p{In_Hangul_Compatibility_Jamo}/</tt> -- <tt>/\p{In_Kanbun}/</tt> -- <tt>/\p{In_Bopomofo_Extended}/</tt> -- <tt>/\p{In_CJK_Strokes}/</tt> -- <tt>/\p{In_Katakana_Phonetic_Extensions}/</tt> -- <tt>/\p{In_Enclosed_CJK_Letters_and_Months}/</tt> -- <tt>/\p{In_CJK_Compatibility}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_A}/</tt> -- <tt>/\p{In_Yijing_Hexagram_Symbols}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs}/</tt> -- <tt>/\p{In_Yi_Syllables}/</tt> -- <tt>/\p{In_Yi_Radicals}/</tt> -- <tt>/\p{In_Lisu}/</tt> -- <tt>/\p{In_Vai}/</tt> -- <tt>/\p{In_Cyrillic_Extended_B}/</tt> -- <tt>/\p{In_Bamum}/</tt> -- <tt>/\p{In_Modifier_Tone_Letters}/</tt> -- <tt>/\p{In_Latin_Extended_D}/</tt> -- <tt>/\p{In_Syloti_Nagri}/</tt> -- <tt>/\p{In_Common_Indic_Number_Forms}/</tt> -- <tt>/\p{In_Phags_pa}/</tt> -- <tt>/\p{In_Saurashtra}/</tt> -- <tt>/\p{In_Devanagari_Extended}/</tt> -- <tt>/\p{In_Kayah_Li}/</tt> -- <tt>/\p{In_Rejang}/</tt> -- <tt>/\p{In_Hangul_Jamo_Extended_A}/</tt> -- <tt>/\p{In_Javanese}/</tt> -- <tt>/\p{In_Myanmar_Extended_B}/</tt> -- <tt>/\p{In_Cham}/</tt> -- <tt>/\p{In_Myanmar_Extended_A}/</tt> -- <tt>/\p{In_Tai_Viet}/</tt> -- <tt>/\p{In_Meetei_Mayek_Extensions}/</tt> -- <tt>/\p{In_Ethiopic_Extended_A}/</tt> -- <tt>/\p{In_Latin_Extended_E}/</tt> -- <tt>/\p{In_Cherokee_Supplement}/</tt> -- <tt>/\p{In_Meetei_Mayek}/</tt> -- <tt>/\p{In_Hangul_Syllables}/</tt> -- <tt>/\p{In_Hangul_Jamo_Extended_B}/</tt> -- <tt>/\p{In_High_Surrogates}/</tt> -- <tt>/\p{In_High_Private_Use_Surrogates}/</tt> -- <tt>/\p{In_Low_Surrogates}/</tt> -- <tt>/\p{In_Private_Use_Area}/</tt> -- <tt>/\p{In_CJK_Compatibility_Ideographs}/</tt> -- <tt>/\p{In_Alphabetic_Presentation_Forms}/</tt> -- <tt>/\p{In_Arabic_Presentation_Forms_A}/</tt> -- <tt>/\p{In_Variation_Selectors}/</tt> -- <tt>/\p{In_Vertical_Forms}/</tt> -- <tt>/\p{In_Combining_Half_Marks}/</tt> -- <tt>/\p{In_CJK_Compatibility_Forms}/</tt> -- 
<tt>/\p{In_Small_Form_Variants}/</tt> -- <tt>/\p{In_Arabic_Presentation_Forms_B}/</tt> -- <tt>/\p{In_Halfwidth_and_Fullwidth_Forms}/</tt> -- <tt>/\p{In_Specials}/</tt> -- <tt>/\p{In_Linear_B_Syllabary}/</tt> -- <tt>/\p{In_Linear_B_Ideograms}/</tt> -- <tt>/\p{In_Aegean_Numbers}/</tt> -- <tt>/\p{In_Ancient_Greek_Numbers}/</tt> -- <tt>/\p{In_Ancient_Symbols}/</tt> -- <tt>/\p{In_Phaistos_Disc}/</tt> -- <tt>/\p{In_Lycian}/</tt> -- <tt>/\p{In_Carian}/</tt> -- <tt>/\p{In_Coptic_Epact_Numbers}/</tt> -- <tt>/\p{In_Old_Italic}/</tt> -- <tt>/\p{In_Gothic}/</tt> -- <tt>/\p{In_Old_Permic}/</tt> -- <tt>/\p{In_Ugaritic}/</tt> -- <tt>/\p{In_Old_Persian}/</tt> -- <tt>/\p{In_Deseret}/</tt> -- <tt>/\p{In_Shavian}/</tt> -- <tt>/\p{In_Osmanya}/</tt> -- <tt>/\p{In_Osage}/</tt> -- <tt>/\p{In_Elbasan}/</tt> -- <tt>/\p{In_Caucasian_Albanian}/</tt> -- <tt>/\p{In_Linear_A}/</tt> -- <tt>/\p{In_Cypriot_Syllabary}/</tt> -- <tt>/\p{In_Imperial_Aramaic}/</tt> -- <tt>/\p{In_Palmyrene}/</tt> -- <tt>/\p{In_Nabataean}/</tt> -- <tt>/\p{In_Hatran}/</tt> -- <tt>/\p{In_Phoenician}/</tt> -- <tt>/\p{In_Lydian}/</tt> -- <tt>/\p{In_Meroitic_Hieroglyphs}/</tt> -- <tt>/\p{In_Meroitic_Cursive}/</tt> -- <tt>/\p{In_Kharoshthi}/</tt> -- <tt>/\p{In_Old_South_Arabian}/</tt> -- <tt>/\p{In_Old_North_Arabian}/</tt> -- <tt>/\p{In_Manichaean}/</tt> -- <tt>/\p{In_Avestan}/</tt> -- <tt>/\p{In_Inscriptional_Parthian}/</tt> -- <tt>/\p{In_Inscriptional_Pahlavi}/</tt> -- <tt>/\p{In_Psalter_Pahlavi}/</tt> -- <tt>/\p{In_Old_Turkic}/</tt> -- <tt>/\p{In_Old_Hungarian}/</tt> -- <tt>/\p{In_Hanifi_Rohingya}/</tt> -- <tt>/\p{In_Rumi_Numeral_Symbols}/</tt> -- <tt>/\p{In_Old_Sogdian}/</tt> -- <tt>/\p{In_Sogdian}/</tt> -- <tt>/\p{In_Elymaic}/</tt> -- <tt>/\p{In_Brahmi}/</tt> -- <tt>/\p{In_Kaithi}/</tt> -- <tt>/\p{In_Sora_Sompeng}/</tt> -- <tt>/\p{In_Chakma}/</tt> -- <tt>/\p{In_Mahajani}/</tt> -- <tt>/\p{In_Sharada}/</tt> -- <tt>/\p{In_Sinhala_Archaic_Numbers}/</tt> -- <tt>/\p{In_Khojki}/</tt> -- <tt>/\p{In_Multani}/</tt> -- 
<tt>/\p{In_Khudawadi}/</tt> -- <tt>/\p{In_Grantha}/</tt> -- <tt>/\p{In_Newa}/</tt> -- <tt>/\p{In_Tirhuta}/</tt> -- <tt>/\p{In_Siddham}/</tt> -- <tt>/\p{In_Modi}/</tt> -- <tt>/\p{In_Mongolian_Supplement}/</tt> -- <tt>/\p{In_Takri}/</tt> -- <tt>/\p{In_Ahom}/</tt> -- <tt>/\p{In_Dogra}/</tt> -- <tt>/\p{In_Warang_Citi}/</tt> -- <tt>/\p{In_Nandinagari}/</tt> -- <tt>/\p{In_Zanabazar_Square}/</tt> -- <tt>/\p{In_Soyombo}/</tt> -- <tt>/\p{In_Pau_Cin_Hau}/</tt> -- <tt>/\p{In_Bhaiksuki}/</tt> -- <tt>/\p{In_Marchen}/</tt> -- <tt>/\p{In_Masaram_Gondi}/</tt> -- <tt>/\p{In_Gunjala_Gondi}/</tt> -- <tt>/\p{In_Makasar}/</tt> -- <tt>/\p{In_Tamil_Supplement}/</tt> -- <tt>/\p{In_Cuneiform}/</tt> -- <tt>/\p{In_Cuneiform_Numbers_and_Punctuation}/</tt> -- <tt>/\p{In_Early_Dynastic_Cuneiform}/</tt> -- <tt>/\p{In_Egyptian_Hieroglyphs}/</tt> -- <tt>/\p{In_Egyptian_Hieroglyph_Format_Controls}/</tt> -- <tt>/\p{In_Anatolian_Hieroglyphs}/</tt> -- <tt>/\p{In_Bamum_Supplement}/</tt> -- <tt>/\p{In_Mro}/</tt> -- <tt>/\p{In_Bassa_Vah}/</tt> -- <tt>/\p{In_Pahawh_Hmong}/</tt> -- <tt>/\p{In_Medefaidrin}/</tt> -- <tt>/\p{In_Miao}/</tt> -- <tt>/\p{In_Ideographic_Symbols_and_Punctuation}/</tt> -- <tt>/\p{In_Tangut}/</tt> -- <tt>/\p{In_Tangut_Components}/</tt> -- <tt>/\p{In_Kana_Supplement}/</tt> -- <tt>/\p{In_Kana_Extended_A}/</tt> -- <tt>/\p{In_Small_Kana_Extension}/</tt> -- <tt>/\p{In_Nushu}/</tt> -- <tt>/\p{In_Duployan}/</tt> -- <tt>/\p{In_Shorthand_Format_Controls}/</tt> -- <tt>/\p{In_Byzantine_Musical_Symbols}/</tt> -- <tt>/\p{In_Musical_Symbols}/</tt> -- <tt>/\p{In_Ancient_Greek_Musical_Notation}/</tt> -- <tt>/\p{In_Mayan_Numerals}/</tt> -- <tt>/\p{In_Tai_Xuan_Jing_Symbols}/</tt> -- <tt>/\p{In_Counting_Rod_Numerals}/</tt> -- <tt>/\p{In_Mathematical_Alphanumeric_Symbols}/</tt> -- <tt>/\p{In_Sutton_SignWriting}/</tt> -- <tt>/\p{In_Glagolitic_Supplement}/</tt> -- <tt>/\p{In_Nyiakeng_Puachue_Hmong}/</tt> -- <tt>/\p{In_Wancho}/</tt> -- <tt>/\p{In_Mende_Kikakui}/</tt> -- <tt>/\p{In_Adlam}/</tt> -- 
<tt>/\p{In_Indic_Siyaq_Numbers}/</tt> -- <tt>/\p{In_Ottoman_Siyaq_Numbers}/</tt> -- <tt>/\p{In_Arabic_Mathematical_Alphabetic_Symbols}/</tt> -- <tt>/\p{In_Mahjong_Tiles}/</tt> -- <tt>/\p{In_Domino_Tiles}/</tt> -- <tt>/\p{In_Playing_Cards}/</tt> -- <tt>/\p{In_Enclosed_Alphanumeric_Supplement}/</tt> -- <tt>/\p{In_Enclosed_Ideographic_Supplement}/</tt> -- <tt>/\p{In_Miscellaneous_Symbols_and_Pictographs}/</tt> -- <tt>/\p{In_Emoticons}/</tt> -- <tt>/\p{In_Ornamental_Dingbats}/</tt> -- <tt>/\p{In_Transport_and_Map_Symbols}/</tt> -- <tt>/\p{In_Alchemical_Symbols}/</tt> -- <tt>/\p{In_Geometric_Shapes_Extended}/</tt> -- <tt>/\p{In_Supplemental_Arrows_C}/</tt> -- <tt>/\p{In_Supplemental_Symbols_and_Pictographs}/</tt> -- <tt>/\p{In_Chess_Symbols}/</tt> -- <tt>/\p{In_Symbols_and_Pictographs_Extended_A}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_B}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_C}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_D}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_E}/</tt> -- <tt>/\p{In_CJK_Unified_Ideographs_Extension_F}/</tt> -- <tt>/\p{In_CJK_Compatibility_Ideographs_Supplement}/</tt> -- <tt>/\p{In_Tags}/</tt> -- <tt>/\p{In_Variation_Selectors_Supplement}/</tt> -- <tt>/\p{In_Supplementary_Private_Use_Area_A}/</tt> -- <tt>/\p{In_Supplementary_Private_Use_Area_B}/</tt> -- <tt>/\p{In_No_Block}/</tt> @@ -5402,7 +5402,7 @@ static const OnigCodePoint CR_ASCII[] = { 0x0000, 0x007f, }; /* CR_ASCII */ -/* 'Punct' */ static const OnigCodePoint CR_Punct[] = { 191, 0x0021, 0x0023, @@ -0,0 +1,59 @@ @@ -269,23 +269,12 @@ def parse_block(data) blocks << constname end -# shim for Ruby 1.8 -unless {}.respond_to?(:key) - class Hash - alias key index - end -end - $const_cache = {} # make_const(property, pairs, name): Prints a 'static const' structure for a # given property, group of paired codepoints, and a human-friendly name for # the group def make_const(prop, data, name) - if name.empty? 
- puts "\n/* '#{prop}' */" - else - puts "\n/* '#{prop}': #{name} */" - end if origprop = $const_cache.key(data) puts "#define CR_#{prop} CR_#{origprop}" else @@ -437,8 +426,6 @@ define_posix_props(data) POSIX_NAMES.each do |name| if name == 'XPosixPunct' make_const(name, data[name], "[[:Punct:]]") - elsif name == 'Punct' - make_const(name, data[name], "") else make_const(name, data[name], "[[:#{name}:]]") end |