Big mktables rewrite from Jeffrey;
[p5sagit/p5-mst-13.2.git] / lib / unicore / Is.pl
index 86e5926..55bb355 100644 (file)
 # !!!!!!!   DO NOT EDIT THIS FILE   !!!!!!! 
 # This file is built by mktables from e.g. Unicode.txt.
 # Any changes made here will be lost!
-%utf8::Is =
-(
-'Close_Punctuation'                           => 'Pe',
-'Connector_Punctuation'                       => 'Pc',
-'Control'                                     => 'Cc',
-'Currency_Symbol'                             => 'Sc',
-'Dash_Punctuation'                            => 'Pd',
-'Decimal_Number'                              => 'Nd',
-'Enclosing_Mark'                              => 'Me',
-'Final_Punctuation'                           => 'Pf',
-'Format'                                      => 'Cf',
-'Initial_Punctuation'                         => 'Pi',
-'Letter'                                      => 'L',
-'Letter_Number'                               => 'Nl',
-'Line_Separator'                              => 'Zl',
-'Lowercase_Letter'                            => 'Ll',
-'Mark'                                        => 'M',
-'Math_Symbol'                                 => 'Sm',
-'Modifier_Letter'                             => 'Lm',
-'Modifier_Symbol'                             => 'Sk',
-'Non_Spacing_Mark'                            => 'Mn',
-'Number'                                      => 'N',
-'Open_Punctuation'                            => 'Ps',
-'Other'                                       => 'C',
-'Other_Letter'                                => 'Lo',
-'Other_Number'                                => 'No',
-'Other_Punctuation'                           => 'Po',
-'Other_Symbol'                                => 'So',
-'Paragraph_Separator'                         => 'Zp',
-'Private Use'                                 => 'Co',
-'Punctuation'                                 => 'P',
-'Separator'                                   => 'Z',
-'Space_Separator'                             => 'Zs',
-'Spacing_Mark'                                => 'Mc',
-'Surrogate'                                   => 'Cs',
-'Symbol'                                      => 'S',
-'Titlecase_Letter'                            => 'Lt',
-'Unassigned'                                  => 'Cn',
-'Uppercase_Letter'                            => 'Lu',
+# Built Mon Jan 14 15:52:42 2002.
+
+##
+## Data in this file used by ../utf8_heavy.pl
+##
+
+## Mapping from name to filename in ./Is
+%utf8::Is = (
+  'ASCII'                                   => 'ASCII',
+  'Alnum'                                   => 'Alnum',
+  'Alpha'                                   => 'Alpha',
+  'BidiAL'                                  => 'BidiAL',
+  'BidiAN'                                  => 'BidiAN',
+  'BidiB'                                   => 'BidiB',
+  'BidiBN'                                  => 'BidiBN',
+  'BidiCS'                                  => 'BidiCS',
+  'BidiEN'                                  => 'BidiEN',
+  'BidiES'                                  => 'BidiES',
+  'BidiET'                                  => 'BidiET',
+  'BidiL'                                   => 'BidiL',
+  'BidiLRE'                                 => 'BidiLRE',
+  'BidiLRO'                                 => 'BidiLRO',
+  'BidiNSM'                                 => 'BidiNSM',
+  'BidiON'                                  => 'BidiON',
+  'BidiPDF'                                 => 'BidiPDF',
+  'BidiR'                                   => 'BidiR',
+  'BidiRLE'                                 => 'BidiRLE',
+  'BidiRLO'                                 => 'BidiRLO',
+  'BidiS'                                   => 'BidiS',
+  'BidiWS'                                  => 'BidiWS',
+  'Blank'                                   => 'Blank',
+  'C'                                       => 'C',
+  'Canon'                                   => 'Canon',
+  'Cc'                                      => 'Cc',
+  'Cf'                                      => 'Cf',
+  'Cn'                                      => 'Cn',
+  'Cntrl'                                   => 'Cntrl',
+  'Co'                                      => 'Co',
+  'Compat'                                  => 'Compat',
+  'Cs'                                      => 'Cs',
+  'DCcircle'                                => 'DCcircle',
+  'DCcompat'                                => 'DCcompat',
+  'DCfinal'                                 => 'DCfinal',
+  'DCfont'                                  => 'DCfont',
+  'DCfraction'                              => 'DCfracti',
+  'DCinitial'                               => 'DCinitia',
+  'DCisolated'                              => 'DCisolat',
+  'DCmedial'                                => 'DCmedial',
+  'DCnarrow'                                => 'DCnarrow',
+  'DCnoBreak'                               => 'DCnoBrea',
+  'DCsmall'                                 => 'DCsmall',
+  'DCsquare'                                => 'DCsquare',
+  'DCsub'                                   => 'DCsub',
+  'DCsuper'                                 => 'DCsuper',
+  'DCvertical'                              => 'DCvertic',
+  'DCwide'                                  => 'DCwide',
+  'Digit'                                   => 'Digit',
+  'Graph'                                   => 'Graph',
+  'L'                                       => '2',
+  'L&'                                      => 'L',
+  'LbrkAI'                                  => 'LbrkAI',
+  'LbrkAL'                                  => 'LbrkAL',
+  'LbrkB2'                                  => 'LbrkB2',
+  'LbrkBA'                                  => 'LbrkBA',
+  'LbrkBB'                                  => 'LbrkBB',
+  'LbrkBK'                                  => 'LbrkBK',
+  'LbrkCB'                                  => 'LbrkCB',
+  'LbrkCL'                                  => 'LbrkCL',
+  'LbrkCM'                                  => 'LbrkCM',
+  'LbrkCR'                                  => 'LbrkCR',
+  'LbrkEX'                                  => 'LbrkEX',
+  'LbrkGL'                                  => 'LbrkGL',
+  'LbrkHY'                                  => 'LbrkHY',
+  'LbrkID'                                  => 'LbrkID',
+  'LbrkIN'                                  => 'LbrkIN',
+  'LbrkIS'                                  => 'LbrkIS',
+  'LbrkLF'                                  => 'LbrkLF',
+  'LbrkNS'                                  => 'LbrkNS',
+  'LbrkNU'                                  => 'LbrkNU',
+  'LbrkOP'                                  => 'LbrkOP',
+  'LbrkPO'                                  => 'LbrkPO',
+  'LbrkPR'                                  => 'LbrkPR',
+  'LbrkQU'                                  => 'LbrkQU',
+  'LbrkSA'                                  => 'LbrkSA',
+  'LbrkSG'                                  => 'LbrkSG',
+  'LbrkSP'                                  => 'LbrkSP',
+  'LbrkSY'                                  => 'LbrkSY',
+  'LbrkXX'                                  => 'LbrkXX',
+  'LbrkZW'                                  => 'LbrkZW',
+  'Ll'                                      => 'Ll',
+  'Lm'                                      => 'Lm',
+  'Lo'                                      => 'Lo',
+  'Lower'                                   => 'Lower',
+  'Lt'                                      => 'Lt',
+  'Lu'                                      => 'Lu',
+  'M'                                       => 'M',
+  'Mc'                                      => 'Mc',
+  'Me'                                      => 'Me',
+  'Mirrored'                                => 'Mirrored',
+  'Mn'                                      => 'Mn',
+  'N'                                       => 'N',
+  'Nd'                                      => 'Nd',
+  'Nl'                                      => 'Nl',
+  'No'                                      => 'No',
+  'P'                                       => 'P',
+  'Pc'                                      => 'Pc',
+  'Pd'                                      => 'Pd',
+  'Pe'                                      => 'Pe',
+  'Pf'                                      => 'Pf',
+  'Pi'                                      => 'Pi',
+  'Po'                                      => 'Po',
+  'Print'                                   => 'Print',
+  'Ps'                                      => 'Ps',
+  'Punct'                                   => 'Punct',
+  'S'                                       => 'S',
+  'Sc'                                      => 'Sc',
+  'Sk'                                      => 'Sk',
+  'Sm'                                      => 'Sm',
+  'So'                                      => 'So',
+  'Space'                                   => 'Space',
+  'SpacePerl'                               => 'SpacePer',
+  'Title'                                   => 'Title',
+  'Upper'                                   => 'Upper',
+  'Word'                                    => 'Word',
+  'XDigit'                                  => 'XDigit',
+  'Z'                                       => 'Z',
+  'Zl'                                      => 'Zl',
+  'Zp'                                      => 'Zp',
+  'Zs'                                      => 'Zs',
 );
-%utf8::IsPat =
-(
-'cl' => {
+
+## Mappings from regex to filename in ./Is/
+%utf8::IsPat = (
+ 'al' => {
+       'Alphabetic' => 'Alphabet',
+       'All' => 'Any',
+ },
+ 'an' => {
+       'Any' => 'Any',
+ },
+ 'ar' => {
+       'Armenian' => 'Armenian',
+       'Arabic' => 'Arabic',
+ },
+ 'as' => {
+       'ASCII(?:[-_]|\s+)?Hex(?:[-_]|\s+)?Digit' => 'ASCIIHex',
+       'Assigned' => 'Assigned',
+ },
+ 'be' => {
+       'Bengali' => 'Bengali',
+ },
+ 'bi' => {
+       'Bidi(?:[-_]|\s+)?Control' => 'BidiCont',
+ },
+ 'bo' => {
+       'Bopomofo' => 'Bopomofo',
+ },
+ 'ca' => {
+       'Canadian(?:[-_]|\s+)?Aboriginal' => 'Canadian',
+ },
+ 'ch' => {
+       'Cherokee' => 'Cherokee',
+ },
+ 'cl' => {
        'Close(?:[-_]|\s+)?Punctuation' => 'Pe',
-},
-'co' => {
+ },
+ 'co' => {
        'Connector(?:[-_]|\s+)?Punctuation' => 'Pc',
        'Control' => 'Cc',
-},
-'cu' => {
+       'Common' => 'Common',
+ },
+ 'cu' => {
        'Currency(?:[-_]|\s+)?Symbol' => 'Sc',
-},
-'da' => {
+ },
+ 'cy' => {
+       'Cyrillic' => 'Cyrillic',
+ },
+ 'da' => {
        'Dash(?:[-_]|\s+)?Punctuation' => 'Pd',
-},
-'de' => {
+       'Dash' => 'Dash',
+ },
+ 'de' => {
+       'Devanagari' => 'Devanaga',
        'Decimal(?:[-_]|\s+)?Number' => 'Nd',
-},
-'en' => {
+       'Deseret' => 'Deseret',
+ },
+ 'di' => {
+       'Diacritic' => 'Diacriti',
+ },
+ 'en' => {
        'Enclosing(?:[-_]|\s+)?Mark' => 'Me',
-},
-'fi' => {
+ },
+ 'et' => {
+       'Ethiopic' => 'Ethiopic',
+ },
+ 'ex' => {
+       'Extender' => 'Extender',
+ },
+ 'fi' => {
        'Final(?:[-_]|\s+)?Punctuation' => 'Pf',
-},
-'fo' => {
+ },
+ 'fo' => {
        'Format' => 'Cf',
-},
-'in' => {
+ },
+ 'ge' => {
+       'Georgian' => 'Georgian',
+ },
+ 'go' => {
+       'Gothic' => 'Gothic',
+ },
+ 'gr' => {
+       'Greek' => 'Greek',
+ },
+ 'gu' => {
+       'Gurmukhi' => 'Gurmukhi',
+       'Gujarati' => 'Gujarati',
+ },
+ 'ha' => {
+       'Han' => 'Han',
+       'Hangul' => 'Hangul',
+ },
+ 'he' => {
+       'Hebrew' => 'Hebrew',
+       'Hex(?:[-_]|\s+)?Digit' => 'HexDigit',
+ },
+ 'hi' => {
+       'Hiragana' => 'Hiragana',
+ },
+ 'hy' => {
+       'Hyphen' => 'Hyphen',
+ },
+ 'id' => {
+       'Ideographic' => 'Ideograp',
+       'ID(?:[-_]|\s+)?Continue' => 'IDContin',
+       'ID(?:[-_]|\s+)?Start' => 'IDStart',
+ },
+ 'in' => {
+       'Inherited' => 'Inherite',
        'Initial(?:[-_]|\s+)?Punctuation' => 'Pi',
-},
-'le' => {
-       'Letter' => 'L',
+ },
+ 'jo' => {
+       'Join(?:[-_]|\s+)?Control' => 'JoinCont',
+ },
+ 'ka' => {
+       'Katakana' => 'Katakana',
+       'Kannada' => 'Kannada',
+ },
+ 'kh' => {
+       'Khmer' => 'Khmer',
+ },
+ 'la' => {
+       'Latin' => 'Latin',
+       'Lao' => 'Lao',
+ },
+ 'le' => {
        'Letter(?:[-_]|\s+)?Number' => 'Nl',
-},
-'li' => {
+       'Letter' => '2',
+ },
+ 'li' => {
        'Line(?:[-_]|\s+)?Separator' => 'Zl',
-},
-'lo' => {
+ },
+ 'lo' => {
        'Lowercase(?:[-_]|\s+)?Letter' => 'Ll',
-},
-'ma' => {
-       'Mark' => 'M',
+       'Lowercase' => 'Lowercas',
+ },
+ 'ma' => {
        'Math(?:[-_]|\s+)?Symbol' => 'Sm',
-},
-'mo' => {
+       'Mark' => 'M',
+       'Math' => 'Math',
+       'Malayalam' => 'Malayala',
+ },
+ 'mo' => {
        'Modifier(?:[-_]|\s+)?Letter' => 'Lm',
        'Modifier(?:[-_]|\s+)?Symbol' => 'Sk',
-},
-'no' => {
+       'Mongolian' => 'Mongolia',
+ },
+ 'my' => {
+       'Myanmar' => 'Myanmar',
+ },
+ 'no' => {
        'Non(?:[-_]|\s+)?Spacing(?:[-_]|\s+)?Mark' => 'Mn',
-},
-'nu' => {
+       'Noncharacter(?:[-_]|\s+)?Code(?:[-_]|\s+)?Point' => 'Nonchara',
+ },
+ 'nu' => {
        'Number' => 'N',
-},
-'op' => {
+ },
+ 'og' => {
+       'Ogham' => 'Ogham',
+ },
+ 'ol' => {
+       'Old(?:[-_]|\s+)?Italic' => 'OldItali',
+ },
+ 'op' => {
        'Open(?:[-_]|\s+)?Punctuation' => 'Ps',
-},
-'ot' => {
-       'Other' => 'C',
-       'Other(?:[-_]|\s+)?Letter' => 'Lo',
-       'Other(?:[-_]|\s+)?Number' => 'No',
+ },
+ 'or' => {
+       'Oriya' => 'Oriya',
+ },
+ 'ot' => {
+       'Other(?:[-_]|\s+)?Math' => 'OtherMat',
        'Other(?:[-_]|\s+)?Punctuation' => 'Po',
+       'Other(?:[-_]|\s+)?Lowercase' => 'OtherLow',
+       'Other(?:[-_]|\s+)?Uppercase' => 'OtherUpp',
+       'Other(?:[-_]|\s+)?Letter' => 'Lo',
+       'Other(?:[-_]|\s+)?Alphabetic' => 'OtherAlp',
        'Other(?:[-_]|\s+)?Symbol' => 'So',
-},
-'pa' => {
+       'Other(?:[-_]|\s+)?Number' => 'No',
+       'Other' => 'C',
+ },
+ 'pa' => {
        'Paragraph(?:[-_]|\s+)?Separator' => 'Zp',
-},
-'pr' => {
+ },
+ 'pr' => {
        'Private(?:[-_]|\s+)?Use' => 'Co',
-},
-'pu' => {
+ },
+ 'pu' => {
        'Punctuation' => 'P',
-},
-'se' => {
+ },
+ 'qu' => {
+       'Quotation(?:[-_]|\s+)?Mark' => 'Quotatio',
+ },
+ 'ru' => {
+       'Runic' => 'Runic',
+ },
+ 'se' => {
        'Separator' => 'Z',
-},
-'sp' => {
+ },
+ 'si' => {
+       'Sinhala' => 'Sinhala',
+ },
+ 'sp' => {
        'Space(?:[-_]|\s+)?Separator' => 'Zs',
        'Spacing(?:[-_]|\s+)?Mark' => 'Mc',
-},
-'su' => {
+ },
+ 'su' => {
        'Surrogate' => 'Cs',
-},
-'sy' => {
+ },
+ 'sy' => {
+       'Syriac' => 'Syriac',
        'Symbol' => 'S',
-},
-'ti' => {
+ },
+ 'ta' => {
+       'Tamil' => 'Tamil',
+ },
+ 'te' => {
+       'Terminal(?:[-_]|\s+)?Punctuation' => 'Terminal',
+       'Telugu' => 'Telugu',
+ },
+ 'th' => {
+       'Thaana' => 'Thaana',
+       'Thai' => 'Thai',
+ },
+ 'ti' => {
        'Titlecase(?:[-_]|\s+)?Letter' => 'Lt',
-},
-'un' => {
+       'Tibetan' => 'Tibetan',
+ },
+ 'un' => {
        'Unassigned' => 'Cn',
-},
-'up' => {
+ },
+ 'up' => {
        'Uppercase(?:[-_]|\s+)?Letter' => 'Lu',
-},
+       'Uppercase' => 'Uppercas',
+ },
+ 'wh' => {
+       'White(?:[-_]|\s+)?space' => 'WhiteSpa',
+ },
+ 'yi' => {
+       'Yi' => 'Yi',
+ },
 );