# !!!!!!! DO NOT EDIT THIS FILE !!!!!!!
# This file is built by mktables from e.g. UnicodeData.txt.
# Any changes made here will be lost!

##
## Data in this file used by ../utf8_heavy.pl
##

## Mapping from lc(canonical name) to filename in ./lib
##
## Each key is a lower-cased canonical name and each value is the name
## of the corresponding file in ./lib.  Where the generated source spelled
## out the mixed-case canonical name for an entry, it is kept as a trailing
## comment on that entry's line.  Entries must stay one per line: a '#'
## comment runs to end of line, so anything sharing a line with a
## comment-first layout would be swallowed by it.
%utf8::Canonical = (
    aegeannumbers => 'InAegean',  # InAegeanNumbers
    alphabetic => 'Alphabet',
    alphabeticpresentationforms => 'InAlphab',  # InAlphabeticPresentationForms
    ancientgreekmusicalnotation => 'InAncie2',  # InAncientGreekMusicalNotation
    ancientgreeknumbers => 'InAncien',  # InAncientGreekNumbers
    arabic => 'Arab',
    arabicpresentationformsa => 'InArabi4',  # InArabicPresentationFormsA
    arabicpresentationformsb => 'InArabi3',  # InArabicPresentationFormsB
    arabicsupplement => 'InArabi2',  # InArabicSupplement
    armenian => 'Armn',
    arrows => 'InArrows',  # InArrows
    asciihexdigit => 'AsciiHex',  # AsciiHexDigit
    basiclatin => 'InBasicL',  # InBasicLatin
    bengali => 'Beng',
    bidicontrol => 'BidiCont',  # BidiControl
    blockelements => 'InBlockE',  # InBlockElements
    bopomofo => 'Bopo',
    bopomofoextended => 'InBopom2',  # InBopomofoExtended
    boxdrawing => 'InBoxDra',  # InBoxDrawing
    braille => 'Brai',
    braillepatterns => 'InBraill',  # InBraillePatterns
    buginese => 'Bugi',
    buhid => 'Buhd',
    byzantinemusicalsymbols => 'InByzant',  # InByzantineMusicalSymbols
    canadianaboriginal => 'Canadian',  # CanadianAboriginal
    casedletter => 'LC',  # CasedLetter
    cherokee => 'Cher',
    cjkcompatibility => 'InCjkCom',  # InCjkCompatibility
    cjkcompatibilityforms => 'InCjkCo2',  # InCjkCompatibilityForms
    cjkcompatibilityideographs => 'InCjkCo3',  # InCjkCompatibilityIdeographs
    cjkcompatibilityideographssupplement => 'InCjkCo4',  # InCjkCompatibilityIdeographsSupplement
    cjkradicalssupplement => 'InCjkRad',  # InCjkRadicalsSupplement
    cjkstrokes => 'InCjkStr',  # InCjkStrokes
    cjksymbolsandpunctuation => 'InCjkSym',  # InCjkSymbolsAndPunctuation
    cjkunifiedideographs => 'InCjkUni',  # InCjkUnifiedIdeographs
    cjkunifiedideographsextensiona => 'InCjkUn3',  # InCjkUnifiedIdeographsExtensionA
    cjkunifiedideographsextensionb => 'InCjkUn2',  # InCjkUnifiedIdeographsExtensionB
    closepunctuation => 'Pe',  # ClosePunctuation
    combiningdiacriticalmarks => 'InCombi2',  # InCombiningDiacriticalMarks
    combiningdiacriticalmarksforsymbols => 'InCombi4',  # InCombiningDiacriticalMarksForSymbols
    combiningdiacriticalmarkssupplement => 'InCombi3',  # InCombiningDiacriticalMarksSupplement
    combininghalfmarks => 'InCombin',  # InCombiningHalfMarks
    common => 'Zyyy',
    connectorpunctuation => 'Pc',  # ConnectorPunctuation
    control => 'Cc',
    controlpictures => 'InContro',  # InControlPictures
    coptic => 'Copt',
    currencysymbol => 'Sc',  # CurrencySymbol
    currencysymbols => 'InCurren',  # InCurrencySymbols
    cypriot => 'Cprt',
    cypriotsyllabary => 'InCyprio',  # InCypriotSyllabary
    cyrillic => 'Cyrl',
    cyrillicsupplement => 'InCyril2',  # InCyrillicSupplement
    dash => 'Dash2',
    dashpunctuation => 'Pd',  # DashPunctuation
    decimalnumber => 'Nd',  # DecimalNumber
    deprecated => 'Deprecat',
    deseret => 'Dsrt',
    devanagari => 'Deva',
    diacritic => 'Diacriti',
    dingbats => 'InDingba',  # InDingbats
    enclosedalphanumerics => 'InEnclos',  # InEnclosedAlphanumerics
    enclosedcjklettersandmonths => 'InEnclo2',  # InEnclosedCjkLettersAndMonths
    enclosingmark => 'Me',  # EnclosingMark
    ethiopic => 'Ethi',
    ethiopicextended => 'InEthio2',  # InEthiopicExtended
    ethiopicsupplement => 'InEthio3',  # InEthiopicSupplement
    extender => 'Extender',
    finalpunctuation => 'Pf',  # FinalPunctuation
    format => 'Cf',
    generalpunctuation => 'InGenera',  # InGeneralPunctuation
    geometricshapes => 'InGeomet',  # InGeometricShapes
    georgian => 'Geor',
    georgiansupplement => 'InGeorg2',  # InGeorgianSupplement
    glagolitic => 'Glag',
    gothic => 'Goth',
    graphemelink => 'Grapheme',  # GraphemeLink
    greek => 'Grek',
    greekandcoptic => 'InGreekA',  # InGreekAndCoptic
    greekextended => 'InGreekE',  # InGreekExtended
    gujarati => 'Gujr',
    gurmukhi => 'Guru',
    halfwidthandfullwidthforms => 'InHalfwi',  # InHalfwidthAndFullwidthForms
    han => 'Hani',
    hangul => 'Hang',
    hangulcompatibilityjamo => 'InHangu3',  # InHangulCompatibilityJamo
    hanguljamo => 'InHangul',  # InHangulJamo
    hangulsyllables => 'InHangu2',  # InHangulSyllables
    hanunoo => 'Hano',
    hebrew => 'Hebr',
    hexdigit => 'HexDigit',  # HexDigit
    highprivateusesurrogates => 'InHighPr',  # InHighPrivateUseSurrogates
    highsurrogates => 'InHighSu',  # InHighSurrogates
    hiragana => 'Hira',
    hyphen => 'Hyphen2',
    idcontinue => 'IdContin',  # IdContinue
    ideographic => 'Ideograp',
    ideographicdescriptioncharacters => 'InIdeogr',  # InIdeographicDescriptionCharacters
    idsbinaryoperator => 'IdsBinar',  # IdsBinaryOperator
    idstart => 'IdStart',  # IdStart
    idstrinaryoperator => 'IdsTrina',  # IdsTrinaryOperator
    inaegeannumbers => 'InAegean',  # InAegeanNumbers
    inalphabeticpresentationforms => 'InAlphab',  # InAlphabeticPresentationForms
    inancientgreekmusicalnotation => 'InAncie2',  # InAncientGreekMusicalNotation
    inancientgreeknumbers => 'InAncien',  # InAncientGreekNumbers
    inarabic => 'InArabic',  # InArabic
    inarabicpresentationformsa => 'InArabi4',  # InArabicPresentationFormsA
    inarabicpresentationformsb => 'InArabi3',  # InArabicPresentationFormsB
    inarabicsupplement => 'InArabi2',  # InArabicSupplement
    inarmenian => 'InArmeni',  # InArmenian
    inarrows => 'InArrows',  # InArrows
    inbasiclatin => 'InBasicL',  # InBasicLatin
    inbengali => 'InBengal',  # InBengali
    inblockelements => 'InBlockE',  # InBlockElements
    inbopomofo => 'InBopomo',  # InBopomofo
    inbopomofoextended => 'InBopom2',  # InBopomofoExtended
    inboxdrawing => 'InBoxDra',  # InBoxDrawing
    inbraillepatterns => 'InBraill',  # InBraillePatterns
    inbuginese => 'InBugine',  # InBuginese
    inbuhid => 'InBuhid',  # InBuhid
    inbyzantinemusicalsymbols => 'InByzant',  # InByzantineMusicalSymbols
    incherokee => 'InCherok',  # InCherokee
    incjkcompatibility => 'InCjkCom',  # InCjkCompatibility
    incjkcompatibilityforms => 'InCjkCo2',  # InCjkCompatibilityForms
    incjkcompatibilityideographs => 'InCjkCo3',  # InCjkCompatibilityIdeographs
    incjkcompatibilityideographssupplement => 'InCjkCo4',  # InCjkCompatibilityIdeographsSupplement
    incjkradicalssupplement => 'InCjkRad',  # InCjkRadicalsSupplement
    incjkstrokes => 'InCjkStr',  # InCjkStrokes
    incjksymbolsandpunctuation => 'InCjkSym',  # InCjkSymbolsAndPunctuation
    incjkunifiedideographs => 'InCjkUni',  # InCjkUnifiedIdeographs
    incjkunifiedideographsextensiona => 'InCjkUn3',  # InCjkUnifiedIdeographsExtensionA
    incjkunifiedideographsextensionb => 'InCjkUn2',  # InCjkUnifiedIdeographsExtensionB
    incombiningdiacriticalmarks => 'InCombi2',  # InCombiningDiacriticalMarks
    incombiningdiacriticalmarksforsymbols => 'InCombi4',  # InCombiningDiacriticalMarksForSymbols
    incombiningdiacriticalmarkssupplement => 'InCombi3',  # InCombiningDiacriticalMarksSupplement
    incombininghalfmarks => 'InCombin',  # InCombiningHalfMarks
    incontrolpictures => 'InContro',  # InControlPictures
    incoptic => 'InCoptic',  # InCoptic
    incurrencysymbols => 'InCurren',  # InCurrencySymbols
    incypriotsyllabary => 'InCyprio',  # InCypriotSyllabary
    incyrillic => 'InCyrill',  # InCyrillic
    incyrillicsupplement => 'InCyril2',  # InCyrillicSupplement
    indeseret => 'InDesere',  # InDeseret
    indevanagari => 'InDevana',  # InDevanagari
    indingbats => 'InDingba',  # InDingbats
    inenclosedalphanumerics => 'InEnclos',  # InEnclosedAlphanumerics
    inenclosedcjklettersandmonths => 'InEnclo2',  # InEnclosedCjkLettersAndMonths
    inethiopic => 'InEthiop',  # InEthiopic
    inethiopicextended => 'InEthio2',  # InEthiopicExtended
    inethiopicsupplement => 'InEthio3',  # InEthiopicSupplement
    ingeneralpunctuation => 'InGenera',  # InGeneralPunctuation
    ingeometricshapes => 'InGeomet',  # InGeometricShapes
    ingeorgian => 'InGeorgi',  # InGeorgian
    ingeorgiansupplement => 'InGeorg2',  # InGeorgianSupplement
    inglagolitic => 'InGlagol',  # InGlagolitic
    ingothic => 'InGothic',  # InGothic
    ingreekandcoptic => 'InGreekA',  # InGreekAndCoptic
    ingreekextended => 'InGreekE',  # InGreekExtended
    ingujarati => 'InGujara',  # InGujarati
    ingurmukhi => 'InGurmuk',  # InGurmukhi
    inhalfwidthandfullwidthforms => 'InHalfwi',  # InHalfwidthAndFullwidthForms
    inhangulcompatibilityjamo => 'InHangu3',  # InHangulCompatibilityJamo
    inhanguljamo => 'InHangul',  # InHangulJamo
    inhangulsyllables => 'InHangu2',  # InHangulSyllables
    inhanunoo => 'InHanuno',  # InHanunoo
    inhebrew => 'InHebrew',  # InHebrew
    inherited => 'Qaai',
    inhighprivateusesurrogates => 'InHighPr',  # InHighPrivateUseSurrogates
    inhighsurrogates => 'InHighSu',  # InHighSurrogates
    inhiragana => 'InHiraga',  # InHiragana
    inideographicdescriptioncharacters => 'InIdeogr',  # InIdeographicDescriptionCharacters
    inipaextensions => 'InIpaExt',  # InIpaExtensions
    initialpunctuation => 'Pi',  # InitialPunctuation
    inkanbun => 'InKanbun',  # InKanbun
    inkangxiradicals => 'InKangxi',  # InKangxiRadicals
    inkannada => 'InKannad',  # InKannada
    inkatakana => 'InKataka',  # InKatakana
    inkatakanaphoneticextensions => 'InKatak2',  # InKatakanaPhoneticExtensions
    inkharoshthi => 'InKharos',  # InKharoshthi
    inkhmer => 'InKhmer',  # InKhmer
    inkhmersymbols => 'InKhmerS',  # InKhmerSymbols
    inlao => 'InLao',  # InLao
    inlatin1supplement => 'InLatin1',  # InLatin1Supplement
    inlatinextendeda => 'InLatin2',  # InLatinExtendedA
    inlatinextendedadditional => 'InLatin3',  # InLatinExtendedAdditional
    inlatinextendedb => 'InLatinE',  # InLatinExtendedB
    inletterlikesymbols => 'InLetter',  # InLetterlikeSymbols
    inlimbu => 'InLimbu',  # InLimbu
    inlinearbideograms => 'InLinear',  # InLinearBIdeograms
    inlinearbsyllabary => 'InLinea2',  # InLinearBSyllabary
    inlowsurrogates => 'InLowSur',  # InLowSurrogates
    inmalayalam => 'InMalaya',  # InMalayalam
    inmathematicalalphanumericsymbols => 'InMathe2',  # InMathematicalAlphanumericSymbols
    inmathematicaloperators => 'InMathem',  # InMathematicalOperators
    inmiscellaneousmathematicalsymbolsa => 'InMisce4',  # InMiscellaneousMathematicalSymbolsA
    inmiscellaneousmathematicalsymbolsb => 'InMisce5',  # InMiscellaneousMathematicalSymbolsB
    inmiscellaneoussymbols => 'InMiscel',  # InMiscellaneousSymbols
    inmiscellaneoussymbolsandarrows => 'InMisce3',  # InMiscellaneousSymbolsAndArrows
    inmiscellaneoustechnical => 'InMisce2',  # InMiscellaneousTechnical
    inmodifiertoneletters => 'InModifi',  # InModifierToneLetters
    inmongolian => 'InMongol',  # InMongolian
    inmusicalsymbols => 'InMusica',  # InMusicalSymbols
    inmyanmar => 'InMyanma',  # InMyanmar
    innewtailue => 'InNewTai',  # InNewTaiLue
    innumberforms => 'InNumber',  # InNumberForms
    inogham => 'InOgham',  # InOgham
    inolditalic => 'InOldIta',  # InOldItalic
    inoldpersian => 'InOldPer',  # InOldPersian
    inopticalcharacterrecognition => 'InOptica',  # InOpticalCharacterRecognition
    inoriya => 'InOriya',  # InOriya
    inosmanya => 'InOsmany',  # InOsmanya
    inphoneticextensions => 'InPhonet',  # InPhoneticExtensions
    inphoneticextensionssupplement => 'InPhone2',  # InPhoneticExtensionsSupplement
    inprivateusearea => 'InPrivat',  # InPrivateUseArea
    inrunic => 'InRunic',  # InRunic
    inshavian => 'InShavia',  # InShavian
    insinhala => 'InSinhal',  # InSinhala
    insmallformvariants => 'InSmallF',  # InSmallFormVariants
    inspacingmodifierletters => 'InSpacin',  # InSpacingModifierLetters
    inspecials => 'InSpecia',  # InSpecials
    insuperscriptsandsubscripts => 'InSupers',  # InSuperscriptsAndSubscripts
    insupplementalarrowsa => 'InSuppl2',  # InSupplementalArrowsA
    insupplementalarrowsb => 'InSupple',  # InSupplementalArrowsB
    insupplementalmathematicaloperators => 'InSuppl6',  # InSupplementalMathematicalOperators
    insupplementalpunctuation => 'InSuppl3',  # InSupplementalPunctuation
    insupplementaryprivateuseareaa => 'InSuppl4',  # InSupplementaryPrivateUseAreaA
    insupplementaryprivateuseareab => 'InSuppl5',  # InSupplementaryPrivateUseAreaB
    insylotinagri => 'InSyloti',  # InSylotiNagri
    insyriac => 'InSyriac',  # InSyriac
    intagalog => 'InTagalo',  # InTagalog
    intagbanwa => 'InTagban',  # InTagbanwa
    intags => 'InTags',  # InTags
    intaile => 'InTaiLe',  # InTaiLe
    intaixuanjingsymbols => 'InTaiXua',  # InTaiXuanJingSymbols
    intamil => 'InTamil',  # InTamil
    intelugu => 'InTelugu',  # InTelugu
    inthaana => 'InThaana',  # InThaana
    inthai => 'InThai',  # InThai
    intibetan => 'InTibeta',  # InTibetan
    intifinagh => 'InTifina',  # InTifinagh
    inugaritic => 'InUgarit',  # InUgaritic
    inunifiedcanadianaboriginalsyllabics => 'InUnifie',  # InUnifiedCanadianAboriginalSyllabics
    invariationselectors => 'InVariat',  # InVariationSelectors
    invariationselectorssupplement => 'InVaria2',  # InVariationSelectorsSupplement
    inverticalforms => 'InVertic',  # InVerticalForms
    inyijinghexagramsymbols => 'InYijing',  # InYijingHexagramSymbols
    inyiradicals => 'InYiRadi',  # InYiRadicals
    inyisyllables => 'InYiSyll',  # InYiSyllables
    ipaextensions => 'InIpaExt',  # InIpaExtensions
    joincontrol => 'JoinCont',  # JoinControl
    kanbun => 'InKanbun',  # InKanbun
    kangxiradicals => 'InKangxi',  # InKangxiRadicals
    kannada => 'Knda',
    katakana => 'Kana',
    katakanaphoneticextensions => 'InKatak2',  # InKatakanaPhoneticExtensions
    kharoshthi => 'Khar',
    khmer => 'Khmr',
    khmersymbols => 'InKhmerS',  # InKhmerSymbols
    lao => 'Laoo',
    latin => 'Latn',
    latin1supplement => 'InLatin1',  # InLatin1Supplement
    latinextendeda => 'InLatin2',  # InLatinExtendedA
    latinextendedadditional => 'InLatin3',  # InLatinExtendedAdditional
    latinextendedb => 'InLatinE',  # InLatinExtendedB
    letter => 'L',
    letterlikesymbols => 'InLetter',  # InLetterlikeSymbols
    letternumber => 'Nl',  # LetterNumber
    limbu => 'Limb',
    linearb => 'LinearB',  # LinearB
    linearbideograms => 'InLinear',  # InLinearBIdeograms
    linearbsyllabary => 'InLinea2',  # InLinearBSyllabary
    lineseparator => 'Zl',  # LineSeparator
    logicalorderexception => 'LogicalO',  # LogicalOrderException
    lowercase => 'Lowercas',
    lowercaseletter => 'Ll',  # LowercaseLetter
    lowsurrogates => 'InLowSur',  # InLowSurrogates
    malayalam => 'Mlym',
    mark => 'M',
    math => 'Math',
    mathematicalalphanumericsymbols => 'InMathe2',  # InMathematicalAlphanumericSymbols
    mathematicaloperators => 'InMathem',  # InMathematicalOperators
    mathsymbol => 'Sm',  # MathSymbol
    miscellaneousmathematicalsymbolsa => 'InMisce4',  # InMiscellaneousMathematicalSymbolsA
    miscellaneousmathematicalsymbolsb => 'InMisce5',  # InMiscellaneousMathematicalSymbolsB
    miscellaneoussymbols => 'InMiscel',  # InMiscellaneousSymbols
    miscellaneoussymbolsandarrows => 'InMisce3',  # InMiscellaneousSymbolsAndArrows
    miscellaneoustechnical => 'InMisce2',  # InMiscellaneousTechnical
    modifierletter => 'Lm',  # ModifierLetter
    modifiersymbol => 'Sk',  # ModifierSymbol
    modifiertoneletters => 'InModifi',  # InModifierToneLetters
    mongolian => 'Mong',
    musicalsymbols => 'InMusica',  # InMusicalSymbols
    myanmar => 'Mymr',
    newtailue => 'NewTaiLu',  # NewTaiLue
    noncharactercodepoint => 'Nonchara',  # NoncharacterCodePoint
    nonspacingmark => 'Mn',  # NonspacingMark
    number => 'N',
    numberforms => 'InNumber',  # InNumberForms
    ogham => 'Ogam',
    olditalic => 'OldItali',  # OldItalic
    oldpersian => 'OldPersi',  # OldPersian
    openpunctuation => 'Ps',  # OpenPunctuation
    opticalcharacterrecognition => 'InOptica',  # InOpticalCharacterRecognition
    oriya => 'Orya',
    osmanya => 'Osma',
    other => 'C',
    otheralphabetic => 'OtherAlp',  # OtherAlphabetic
    otherdefaultignorablecodepoint => 'OtherDef',  # OtherDefaultIgnorableCodePoint
    othergraphemeextend => 'OtherGra',  # OtherGraphemeExtend
    otheridcontinue => 'OtherIdC',  # OtherIdContinue
    otheridstart => 'OtherIdS',  # OtherIdStart
    otherletter => 'Lo',  # OtherLetter
    otherlowercase => 'OtherLow',  # OtherLowercase
    othermath => 'OtherMat',  # OtherMath
    othernumber => 'No',  # OtherNumber
    otherpunctuation => 'Po',  # OtherPunctuation
    othersymbol => 'So',  # OtherSymbol
    otheruppercase => 'OtherUpp',  # OtherUppercase
    paragraphseparator => 'Zp',  # ParagraphSeparator
    patternsyntax => 'PatternS',  # PatternSyntax
    patternwhitespace => 'PatternW',  # PatternWhiteSpace
    phoneticextensions => 'InPhonet',  # InPhoneticExtensions
    phoneticextensionssupplement => 'InPhone2',  # InPhoneticExtensionsSupplement
    privateuse => 'Co',  # PrivateUse
    privateusearea => 'InPrivat',  # InPrivateUseArea
    punctuation => 'P',
    quotationmark => 'Quotatio',  # QuotationMark
    radical => 'Radical2',
    runic => 'Runr',
    separator => 'Z',
    shavian => 'Shaw',
    sinhala => 'Sinh',
    smallformvariants => 'InSmallF',  # InSmallFormVariants
    softdotted => 'SoftDott',  # SoftDotted
    spaceseparator => 'Zs',  # SpaceSeparator
    spacingmark => 'Mc',  # SpacingMark
    spacingmodifierletters => 'InSpacin',  # InSpacingModifierLetters
    specials => 'InSpecia',  # InSpecials
    sterm => 'Sterm2',
    superscriptsandsubscripts => 'InSupers',  # InSuperscriptsAndSubscripts
    supplementalarrowsa => 'InSuppl2',  # InSupplementalArrowsA
    supplementalarrowsb => 'InSupple',  # InSupplementalArrowsB
    supplementalmathematicaloperators => 'InSuppl6',  # InSupplementalMathematicalOperators
    supplementalpunctuation => 'InSuppl3',  # InSupplementalPunctuation
    supplementaryprivateuseareaa => 'InSuppl4',  # InSupplementaryPrivateUseAreaA
    supplementaryprivateuseareab => 'InSuppl5',  # InSupplementaryPrivateUseAreaB
    surrogate => 'Cs',
    sylotinagri => 'SylotiNa',  # SylotiNagri
    symbol => 'S',
    syriac => 'Syrc',
    tagalog => 'Tglg',
    tagbanwa => 'Tagb',
    tags => 'InTags',  # InTags
    taile => 'TaiLe',  # TaiLe
    taixuanjingsymbols => 'InTaiXua',  # InTaiXuanJingSymbols
    tamil => 'Taml',
    telugu => 'Telu',
    terminalpunctuation => 'Terminal',  # TerminalPunctuation
    thaana => 'Thaa',
    thai => 'Thai',
    tibetan => 'Tibt',
    tifinagh => 'Tfng',
    titlecaseletter => 'Lt',  # TitlecaseLetter
    ugaritic => 'Ugar',
    unassigned => 'Cn',
    unifiedcanadianaboriginalsyllabics => 'InUnifie',  # InUnifiedCanadianAboriginalSyllabics
    unifiedideograph => 'UnifiedI',  # UnifiedIdeograph
    uppercase => 'Uppercas',
    uppercaseletter => 'Lu',  # UppercaseLetter
    variationselector => 'Variatio',  # VariationSelector
    variationselectors => 'InVariat',  # InVariationSelectors
    variationselectorssupplement => 'InVaria2',  # InVariationSelectorsSupplement
    verticalforms => 'InVertic',  # InVerticalForms
    whitespace => 'WhiteSpa',  # WhiteSpace
    yi => 'Yiii',
    yijinghexagramsymbols => 'InYijing',  # InYijingHexagramSymbols
    yiradicals => 'InYiRadi',  # InYiRadicals
    yisyllables => 'InYiSyll',  # InYiSyllables
);

# True value so that loading this file via require/do reports success.
1;