Update of /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt
In directory subversions:/tmp/cvs-serv25158/lib/MHonArc/CharEnt
Modified Files:
CP1250.pm ISO8859_10.pm ISO8859_15.pm ISO8859_2.pm
ISO8859_3.pm ISO8859_4.pm ISO8859_5.pm ISO8859_6.pm
ISO8859_7.pm ISO8859_8.pm ISO8859_9.pm
Added Files:
AppleArabic.pm AppleCenteuro.pm AppleCroatian.pm
AppleCyrillic.pm AppleGreek.pm AppleHebrew.pm AppleIceland.pm
AppleRoman.pm AppleRomanian.pm AppleThai.pm AppleTurkish.pm
CP1251.pm CP1253.pm CP1254.pm CP1255.pm CP1256.pm CP1257.pm
CP1258.pm GOST19768_87.pm ISO8859_11.pm ISO8859_13.pm
ISO8859_14.pm ISO8859_16.pm KOI8_A.pm KOI8_B.pm KOI8_E.pm
KOI8_F.pm KOI8_R.pm KOI8_U.pm KOI_0.pm KOI_7.pm VISCII.pm
Log Message:
* Added CHARSETALIASES resource to define aliases for official
charset names.
* MHonArc::CharEnt:
+ Several charset mappings added to MHonArc::CharEnt with the
default value for CHARSETCONVERTERS updated to reflect the new
mappings: various Cyrillic sets, VISCII, Apple-based charsets, etc.
Sets that have bidirectional rendering (Hebrew, Arabic) exist,
but directional re-ordering for rendering is currently not supported.
. Some existing mappings have been updated to use Unicode numeric
character entity references (&#xHHHH;) instead of standard SGML
character entity references (e.g. &AElig;). Most, if not all,
web browsers only support the set of SGML entity references
defined in the HTML 4.0 specification.
All existing tables should now generate entity references
recognized by all HTML 4.0 compliant browsers.
--- NEW FILE ---
package MHonArc::CharEnt::AppleArabic;
# Apple Arabic
#
# Lookup table for the Apple Arabic character set.  Each key is a
# character code of that set (written in hex); each value is the body of
# a Unicode numeric character reference ("#xHHHH") for that character.
#
# Notes:
#   * The leading "+" makes Perl parse "{" as an anonymous hash
#     constructor instead of a bare block; the resulting hash reference
#     is the value of the last statement of this file.
#   * The "left-right" / "right-left" remarks are informational only.
#     A code and its right-left twin map to the same Unicode value
#     (e.g. 0x21 and 0xA1 both give '#x0021'); no directional
#     re-ordering is encoded in this table.
#   * Codes that are absent (e.g. 0x30-0x39, 0x41-0x5A) simply have no
#     entry here; how unmapped codes are treated is up to the consumer.
#   * Every per-entry comment must stay on a single line: a wrapped
#     continuation would fall outside the comment and break the hash.
+{
#--------------------------------------------------------------------------
# Code     Entity ref   # Unicode character name (and direction note)
#--------------------------------------------------------------------------
    0x20 => '#x0020',   # SPACE, left-right
    0x21 => '#x0021',   # EXCLAMATION MARK, left-right
    0x22 => '#x0022',   # QUOTATION MARK, left-right
    0x23 => '#x0023',   # NUMBER SIGN, left-right
    0x24 => '#x0024',   # DOLLAR SIGN, left-right
    0x25 => '#x0025',   # PERCENT SIGN, left-right
    0x26 => '#x0026',   # AMPERSAND, left-right
    0x27 => '#x0027',   # APOSTROPHE, left-right
    0x28 => '#x0028',   # LEFT PARENTHESIS, left-right
    0x29 => '#x0029',   # RIGHT PARENTHESIS, left-right
    0x2A => '#x002A',   # ASTERISK, left-right
    0x2B => '#x002B',   # PLUS SIGN, left-right
    0x2C => '#x002C',   # COMMA, left-right
    0x2D => '#x002D',   # HYPHEN-MINUS, left-right
    0x2E => '#x002E',   # FULL STOP, left-right
    0x2F => '#x002F',   # SOLIDUS, left-right
    0x3A => '#x003A',   # COLON, left-right
    0x3B => '#x003B',   # SEMICOLON, left-right
    0x3C => '#x003C',   # LESS-THAN SIGN, left-right
    0x3D => '#x003D',   # EQUALS SIGN, left-right
    0x3E => '#x003E',   # GREATER-THAN SIGN, left-right
    0x3F => '#x003F',   # QUESTION MARK, left-right
    0x5B => '#x005B',   # LEFT SQUARE BRACKET, left-right
    0x5C => '#x005C',   # REVERSE SOLIDUS, left-right
    0x5D => '#x005D',   # RIGHT SQUARE BRACKET, left-right
    0x5E => '#x005E',   # CIRCUMFLEX ACCENT, left-right
    0x5F => '#x005F',   # LOW LINE, left-right
    0x7B => '#x007B',   # LEFT CURLY BRACKET, left-right
    0x7C => '#x007C',   # VERTICAL LINE, left-right
    0x7D => '#x007D',   # RIGHT CURLY BRACKET, left-right
    0x80 => '#x00C4',   # LATIN CAPITAL LETTER A WITH DIAERESIS
    0x81 => '#x00A0',   # NO-BREAK SPACE, right-left
    0x82 => '#x00C7',   # LATIN CAPITAL LETTER C WITH CEDILLA
    0x83 => '#x00C9',   # LATIN CAPITAL LETTER E WITH ACUTE
    0x84 => '#x00D1',   # LATIN CAPITAL LETTER N WITH TILDE
    0x85 => '#x00D6',   # LATIN CAPITAL LETTER O WITH DIAERESIS
    0x86 => '#x00DC',   # LATIN CAPITAL LETTER U WITH DIAERESIS
    0x87 => '#x00E1',   # LATIN SMALL LETTER A WITH ACUTE
    0x88 => '#x00E0',   # LATIN SMALL LETTER A WITH GRAVE
    0x89 => '#x00E2',   # LATIN SMALL LETTER A WITH CIRCUMFLEX
    0x8A => '#x00E4',   # LATIN SMALL LETTER A WITH DIAERESIS
    0x8B => '#x06BA',   # ARABIC LETTER NOON GHUNNA
    0x8C => '#x00AB',   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK, right-left
    0x8D => '#x00E7',   # LATIN SMALL LETTER C WITH CEDILLA
    0x8E => '#x00E9',   # LATIN SMALL LETTER E WITH ACUTE
    0x8F => '#x00E8',   # LATIN SMALL LETTER E WITH GRAVE
    0x90 => '#x00EA',   # LATIN SMALL LETTER E WITH CIRCUMFLEX
    0x91 => '#x00EB',   # LATIN SMALL LETTER E WITH DIAERESIS
    0x92 => '#x00ED',   # LATIN SMALL LETTER I WITH ACUTE
    0x93 => '#x2026',   # HORIZONTAL ELLIPSIS, right-left
    0x94 => '#x00EE',   # LATIN SMALL LETTER I WITH CIRCUMFLEX
    0x95 => '#x00EF',   # LATIN SMALL LETTER I WITH DIAERESIS
    0x96 => '#x00F1',   # LATIN SMALL LETTER N WITH TILDE
    0x97 => '#x00F3',   # LATIN SMALL LETTER O WITH ACUTE
    0x98 => '#x00BB',   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK, right-left
    0x99 => '#x00F4',   # LATIN SMALL LETTER O WITH CIRCUMFLEX
    0x9A => '#x00F6',   # LATIN SMALL LETTER O WITH DIAERESIS
    0x9B => '#x00F7',   # DIVISION SIGN, right-left
    0x9C => '#x00FA',   # LATIN SMALL LETTER U WITH ACUTE
    0x9D => '#x00F9',   # LATIN SMALL LETTER U WITH GRAVE
    0x9E => '#x00FB',   # LATIN SMALL LETTER U WITH CIRCUMFLEX
    0x9F => '#x00FC',   # LATIN SMALL LETTER U WITH DIAERESIS
    0xA0 => '#x0020',   # SPACE, right-left
    0xA1 => '#x0021',   # EXCLAMATION MARK, right-left
    0xA2 => '#x0022',   # QUOTATION MARK, right-left
    0xA3 => '#x0023',   # NUMBER SIGN, right-left
    0xA4 => '#x0024',   # DOLLAR SIGN, right-left
    0xA5 => '#x066A',   # ARABIC PERCENT SIGN
    0xA6 => '#x0026',   # AMPERSAND, right-left
    0xA7 => '#x0027',   # APOSTROPHE, right-left
    0xA8 => '#x0028',   # LEFT PARENTHESIS, right-left
    0xA9 => '#x0029',   # RIGHT PARENTHESIS, right-left
    0xAA => '#x002A',   # ASTERISK, right-left
    0xAB => '#x002B',   # PLUS SIGN, right-left
    0xAC => '#x060C',   # ARABIC COMMA
    0xAD => '#x002D',   # HYPHEN-MINUS, right-left
    0xAE => '#x002E',   # FULL STOP, right-left
    0xAF => '#x002F',   # SOLIDUS, right-left
    0xB0 => '#x0660',   # ARABIC-INDIC DIGIT ZERO, right-left
    0xB1 => '#x0661',   # ARABIC-INDIC DIGIT ONE, right-left
    0xB2 => '#x0662',   # ARABIC-INDIC DIGIT TWO, right-left
    0xB3 => '#x0663',   # ARABIC-INDIC DIGIT THREE, right-left
    0xB4 => '#x0664',   # ARABIC-INDIC DIGIT FOUR, right-left
    0xB5 => '#x0665',   # ARABIC-INDIC DIGIT FIVE, right-left
    0xB6 => '#x0666',   # ARABIC-INDIC DIGIT SIX, right-left
    0xB7 => '#x0667',   # ARABIC-INDIC DIGIT SEVEN, right-left
    0xB8 => '#x0668',   # ARABIC-INDIC DIGIT EIGHT, right-left
    0xB9 => '#x0669',   # ARABIC-INDIC DIGIT NINE, right-left
    0xBA => '#x003A',   # COLON, right-left
    0xBB => '#x061B',   # ARABIC SEMICOLON
    0xBC => '#x003C',   # LESS-THAN SIGN, right-left
    0xBD => '#x003D',   # EQUALS SIGN, right-left
    0xBE => '#x003E',   # GREATER-THAN SIGN, right-left
    0xBF => '#x061F',   # ARABIC QUESTION MARK
    0xC0 => '#x274A',   # EIGHT TEARDROP-SPOKED PROPELLER ASTERISK, right-left
    0xC1 => '#x0621',   # ARABIC LETTER HAMZA
    0xC2 => '#x0622',   # ARABIC LETTER ALEF WITH MADDA ABOVE
    0xC3 => '#x0623',   # ARABIC LETTER ALEF WITH HAMZA ABOVE
    0xC4 => '#x0624',   # ARABIC LETTER WAW WITH HAMZA ABOVE
    0xC5 => '#x0625',   # ARABIC LETTER ALEF WITH HAMZA BELOW
    0xC6 => '#x0626',   # ARABIC LETTER YEH WITH HAMZA ABOVE
    0xC7 => '#x0627',   # ARABIC LETTER ALEF
    0xC8 => '#x0628',   # ARABIC LETTER BEH
    0xC9 => '#x0629',   # ARABIC LETTER TEH MARBUTA
    0xCA => '#x062A',   # ARABIC LETTER TEH
    0xCB => '#x062B',   # ARABIC LETTER THEH
    0xCC => '#x062C',   # ARABIC LETTER JEEM
    0xCD => '#x062D',   # ARABIC LETTER HAH
    0xCE => '#x062E',   # ARABIC LETTER KHAH
    0xCF => '#x062F',   # ARABIC LETTER DAL
    0xD0 => '#x0630',   # ARABIC LETTER THAL
    0xD1 => '#x0631',   # ARABIC LETTER REH
    0xD2 => '#x0632',   # ARABIC LETTER ZAIN
    0xD3 => '#x0633',   # ARABIC LETTER SEEN
    0xD4 => '#x0634',   # ARABIC LETTER SHEEN
    0xD5 => '#x0635',   # ARABIC LETTER SAD
    0xD6 => '#x0636',   # ARABIC LETTER DAD
    0xD7 => '#x0637',   # ARABIC LETTER TAH
    0xD8 => '#x0638',   # ARABIC LETTER ZAH
    0xD9 => '#x0639',   # ARABIC LETTER AIN
    0xDA => '#x063A',   # ARABIC LETTER GHAIN
    0xDB => '#x005B',   # LEFT SQUARE BRACKET, right-left
    0xDC => '#x005C',   # REVERSE SOLIDUS, right-left
    0xDD => '#x005D',   # RIGHT SQUARE BRACKET, right-left
    0xDE => '#x005E',   # CIRCUMFLEX ACCENT, right-left
    0xDF => '#x005F',   # LOW LINE, right-left
    0xE0 => '#x0640',   # ARABIC TATWEEL
    0xE1 => '#x0641',   # ARABIC LETTER FEH
    0xE2 => '#x0642',   # ARABIC LETTER QAF
    0xE3 => '#x0643',   # ARABIC LETTER KAF
    0xE4 => '#x0644',   # ARABIC LETTER LAM
    0xE5 => '#x0645',   # ARABIC LETTER MEEM
    0xE6 => '#x0646',   # ARABIC LETTER NOON
    0xE7 => '#x0647',   # ARABIC LETTER HEH
    0xE8 => '#x0648',   # ARABIC LETTER WAW
    0xE9 => '#x0649',   # ARABIC LETTER ALEF MAKSURA
    0xEA => '#x064A',   # ARABIC LETTER YEH
    0xEB => '#x064B',   # ARABIC FATHATAN
    0xEC => '#x064C',   # ARABIC DAMMATAN
    0xED => '#x064D',   # ARABIC KASRATAN
    0xEE => '#x064E',   # ARABIC FATHA
    0xEF => '#x064F',   # ARABIC DAMMA
    0xF0 => '#x0650',   # ARABIC KASRA
    0xF1 => '#x0651',   # ARABIC SHADDA
    0xF2 => '#x0652',   # ARABIC SUKUN
    0xF3 => '#x067E',   # ARABIC LETTER PEH
    0xF4 => '#x0679',   # ARABIC LETTER TTEH
    0xF5 => '#x0686',   # ARABIC LETTER TCHEH
    0xF6 => '#x06D5',   # ARABIC LETTER AE
    0xF7 => '#x06A4',   # ARABIC LETTER VEH
    0xF8 => '#x06AF',   # ARABIC LETTER GAF
    0xF9 => '#x0688',   # ARABIC LETTER DDAL
    0xFA => '#x0691',   # ARABIC LETTER RREH
    0xFB => '#x007B',   # LEFT CURLY BRACKET, right-left
    0xFC => '#x007C',   # VERTICAL LINE, right-left
    0xFD => '#x007D',   # RIGHT CURLY BRACKET, right-left
    0xFE => '#x0698',   # ARABIC LETTER JEH
    0xFF => '#x06D2',   # ARABIC LETTER YEH BARREE
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleCenteuro;
# Apple Central European
#
# Lookup table for the upper half (0x80-0xFF) of the Apple Central
# European character set.  Keys are character codes written in hex;
# values are the bodies of Unicode numeric character references
# ("#xHHHH").  Codes below 0x80 have no entry in this table.
#
# The leading "+" forces Perl to read "{" as an anonymous hash
# constructor rather than a block; the hash reference is the value of
# the final statement of this file.
+{
#--------------------------------------------------------------------------
# Code     Entity ref   # Unicode character name
#--------------------------------------------------------------------------
    0x80 => '#x00C4',   # LATIN CAPITAL LETTER A WITH DIAERESIS
    0x81 => '#x0100',   # LATIN CAPITAL LETTER A WITH MACRON
    0x82 => '#x0101',   # LATIN SMALL LETTER A WITH MACRON
    0x83 => '#x00C9',   # LATIN CAPITAL LETTER E WITH ACUTE
    0x84 => '#x0104',   # LATIN CAPITAL LETTER A WITH OGONEK
    0x85 => '#x00D6',   # LATIN CAPITAL LETTER O WITH DIAERESIS
    0x86 => '#x00DC',   # LATIN CAPITAL LETTER U WITH DIAERESIS
    0x87 => '#x00E1',   # LATIN SMALL LETTER A WITH ACUTE
    0x88 => '#x0105',   # LATIN SMALL LETTER A WITH OGONEK
    0x89 => '#x010C',   # LATIN CAPITAL LETTER C WITH CARON
    0x8A => '#x00E4',   # LATIN SMALL LETTER A WITH DIAERESIS
    0x8B => '#x010D',   # LATIN SMALL LETTER C WITH CARON
    0x8C => '#x0106',   # LATIN CAPITAL LETTER C WITH ACUTE
    0x8D => '#x0107',   # LATIN SMALL LETTER C WITH ACUTE
    0x8E => '#x00E9',   # LATIN SMALL LETTER E WITH ACUTE
    0x8F => '#x0179',   # LATIN CAPITAL LETTER Z WITH ACUTE
    0x90 => '#x017A',   # LATIN SMALL LETTER Z WITH ACUTE
    0x91 => '#x010E',   # LATIN CAPITAL LETTER D WITH CARON
    0x92 => '#x00ED',   # LATIN SMALL LETTER I WITH ACUTE
    0x93 => '#x010F',   # LATIN SMALL LETTER D WITH CARON
    0x94 => '#x0112',   # LATIN CAPITAL LETTER E WITH MACRON
    0x95 => '#x0113',   # LATIN SMALL LETTER E WITH MACRON
    0x96 => '#x0116',   # LATIN CAPITAL LETTER E WITH DOT ABOVE
    0x97 => '#x00F3',   # LATIN SMALL LETTER O WITH ACUTE
    0x98 => '#x0117',   # LATIN SMALL LETTER E WITH DOT ABOVE
    0x99 => '#x00F4',   # LATIN SMALL LETTER O WITH CIRCUMFLEX
    0x9A => '#x00F6',   # LATIN SMALL LETTER O WITH DIAERESIS
    0x9B => '#x00F5',   # LATIN SMALL LETTER O WITH TILDE
    0x9C => '#x00FA',   # LATIN SMALL LETTER U WITH ACUTE
    0x9D => '#x011A',   # LATIN CAPITAL LETTER E WITH CARON
    0x9E => '#x011B',   # LATIN SMALL LETTER E WITH CARON
    0x9F => '#x00FC',   # LATIN SMALL LETTER U WITH DIAERESIS
    0xA0 => '#x2020',   # DAGGER
    0xA1 => '#x00B0',   # DEGREE SIGN
    0xA2 => '#x0118',   # LATIN CAPITAL LETTER E WITH OGONEK
    0xA3 => '#x00A3',   # POUND SIGN
    0xA4 => '#x00A7',   # SECTION SIGN
    0xA5 => '#x2022',   # BULLET
    0xA6 => '#x00B6',   # PILCROW SIGN
    0xA7 => '#x00DF',   # LATIN SMALL LETTER SHARP S
    0xA8 => '#x00AE',   # REGISTERED SIGN
    0xA9 => '#x00A9',   # COPYRIGHT SIGN
    0xAA => '#x2122',   # TRADE MARK SIGN
    0xAB => '#x0119',   # LATIN SMALL LETTER E WITH OGONEK
    0xAC => '#x00A8',   # DIAERESIS
    0xAD => '#x2260',   # NOT EQUAL TO
    0xAE => '#x0123',   # LATIN SMALL LETTER G WITH CEDILLA
    0xAF => '#x012E',   # LATIN CAPITAL LETTER I WITH OGONEK
    0xB0 => '#x012F',   # LATIN SMALL LETTER I WITH OGONEK
    0xB1 => '#x012A',   # LATIN CAPITAL LETTER I WITH MACRON
    0xB2 => '#x2264',   # LESS-THAN OR EQUAL TO
    0xB3 => '#x2265',   # GREATER-THAN OR EQUAL TO
    0xB4 => '#x012B',   # LATIN SMALL LETTER I WITH MACRON
    0xB5 => '#x0136',   # LATIN CAPITAL LETTER K WITH CEDILLA
    0xB6 => '#x2202',   # PARTIAL DIFFERENTIAL
    0xB7 => '#x2211',   # N-ARY SUMMATION
    0xB8 => '#x0142',   # LATIN SMALL LETTER L WITH STROKE
    0xB9 => '#x013B',   # LATIN CAPITAL LETTER L WITH CEDILLA
    0xBA => '#x013C',   # LATIN SMALL LETTER L WITH CEDILLA
    0xBB => '#x013D',   # LATIN CAPITAL LETTER L WITH CARON
    0xBC => '#x013E',   # LATIN SMALL LETTER L WITH CARON
    0xBD => '#x0139',   # LATIN CAPITAL LETTER L WITH ACUTE
    0xBE => '#x013A',   # LATIN SMALL LETTER L WITH ACUTE
    0xBF => '#x0145',   # LATIN CAPITAL LETTER N WITH CEDILLA
    0xC0 => '#x0146',   # LATIN SMALL LETTER N WITH CEDILLA
    0xC1 => '#x0143',   # LATIN CAPITAL LETTER N WITH ACUTE
    0xC2 => '#x00AC',   # NOT SIGN
    0xC3 => '#x221A',   # SQUARE ROOT
    0xC4 => '#x0144',   # LATIN SMALL LETTER N WITH ACUTE
    0xC5 => '#x0147',   # LATIN CAPITAL LETTER N WITH CARON
    0xC6 => '#x2206',   # INCREMENT
    0xC7 => '#x00AB',   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC8 => '#x00BB',   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC9 => '#x2026',   # HORIZONTAL ELLIPSIS
    0xCA => '#x00A0',   # NO-BREAK SPACE
    0xCB => '#x0148',   # LATIN SMALL LETTER N WITH CARON
    0xCC => '#x0150',   # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
    0xCD => '#x00D5',   # LATIN CAPITAL LETTER O WITH TILDE
    0xCE => '#x0151',   # LATIN SMALL LETTER O WITH DOUBLE ACUTE
    0xCF => '#x014C',   # LATIN CAPITAL LETTER O WITH MACRON
    0xD0 => '#x2013',   # EN DASH
    0xD1 => '#x2014',   # EM DASH
    0xD2 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
    0xD3 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
    0xD4 => '#x2018',   # LEFT SINGLE QUOTATION MARK
    0xD5 => '#x2019',   # RIGHT SINGLE QUOTATION MARK
    0xD6 => '#x00F7',   # DIVISION SIGN
    0xD7 => '#x25CA',   # LOZENGE
    0xD8 => '#x014D',   # LATIN SMALL LETTER O WITH MACRON
    0xD9 => '#x0154',   # LATIN CAPITAL LETTER R WITH ACUTE
    0xDA => '#x0155',   # LATIN SMALL LETTER R WITH ACUTE
    0xDB => '#x0158',   # LATIN CAPITAL LETTER R WITH CARON
    0xDC => '#x2039',   # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    0xDD => '#x203A',   # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
    0xDE => '#x0159',   # LATIN SMALL LETTER R WITH CARON
    0xDF => '#x0156',   # LATIN CAPITAL LETTER R WITH CEDILLA
    0xE0 => '#x0157',   # LATIN SMALL LETTER R WITH CEDILLA
    0xE1 => '#x0160',   # LATIN CAPITAL LETTER S WITH CARON
    0xE2 => '#x201A',   # SINGLE LOW-9 QUOTATION MARK
    0xE3 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
    0xE4 => '#x0161',   # LATIN SMALL LETTER S WITH CARON
    0xE5 => '#x015A',   # LATIN CAPITAL LETTER S WITH ACUTE
    0xE6 => '#x015B',   # LATIN SMALL LETTER S WITH ACUTE
    0xE7 => '#x00C1',   # LATIN CAPITAL LETTER A WITH ACUTE
    0xE8 => '#x0164',   # LATIN CAPITAL LETTER T WITH CARON
    0xE9 => '#x0165',   # LATIN SMALL LETTER T WITH CARON
    0xEA => '#x00CD',   # LATIN CAPITAL LETTER I WITH ACUTE
    0xEB => '#x017D',   # LATIN CAPITAL LETTER Z WITH CARON
    0xEC => '#x017E',   # LATIN SMALL LETTER Z WITH CARON
    0xED => '#x016A',   # LATIN CAPITAL LETTER U WITH MACRON
    0xEE => '#x00D3',   # LATIN CAPITAL LETTER O WITH ACUTE
    0xEF => '#x00D4',   # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
    0xF0 => '#x016B',   # LATIN SMALL LETTER U WITH MACRON
    0xF1 => '#x016E',   # LATIN CAPITAL LETTER U WITH RING ABOVE
    0xF2 => '#x00DA',   # LATIN CAPITAL LETTER U WITH ACUTE
    0xF3 => '#x016F',   # LATIN SMALL LETTER U WITH RING ABOVE
    0xF4 => '#x0170',   # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
    0xF5 => '#x0171',   # LATIN SMALL LETTER U WITH DOUBLE ACUTE
    0xF6 => '#x0172',   # LATIN CAPITAL LETTER U WITH OGONEK
    0xF7 => '#x0173',   # LATIN SMALL LETTER U WITH OGONEK
    0xF8 => '#x00DD',   # LATIN CAPITAL LETTER Y WITH ACUTE
    0xF9 => '#x00FD',   # LATIN SMALL LETTER Y WITH ACUTE
    0xFA => '#x0137',   # LATIN SMALL LETTER K WITH CEDILLA
    0xFB => '#x017B',   # LATIN CAPITAL LETTER Z WITH DOT ABOVE
    0xFC => '#x0141',   # LATIN CAPITAL LETTER L WITH STROKE
    0xFD => '#x017C',   # LATIN SMALL LETTER Z WITH DOT ABOVE
    0xFE => '#x0122',   # LATIN CAPITAL LETTER G WITH CEDILLA
    0xFF => '#x02C7',   # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleCroatian;
# Apple Croatian
#
# Lookup table for the upper half (0x80-0xFF) of the Apple Croatian
# character set.  Keys are character codes written in hex; values are
# the bodies of Unicode numeric character references ("#xHHHH").
# Codes below 0x80 have no entry in this table.
#
# The leading "+" forces Perl to read "{" as an anonymous hash
# constructor rather than a block; the hash reference is the value of
# the final statement of this file.
+{
#--------------------------------------------------------------------------
# Code     Entity ref   # Unicode character name
#--------------------------------------------------------------------------
    0x80 => '#x00C4',   # LATIN CAPITAL LETTER A WITH DIAERESIS
    0x81 => '#x00C5',   # LATIN CAPITAL LETTER A WITH RING ABOVE
    0x82 => '#x00C7',   # LATIN CAPITAL LETTER C WITH CEDILLA
    0x83 => '#x00C9',   # LATIN CAPITAL LETTER E WITH ACUTE
    0x84 => '#x00D1',   # LATIN CAPITAL LETTER N WITH TILDE
    0x85 => '#x00D6',   # LATIN CAPITAL LETTER O WITH DIAERESIS
    0x86 => '#x00DC',   # LATIN CAPITAL LETTER U WITH DIAERESIS
    0x87 => '#x00E1',   # LATIN SMALL LETTER A WITH ACUTE
    0x88 => '#x00E0',   # LATIN SMALL LETTER A WITH GRAVE
    0x89 => '#x00E2',   # LATIN SMALL LETTER A WITH CIRCUMFLEX
    0x8A => '#x00E4',   # LATIN SMALL LETTER A WITH DIAERESIS
    0x8B => '#x00E3',   # LATIN SMALL LETTER A WITH TILDE
    0x8C => '#x00E5',   # LATIN SMALL LETTER A WITH RING ABOVE
    0x8D => '#x00E7',   # LATIN SMALL LETTER C WITH CEDILLA
    0x8E => '#x00E9',   # LATIN SMALL LETTER E WITH ACUTE
    0x8F => '#x00E8',   # LATIN SMALL LETTER E WITH GRAVE
    0x90 => '#x00EA',   # LATIN SMALL LETTER E WITH CIRCUMFLEX
    0x91 => '#x00EB',   # LATIN SMALL LETTER E WITH DIAERESIS
    0x92 => '#x00ED',   # LATIN SMALL LETTER I WITH ACUTE
    0x93 => '#x00EC',   # LATIN SMALL LETTER I WITH GRAVE
    0x94 => '#x00EE',   # LATIN SMALL LETTER I WITH CIRCUMFLEX
    0x95 => '#x00EF',   # LATIN SMALL LETTER I WITH DIAERESIS
    0x96 => '#x00F1',   # LATIN SMALL LETTER N WITH TILDE
    0x97 => '#x00F3',   # LATIN SMALL LETTER O WITH ACUTE
    0x98 => '#x00F2',   # LATIN SMALL LETTER O WITH GRAVE
    0x99 => '#x00F4',   # LATIN SMALL LETTER O WITH CIRCUMFLEX
    0x9A => '#x00F6',   # LATIN SMALL LETTER O WITH DIAERESIS
    0x9B => '#x00F5',   # LATIN SMALL LETTER O WITH TILDE
    0x9C => '#x00FA',   # LATIN SMALL LETTER U WITH ACUTE
    0x9D => '#x00F9',   # LATIN SMALL LETTER U WITH GRAVE
    0x9E => '#x00FB',   # LATIN SMALL LETTER U WITH CIRCUMFLEX
    0x9F => '#x00FC',   # LATIN SMALL LETTER U WITH DIAERESIS
    0xA0 => '#x2020',   # DAGGER
    0xA1 => '#x00B0',   # DEGREE SIGN
    0xA2 => '#x00A2',   # CENT SIGN
    0xA3 => '#x00A3',   # POUND SIGN
    0xA4 => '#x00A7',   # SECTION SIGN
    0xA5 => '#x2022',   # BULLET
    0xA6 => '#x00B6',   # PILCROW SIGN
    0xA7 => '#x00DF',   # LATIN SMALL LETTER SHARP S
    0xA8 => '#x00AE',   # REGISTERED SIGN
    0xA9 => '#x0160',   # LATIN CAPITAL LETTER S WITH CARON
    0xAA => '#x2122',   # TRADE MARK SIGN
    0xAB => '#x00B4',   # ACUTE ACCENT
    0xAC => '#x00A8',   # DIAERESIS
    0xAD => '#x2260',   # NOT EQUAL TO
    0xAE => '#x017D',   # LATIN CAPITAL LETTER Z WITH CARON
    0xAF => '#x00D8',   # LATIN CAPITAL LETTER O WITH STROKE
    0xB0 => '#x221E',   # INFINITY
    0xB1 => '#x00B1',   # PLUS-MINUS SIGN
    0xB2 => '#x2264',   # LESS-THAN OR EQUAL TO
    0xB3 => '#x2265',   # GREATER-THAN OR EQUAL TO
    0xB4 => '#x2206',   # INCREMENT
    0xB5 => '#x00B5',   # MICRO SIGN
    0xB6 => '#x2202',   # PARTIAL DIFFERENTIAL
    0xB7 => '#x2211',   # N-ARY SUMMATION
    0xB8 => '#x220F',   # N-ARY PRODUCT
    0xB9 => '#x0161',   # LATIN SMALL LETTER S WITH CARON
    0xBA => '#x222B',   # INTEGRAL
    0xBB => '#x00AA',   # FEMININE ORDINAL INDICATOR
    0xBC => '#x00BA',   # MASCULINE ORDINAL INDICATOR
    0xBD => '#x03A9',   # GREEK CAPITAL LETTER OMEGA
    0xBE => '#x017E',   # LATIN SMALL LETTER Z WITH CARON
    0xBF => '#x00F8',   # LATIN SMALL LETTER O WITH STROKE
    0xC0 => '#x00BF',   # INVERTED QUESTION MARK
    0xC1 => '#x00A1',   # INVERTED EXCLAMATION MARK
    0xC2 => '#x00AC',   # NOT SIGN
    0xC3 => '#x221A',   # SQUARE ROOT
    0xC4 => '#x0192',   # LATIN SMALL LETTER F WITH HOOK
    0xC5 => '#x2248',   # ALMOST EQUAL TO
    0xC6 => '#x0106',   # LATIN CAPITAL LETTER C WITH ACUTE
    0xC7 => '#x00AB',   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC8 => '#x010C',   # LATIN CAPITAL LETTER C WITH CARON
    0xC9 => '#x2026',   # HORIZONTAL ELLIPSIS
    0xCA => '#x00A0',   # NO-BREAK SPACE
    0xCB => '#x00C0',   # LATIN CAPITAL LETTER A WITH GRAVE
    0xCC => '#x00C3',   # LATIN CAPITAL LETTER A WITH TILDE
    0xCD => '#x00D5',   # LATIN CAPITAL LETTER O WITH TILDE
    0xCE => '#x0152',   # LATIN CAPITAL LIGATURE OE
    0xCF => '#x0153',   # LATIN SMALL LIGATURE OE
    0xD0 => '#x0110',   # LATIN CAPITAL LETTER D WITH STROKE
    0xD1 => '#x2014',   # EM DASH
    0xD2 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
    0xD3 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
    0xD4 => '#x2018',   # LEFT SINGLE QUOTATION MARK
    0xD5 => '#x2019',   # RIGHT SINGLE QUOTATION MARK
    0xD6 => '#x00F7',   # DIVISION SIGN
    0xD7 => '#x25CA',   # LOZENGE
    0xD8 => '#xF8FF',   # Apple logo (U+F8FF is a Private Use Area code point)
    0xD9 => '#x00A9',   # COPYRIGHT SIGN
    0xDA => '#x2044',   # FRACTION SLASH
    0xDB => '#x20AC',   # EURO SIGN
    0xDC => '#x2039',   # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    0xDD => '#x203A',   # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
    0xDE => '#x00C6',   # LATIN CAPITAL LETTER AE
    0xDF => '#x00BB',   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xE0 => '#x2013',   # EN DASH
    0xE1 => '#x00B7',   # MIDDLE DOT
    0xE2 => '#x201A',   # SINGLE LOW-9 QUOTATION MARK
    0xE3 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
    0xE4 => '#x2030',   # PER MILLE SIGN
    0xE5 => '#x00C2',   # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
    0xE6 => '#x0107',   # LATIN SMALL LETTER C WITH ACUTE
    0xE7 => '#x00C1',   # LATIN CAPITAL LETTER A WITH ACUTE
    0xE8 => '#x010D',   # LATIN SMALL LETTER C WITH CARON
    0xE9 => '#x00C8',   # LATIN CAPITAL LETTER E WITH GRAVE
    0xEA => '#x00CD',   # LATIN CAPITAL LETTER I WITH ACUTE
    0xEB => '#x00CE',   # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
    0xEC => '#x00CF',   # LATIN CAPITAL LETTER I WITH DIAERESIS
    0xED => '#x00CC',   # LATIN CAPITAL LETTER I WITH GRAVE
    0xEE => '#x00D3',   # LATIN CAPITAL LETTER O WITH ACUTE
    0xEF => '#x00D4',   # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
    0xF0 => '#x0111',   # LATIN SMALL LETTER D WITH STROKE
    0xF1 => '#x00D2',   # LATIN CAPITAL LETTER O WITH GRAVE
    0xF2 => '#x00DA',   # LATIN CAPITAL LETTER U WITH ACUTE
    0xF3 => '#x00DB',   # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
    0xF4 => '#x00D9',   # LATIN CAPITAL LETTER U WITH GRAVE
    0xF5 => '#x0131',   # LATIN SMALL LETTER DOTLESS I
    0xF6 => '#x02C6',   # MODIFIER LETTER CIRCUMFLEX ACCENT
    0xF7 => '#x02DC',   # SMALL TILDE
    0xF8 => '#x00AF',   # MACRON
    0xF9 => '#x03C0',   # GREEK SMALL LETTER PI
    0xFA => '#x00CB',   # LATIN CAPITAL LETTER E WITH DIAERESIS
    0xFB => '#x02DA',   # RING ABOVE
    0xFC => '#x00B8',   # CEDILLA
    0xFD => '#x00CA',   # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
    0xFE => '#x00E6',   # LATIN SMALL LETTER AE
    0xFF => '#x02C7',   # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleCyrillic;
# Apple Cyrillic
#
# Lookup table for the upper half (0x80-0xFF) of the Apple Cyrillic
# character set.  Keys are character codes written in hex; values are
# the bodies of Unicode numeric character references ("#xHHHH").
# Codes below 0x80 have no entry in this table.
#
# The leading "+" forces Perl to read "{" as an anonymous hash
# constructor rather than a block; the hash reference is the value of
# the final statement of this file.
#
# Every per-entry comment must stay on a single line: a wrapped
# continuation would fall outside the comment and break the hash.
+{
#--------------------------------------------------------------------------
# Code     Entity ref   # Unicode character name
#--------------------------------------------------------------------------
    0x80 => '#x0410',   # CYRILLIC CAPITAL LETTER A
    0x81 => '#x0411',   # CYRILLIC CAPITAL LETTER BE
    0x82 => '#x0412',   # CYRILLIC CAPITAL LETTER VE
    0x83 => '#x0413',   # CYRILLIC CAPITAL LETTER GHE
    0x84 => '#x0414',   # CYRILLIC CAPITAL LETTER DE
    0x85 => '#x0415',   # CYRILLIC CAPITAL LETTER IE
    0x86 => '#x0416',   # CYRILLIC CAPITAL LETTER ZHE
    0x87 => '#x0417',   # CYRILLIC CAPITAL LETTER ZE
    0x88 => '#x0418',   # CYRILLIC CAPITAL LETTER I
    0x89 => '#x0419',   # CYRILLIC CAPITAL LETTER SHORT I
    0x8A => '#x041A',   # CYRILLIC CAPITAL LETTER KA
    0x8B => '#x041B',   # CYRILLIC CAPITAL LETTER EL
    0x8C => '#x041C',   # CYRILLIC CAPITAL LETTER EM
    0x8D => '#x041D',   # CYRILLIC CAPITAL LETTER EN
    0x8E => '#x041E',   # CYRILLIC CAPITAL LETTER O
    0x8F => '#x041F',   # CYRILLIC CAPITAL LETTER PE
    0x90 => '#x0420',   # CYRILLIC CAPITAL LETTER ER
    0x91 => '#x0421',   # CYRILLIC CAPITAL LETTER ES
    0x92 => '#x0422',   # CYRILLIC CAPITAL LETTER TE
    0x93 => '#x0423',   # CYRILLIC CAPITAL LETTER U
    0x94 => '#x0424',   # CYRILLIC CAPITAL LETTER EF
    0x95 => '#x0425',   # CYRILLIC CAPITAL LETTER HA
    0x96 => '#x0426',   # CYRILLIC CAPITAL LETTER TSE
    0x97 => '#x0427',   # CYRILLIC CAPITAL LETTER CHE
    0x98 => '#x0428',   # CYRILLIC CAPITAL LETTER SHA
    0x99 => '#x0429',   # CYRILLIC CAPITAL LETTER SHCHA
    0x9A => '#x042A',   # CYRILLIC CAPITAL LETTER HARD SIGN
    0x9B => '#x042B',   # CYRILLIC CAPITAL LETTER YERU
    0x9C => '#x042C',   # CYRILLIC CAPITAL LETTER SOFT SIGN
    0x9D => '#x042D',   # CYRILLIC CAPITAL LETTER E
    0x9E => '#x042E',   # CYRILLIC CAPITAL LETTER YU
    0x9F => '#x042F',   # CYRILLIC CAPITAL LETTER YA
    0xA0 => '#x2020',   # DAGGER
    0xA1 => '#x00B0',   # DEGREE SIGN
    0xA2 => '#x0490',   # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
    0xA3 => '#x00A3',   # POUND SIGN
    0xA4 => '#x00A7',   # SECTION SIGN
    0xA5 => '#x2022',   # BULLET
    0xA6 => '#x00B6',   # PILCROW SIGN
    0xA7 => '#x0406',   # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
    0xA8 => '#x00AE',   # REGISTERED SIGN
    0xA9 => '#x00A9',   # COPYRIGHT SIGN
    0xAA => '#x2122',   # TRADE MARK SIGN
    0xAB => '#x0402',   # CYRILLIC CAPITAL LETTER DJE
    0xAC => '#x0452',   # CYRILLIC SMALL LETTER DJE
    0xAD => '#x2260',   # NOT EQUAL TO
    0xAE => '#x0403',   # CYRILLIC CAPITAL LETTER GJE
    0xAF => '#x0453',   # CYRILLIC SMALL LETTER GJE
    0xB0 => '#x221E',   # INFINITY
    0xB1 => '#x00B1',   # PLUS-MINUS SIGN
    0xB2 => '#x2264',   # LESS-THAN OR EQUAL TO
    0xB3 => '#x2265',   # GREATER-THAN OR EQUAL TO
    0xB4 => '#x0456',   # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
    0xB5 => '#x00B5',   # MICRO SIGN
    0xB6 => '#x0491',   # CYRILLIC SMALL LETTER GHE WITH UPTURN
    0xB7 => '#x0408',   # CYRILLIC CAPITAL LETTER JE
    0xB8 => '#x0404',   # CYRILLIC CAPITAL LETTER UKRAINIAN IE
    0xB9 => '#x0454',   # CYRILLIC SMALL LETTER UKRAINIAN IE
    0xBA => '#x0407',   # CYRILLIC CAPITAL LETTER YI
    0xBB => '#x0457',   # CYRILLIC SMALL LETTER YI
    0xBC => '#x0409',   # CYRILLIC CAPITAL LETTER LJE
    0xBD => '#x0459',   # CYRILLIC SMALL LETTER LJE
    0xBE => '#x040A',   # CYRILLIC CAPITAL LETTER NJE
    0xBF => '#x045A',   # CYRILLIC SMALL LETTER NJE
    0xC0 => '#x0458',   # CYRILLIC SMALL LETTER JE
    0xC1 => '#x0405',   # CYRILLIC CAPITAL LETTER DZE
    0xC2 => '#x00AC',   # NOT SIGN
    0xC3 => '#x221A',   # SQUARE ROOT
    0xC4 => '#x0192',   # LATIN SMALL LETTER F WITH HOOK
    0xC5 => '#x2248',   # ALMOST EQUAL TO
    0xC6 => '#x2206',   # INCREMENT
    0xC7 => '#x00AB',   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC8 => '#x00BB',   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC9 => '#x2026',   # HORIZONTAL ELLIPSIS
    0xCA => '#x00A0',   # NO-BREAK SPACE
    0xCB => '#x040B',   # CYRILLIC CAPITAL LETTER TSHE
    0xCC => '#x045B',   # CYRILLIC SMALL LETTER TSHE
    0xCD => '#x040C',   # CYRILLIC CAPITAL LETTER KJE
    0xCE => '#x045C',   # CYRILLIC SMALL LETTER KJE
    0xCF => '#x0455',   # CYRILLIC SMALL LETTER DZE
    0xD0 => '#x2013',   # EN DASH
    0xD1 => '#x2014',   # EM DASH
    0xD2 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
    0xD3 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
    0xD4 => '#x2018',   # LEFT SINGLE QUOTATION MARK
    0xD5 => '#x2019',   # RIGHT SINGLE QUOTATION MARK
    0xD6 => '#x00F7',   # DIVISION SIGN
    0xD7 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
    0xD8 => '#x040E',   # CYRILLIC CAPITAL LETTER SHORT U
    0xD9 => '#x045E',   # CYRILLIC SMALL LETTER SHORT U
    0xDA => '#x040F',   # CYRILLIC CAPITAL LETTER DZHE
    0xDB => '#x045F',   # CYRILLIC SMALL LETTER DZHE
    0xDC => '#x2116',   # NUMERO SIGN
    0xDD => '#x0401',   # CYRILLIC CAPITAL LETTER IO
    0xDE => '#x0451',   # CYRILLIC SMALL LETTER IO
    0xDF => '#x044F',   # CYRILLIC SMALL LETTER YA
    0xE0 => '#x0430',   # CYRILLIC SMALL LETTER A
    0xE1 => '#x0431',   # CYRILLIC SMALL LETTER BE
    0xE2 => '#x0432',   # CYRILLIC SMALL LETTER VE
    0xE3 => '#x0433',   # CYRILLIC SMALL LETTER GHE
    0xE4 => '#x0434',   # CYRILLIC SMALL LETTER DE
    0xE5 => '#x0435',   # CYRILLIC SMALL LETTER IE
    0xE6 => '#x0436',   # CYRILLIC SMALL LETTER ZHE
    0xE7 => '#x0437',   # CYRILLIC SMALL LETTER ZE
    0xE8 => '#x0438',   # CYRILLIC SMALL LETTER I
    0xE9 => '#x0439',   # CYRILLIC SMALL LETTER SHORT I
    0xEA => '#x043A',   # CYRILLIC SMALL LETTER KA
    0xEB => '#x043B',   # CYRILLIC SMALL LETTER EL
    0xEC => '#x043C',   # CYRILLIC SMALL LETTER EM
    0xED => '#x043D',   # CYRILLIC SMALL LETTER EN
    0xEE => '#x043E',   # CYRILLIC SMALL LETTER O
    0xEF => '#x043F',   # CYRILLIC SMALL LETTER PE
    0xF0 => '#x0440',   # CYRILLIC SMALL LETTER ER
    0xF1 => '#x0441',   # CYRILLIC SMALL LETTER ES
    0xF2 => '#x0442',   # CYRILLIC SMALL LETTER TE
    0xF3 => '#x0443',   # CYRILLIC SMALL LETTER U
    0xF4 => '#x0444',   # CYRILLIC SMALL LETTER EF
    0xF5 => '#x0445',   # CYRILLIC SMALL LETTER HA
    0xF6 => '#x0446',   # CYRILLIC SMALL LETTER TSE
    0xF7 => '#x0447',   # CYRILLIC SMALL LETTER CHE
    0xF8 => '#x0448',   # CYRILLIC SMALL LETTER SHA
    0xF9 => '#x0449',   # CYRILLIC SMALL LETTER SHCHA
    0xFA => '#x044A',   # CYRILLIC SMALL LETTER HARD SIGN
    0xFB => '#x044B',   # CYRILLIC SMALL LETTER YERU
    0xFC => '#x044C',   # CYRILLIC SMALL LETTER SOFT SIGN
    0xFD => '#x044D',   # CYRILLIC SMALL LETTER E
    0xFE => '#x044E',   # CYRILLIC SMALL LETTER YU
    0xFF => '#x20AC',   # EURO SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleGreek;
# Apple Greek
#
# Lookup table for the upper half (0x80-0xFF) of the Apple Greek
# character set.  Keys are character codes written in hex; values are
# the bodies of Unicode numeric character references ("#xHHHH").
# Codes below 0x80 have no entry in this table.
#
# The leading "+" forces Perl to read "{" as an anonymous hash
# constructor rather than a block; the hash reference is the value of
# the final statement of this file.
#
# Every per-entry comment must stay on a single line: a wrapped
# continuation would fall outside the comment and break the hash.
+{
#--------------------------------------------------------------------------
# Code     Entity ref   # Unicode character name
#--------------------------------------------------------------------------
    0x80 => '#x00C4',   # LATIN CAPITAL LETTER A WITH DIAERESIS
    0x81 => '#x00B9',   # SUPERSCRIPT ONE
    0x82 => '#x00B2',   # SUPERSCRIPT TWO
    0x83 => '#x00C9',   # LATIN CAPITAL LETTER E WITH ACUTE
    0x84 => '#x00B3',   # SUPERSCRIPT THREE
    0x85 => '#x00D6',   # LATIN CAPITAL LETTER O WITH DIAERESIS
    0x86 => '#x00DC',   # LATIN CAPITAL LETTER U WITH DIAERESIS
    0x87 => '#x0385',   # GREEK DIALYTIKA TONOS
    0x88 => '#x00E0',   # LATIN SMALL LETTER A WITH GRAVE
    0x89 => '#x00E2',   # LATIN SMALL LETTER A WITH CIRCUMFLEX
    0x8A => '#x00E4',   # LATIN SMALL LETTER A WITH DIAERESIS
    0x8B => '#x0384',   # GREEK TONOS
    0x8C => '#x00A8',   # DIAERESIS
    0x8D => '#x00E7',   # LATIN SMALL LETTER C WITH CEDILLA
    0x8E => '#x00E9',   # LATIN SMALL LETTER E WITH ACUTE
    0x8F => '#x00E8',   # LATIN SMALL LETTER E WITH GRAVE
    0x90 => '#x00EA',   # LATIN SMALL LETTER E WITH CIRCUMFLEX
    0x91 => '#x00EB',   # LATIN SMALL LETTER E WITH DIAERESIS
    0x92 => '#x00A3',   # POUND SIGN
    0x93 => '#x2122',   # TRADE MARK SIGN
    0x94 => '#x00EE',   # LATIN SMALL LETTER I WITH CIRCUMFLEX
    0x95 => '#x00EF',   # LATIN SMALL LETTER I WITH DIAERESIS
    0x96 => '#x2022',   # BULLET
    0x97 => '#x00BD',   # VULGAR FRACTION ONE HALF
    0x98 => '#x2030',   # PER MILLE SIGN
    0x99 => '#x00F4',   # LATIN SMALL LETTER O WITH CIRCUMFLEX
    0x9A => '#x00F6',   # LATIN SMALL LETTER O WITH DIAERESIS
    0x9B => '#x00A6',   # BROKEN BAR
    0x9C => '#x00AD',   # SOFT HYPHEN
    0x9D => '#x00F9',   # LATIN SMALL LETTER U WITH GRAVE
    0x9E => '#x00FB',   # LATIN SMALL LETTER U WITH CIRCUMFLEX
    0x9F => '#x00FC',   # LATIN SMALL LETTER U WITH DIAERESIS
    0xA0 => '#x2020',   # DAGGER
    0xA1 => '#x0393',   # GREEK CAPITAL LETTER GAMMA
    0xA2 => '#x0394',   # GREEK CAPITAL LETTER DELTA
    0xA3 => '#x0398',   # GREEK CAPITAL LETTER THETA
    0xA4 => '#x039B',   # GREEK CAPITAL LETTER LAMDA
    0xA5 => '#x039E',   # GREEK CAPITAL LETTER XI
    0xA6 => '#x03A0',   # GREEK CAPITAL LETTER PI
    0xA7 => '#x00DF',   # LATIN SMALL LETTER SHARP S
    0xA8 => '#x00AE',   # REGISTERED SIGN
    0xA9 => '#x00A9',   # COPYRIGHT SIGN
    0xAA => '#x03A3',   # GREEK CAPITAL LETTER SIGMA
    0xAB => '#x03AA',   # GREEK CAPITAL LETTER IOTA WITH DIALYTIKA
    0xAC => '#x00A7',   # SECTION SIGN
    0xAD => '#x2260',   # NOT EQUAL TO
    0xAE => '#x00B0',   # DEGREE SIGN
    0xAF => '#x00B7',   # MIDDLE DOT
    0xB0 => '#x0391',   # GREEK CAPITAL LETTER ALPHA
    0xB1 => '#x00B1',   # PLUS-MINUS SIGN
    0xB2 => '#x2264',   # LESS-THAN OR EQUAL TO
    0xB3 => '#x2265',   # GREATER-THAN OR EQUAL TO
    0xB4 => '#x00A5',   # YEN SIGN
    0xB5 => '#x0392',   # GREEK CAPITAL LETTER BETA
    0xB6 => '#x0395',   # GREEK CAPITAL LETTER EPSILON
    0xB7 => '#x0396',   # GREEK CAPITAL LETTER ZETA
    0xB8 => '#x0397',   # GREEK CAPITAL LETTER ETA
    0xB9 => '#x0399',   # GREEK CAPITAL LETTER IOTA
    0xBA => '#x039A',   # GREEK CAPITAL LETTER KAPPA
    0xBB => '#x039C',   # GREEK CAPITAL LETTER MU
    0xBC => '#x03A6',   # GREEK CAPITAL LETTER PHI
    0xBD => '#x03AB',   # GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA
    0xBE => '#x03A8',   # GREEK CAPITAL LETTER PSI
    0xBF => '#x03A9',   # GREEK CAPITAL LETTER OMEGA
    0xC0 => '#x03AC',   # GREEK SMALL LETTER ALPHA WITH TONOS
    0xC1 => '#x039D',   # GREEK CAPITAL LETTER NU
    0xC2 => '#x00AC',   # NOT SIGN
    0xC3 => '#x039F',   # GREEK CAPITAL LETTER OMICRON
    0xC4 => '#x03A1',   # GREEK CAPITAL LETTER RHO
    0xC5 => '#x2248',   # ALMOST EQUAL TO
    0xC6 => '#x03A4',   # GREEK CAPITAL LETTER TAU
    0xC7 => '#x00AB',   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC8 => '#x00BB',   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    0xC9 => '#x2026',   # HORIZONTAL ELLIPSIS
    0xCA => '#x00A0',   # NO-BREAK SPACE
    0xCB => '#x03A5',   # GREEK CAPITAL LETTER UPSILON
    0xCC => '#x03A7',   # GREEK CAPITAL LETTER CHI
    0xCD => '#x0386',   # GREEK CAPITAL LETTER ALPHA WITH TONOS
    0xCE => '#x0388',   # GREEK CAPITAL LETTER EPSILON WITH TONOS
    0xCF => '#x0153',   # LATIN SMALL LIGATURE OE
    0xD0 => '#x2013',   # EN DASH
    0xD1 => '#x2015',   # HORIZONTAL BAR
    0xD2 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
    0xD3 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
    0xD4 => '#x2018',   # LEFT SINGLE QUOTATION MARK
    0xD5 => '#x2019',   # RIGHT SINGLE QUOTATION MARK
    0xD6 => '#x00F7',   # DIVISION SIGN
    0xD7 => '#x0389',   # GREEK CAPITAL LETTER ETA WITH TONOS
    0xD8 => '#x038A',   # GREEK CAPITAL LETTER IOTA WITH TONOS
    0xD9 => '#x038C',   # GREEK CAPITAL LETTER OMICRON WITH TONOS
    0xDA => '#x038E',   # GREEK CAPITAL LETTER UPSILON WITH TONOS
    0xDB => '#x03AD',   # GREEK SMALL LETTER EPSILON WITH TONOS
    0xDC => '#x03AE',   # GREEK SMALL LETTER ETA WITH TONOS
    0xDD => '#x03AF',   # GREEK SMALL LETTER IOTA WITH TONOS
    0xDE => '#x03CC',   # GREEK SMALL LETTER OMICRON WITH TONOS
    0xDF => '#x038F',   # GREEK CAPITAL LETTER OMEGA WITH TONOS
    0xE0 => '#x03CD',   # GREEK SMALL LETTER UPSILON WITH TONOS
    0xE1 => '#x03B1',   # GREEK SMALL LETTER ALPHA
    0xE2 => '#x03B2',   # GREEK SMALL LETTER BETA
    0xE3 => '#x03C8',   # GREEK SMALL LETTER PSI
    0xE4 => '#x03B4',   # GREEK SMALL LETTER DELTA
    0xE5 => '#x03B5',   # GREEK SMALL LETTER EPSILON
    0xE6 => '#x03C6',   # GREEK SMALL LETTER PHI
    0xE7 => '#x03B3',   # GREEK SMALL LETTER GAMMA
    0xE8 => '#x03B7',   # GREEK SMALL LETTER ETA
    0xE9 => '#x03B9',   # GREEK SMALL LETTER IOTA
    0xEA => '#x03BE',   # GREEK SMALL LETTER XI
    0xEB => '#x03BA',   # GREEK SMALL LETTER KAPPA
    0xEC => '#x03BB',   # GREEK SMALL LETTER LAMDA
    0xED => '#x03BC',   # GREEK SMALL LETTER MU
    0xEE => '#x03BD',   # GREEK SMALL LETTER NU
    0xEF => '#x03BF',   # GREEK SMALL LETTER OMICRON
    0xF0 => '#x03C0',   # GREEK SMALL LETTER PI
    0xF1 => '#x03CE',   # GREEK SMALL LETTER OMEGA WITH TONOS
    0xF2 => '#x03C1',   # GREEK SMALL LETTER RHO
    0xF3 => '#x03C3',   # GREEK SMALL LETTER SIGMA
    0xF4 => '#x03C4',   # GREEK SMALL LETTER TAU
    0xF5 => '#x03B8',   # GREEK SMALL LETTER THETA
    0xF6 => '#x03C9',   # GREEK SMALL LETTER OMEGA
    0xF7 => '#x03C2',   # GREEK SMALL LETTER FINAL SIGMA
    0xF8 => '#x03C7',   # GREEK SMALL LETTER CHI
    0xF9 => '#x03C5',   # GREEK SMALL LETTER UPSILON
    0xFA => '#x03B6',   # GREEK SMALL LETTER ZETA
    0xFB => '#x03CA',   # GREEK SMALL LETTER IOTA WITH DIALYTIKA
    0xFC => '#x03CB',   # GREEK SMALL LETTER UPSILON WITH DIALYTIKA
    0xFD => '#x0390',   # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
    0xFE => '#x03B0',   # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
    0xFF => '#xF8A0',   # undefined1 (U+F8A0 is a Private Use Area code point)
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleHebrew;
# Apple Hebrew
#
# Lookup table for the Apple Hebrew character set.  The value of this file
# is an anonymous hash: each key is a byte value and each value is the body
# of a Unicode numeric character reference ('#xHHHH', written without the
# surrounding '&' and ';').  A value given as an array reference lists
# several references for a single byte (see 0xC0 and 0xDE).
# NOTE(review): presumably the consumer emits array entries in order and
# adds the '&'/';' delimiters -- confirm against the code that loads this.
#
# Bytes 0xA0-0xBF (apart from 0xA6, NEW SHEQEL SIGN) map to the same code
# points as the corresponding bytes 0x20-0x3F, and 0xFB-0xFF repeat the
# bracket/vertical-line mappings; the "left-right"/"right-left" direction
# noted in the comments is not encoded in the mapped value.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x20 => '#x0020', # SPACE, left-right
0x21 => '#x0021', # EXCLAMATION MARK, left-right
0x22 => '#x0022', # QUOTATION MARK, left-right
0x23 => '#x0023', # NUMBER SIGN, left-right
0x24 => '#x0024', # DOLLAR SIGN, left-right
0x25 => '#x0025', # PERCENT SIGN, left-right
0x27 => '#x0027', # APOSTROPHE, left-right
0x28 => '#x0028', # LEFT PARENTHESIS, left-right
0x29 => '#x0029', # RIGHT PARENTHESIS, left-right
0x2A => '#x002A', # ASTERISK, left-right
0x2B => '#x002B', # PLUS SIGN, left-right
0x2C => '#x002C', # COMMA, left-right
0x2D => '#x002D', # HYPHEN-MINUS, left-right
0x2E => '#x002E', # FULL STOP, left-right
0x2F => '#x002F', # SOLIDUS, left-right
0x30 => '#x0030', # DIGIT ZERO, left-right
0x31 => '#x0031', # DIGIT ONE, left-right
0x32 => '#x0032', # DIGIT TWO, left-right
0x33 => '#x0033', # DIGIT THREE, left-right
0x34 => '#x0034', # DIGIT FOUR, left-right
0x35 => '#x0035', # DIGIT FIVE, left-right
0x36 => '#x0036', # DIGIT SIX, left-right
0x37 => '#x0037', # DIGIT SEVEN, left-right
0x38 => '#x0038', # DIGIT EIGHT, left-right
0x39 => '#x0039', # DIGIT NINE, left-right
0x3A => '#x003A', # COLON, left-right
0x3B => '#x003B', # SEMICOLON, left-right
0x3C => '#x003C', # LESS-THAN SIGN, left-right
0x3D => '#x003D', # EQUALS SIGN, left-right
0x3E => '#x003E', # GREATER-THAN SIGN, left-right
0x3F => '#x003F', # QUESTION MARK, left-right
0x5B => '#x005B', # LEFT SQUARE BRACKET, left-right
0x5D => '#x005D', # RIGHT SQUARE BRACKET, left-right
0x7B => '#x007B', # LEFT CURLY BRACKET, left-right
0x7C => '#x007C', # VERTICAL LINE, left-right
0x7D => '#x007D', # RIGHT CURLY BRACKET, left-right
0x80 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81 => '#xFB1F', # HEBREW LIGATURE YIDDISH YOD YOD PATAH
0x82 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0x83 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0x84 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0x85 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86 => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0x88 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0x89 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0x8A => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0x8B => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0x8C => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0x8D => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0x8E => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0x8F => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0x90 => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0x91 => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0x92 => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0x93 => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0x94 => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0x95 => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0x96 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0x97 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0x98 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0x99 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0x9B => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0x9C => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0x9D => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0x9E => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0x9F => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xA0 => '#x0020', # SPACE, right-left
0xA1 => '#x0021', # EXCLAMATION MARK, right-left
0xA2 => '#x0022', # QUOTATION MARK, right-left
0xA3 => '#x0023', # NUMBER SIGN, right-left
0xA4 => '#x0024', # DOLLAR SIGN, right-left
0xA5 => '#x0025', # PERCENT SIGN, right-left
0xA6 => '#x20AA', # NEW SHEQEL SIGN
0xA7 => '#x0027', # APOSTROPHE, right-left
0xA8 => '#x0028', # LEFT PARENTHESIS, right-left
0xA9 => '#x0029', # RIGHT PARENTHESIS, right-left
0xAA => '#x002A', # ASTERISK, right-left
0xAB => '#x002B', # PLUS SIGN, right-left
0xAC => '#x002C', # COMMA, right-left
0xAD => '#x002D', # HYPHEN-MINUS, right-left
0xAE => '#x002E', # FULL STOP, right-left
0xAF => '#x002F', # SOLIDUS, right-left
0xB0 => '#x0030', # DIGIT ZERO, right-left
0xB1 => '#x0031', # DIGIT ONE, right-left
0xB2 => '#x0032', # DIGIT TWO, right-left
0xB3 => '#x0033', # DIGIT THREE, right-left
0xB4 => '#x0034', # DIGIT FOUR, right-left
0xB5 => '#x0035', # DIGIT FIVE, right-left
0xB6 => '#x0036', # DIGIT SIX, right-left
0xB7 => '#x0037', # DIGIT SEVEN, right-left
0xB8 => '#x0038', # DIGIT EIGHT, right-left
0xB9 => '#x0039', # DIGIT NINE, right-left
0xBA => '#x003A', # COLON, right-left
0xBB => '#x003B', # SEMICOLON, right-left
0xBC => '#x003C', # LESS-THAN SIGN, right-left
0xBD => '#x003D', # EQUALS SIGN, right-left
0xBE => '#x003E', # GREATER-THAN SIGN, right-left
0xBF => '#x003F', # QUESTION MARK, right-left
0xC0 => ['#xF86A','#x05DC','#x05B9'], # Hebrew ligature lamed holam
0xC1 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK, right-left
0xC2 => '#xF89B', # Hebrew canoral 1
0xC3 => '#xF89C', # Hebrew canoral 2
0xC4 => '#xF89D', # Hebrew canoral 3
0xC5 => '#xF89E', # Hebrew canoral 4
0xC6 => '#x05BC', # HEBREW POINT DAGESH OR MAPIQ
0xC7 => '#xFB4B', # HEBREW LETTER VAV WITH HOLAM
0xC8 => '#xFB35', # HEBREW LETTER VAV WITH DAGESH
0xC9 => '#x2026', # HORIZONTAL ELLIPSIS, right-left
0xCA => '#x00A0', # NO-BREAK SPACE, right-left
0xCB => '#x05B8', # HEBREW POINT QAMATS
0xCC => '#x05B7', # HEBREW POINT PATAH
0xCD => '#x05B5', # HEBREW POINT TSERE
0xCE => '#x05B6', # HEBREW POINT SEGOL
0xCF => '#x05B4', # HEBREW POINT HIRIQ
0xD0 => '#x2013', # EN DASH, right-left
0xD1 => '#x2014', # EM DASH, right-left
0xD2 => '#x201C', # LEFT DOUBLE QUOTATION MARK, right-left
0xD3 => '#x201D', # RIGHT DOUBLE QUOTATION MARK, right-left
0xD4 => '#x2018', # LEFT SINGLE QUOTATION MARK, right-left
0xD5 => '#x2019', # RIGHT SINGLE QUOTATION MARK, right-left
0xD6 => '#xFB2A', # HEBREW LETTER SHIN WITH SHIN DOT
0xD7 => '#xFB2B', # HEBREW LETTER SHIN WITH SIN DOT
0xD8 => '#x05BF', # HEBREW POINT RAFE
0xD9 => '#x05B0', # HEBREW POINT SHEVA
0xDA => '#x05B2', # HEBREW POINT HATAF PATAH
0xDB => '#x05B1', # HEBREW POINT HATAF SEGOL
0xDC => '#x05BB', # HEBREW POINT QUBUTS
0xDD => '#x05B9', # HEBREW POINT HOLAM
0xDE => ['#x05B8','#xF87F'], # HEBREW POINT QAMATS, alternate form "qamats qatan"
0xDF => '#x05B3', # HEBREW POINT HATAF QAMATS
0xE0 => '#x05D0', # HEBREW LETTER ALEF
0xE1 => '#x05D1', # HEBREW LETTER BET
0xE2 => '#x05D2', # HEBREW LETTER GIMEL
0xE3 => '#x05D3', # HEBREW LETTER DALET
0xE4 => '#x05D4', # HEBREW LETTER HE
0xE5 => '#x05D5', # HEBREW LETTER VAV
0xE6 => '#x05D6', # HEBREW LETTER ZAYIN
0xE7 => '#x05D7', # HEBREW LETTER HET
0xE8 => '#x05D8', # HEBREW LETTER TET
0xE9 => '#x05D9', # HEBREW LETTER YOD
0xEA => '#x05DA', # HEBREW LETTER FINAL KAF
0xEB => '#x05DB', # HEBREW LETTER KAF
0xEC => '#x05DC', # HEBREW LETTER LAMED
0xED => '#x05DD', # HEBREW LETTER FINAL MEM
0xEE => '#x05DE', # HEBREW LETTER MEM
0xEF => '#x05DF', # HEBREW LETTER FINAL NUN
0xF0 => '#x05E0', # HEBREW LETTER NUN
0xF1 => '#x05E1', # HEBREW LETTER SAMEKH
0xF2 => '#x05E2', # HEBREW LETTER AYIN
0xF3 => '#x05E3', # HEBREW LETTER FINAL PE
0xF4 => '#x05E4', # HEBREW LETTER PE
0xF5 => '#x05E5', # HEBREW LETTER FINAL TSADI
0xF6 => '#x05E6', # HEBREW LETTER TSADI
0xF7 => '#x05E7', # HEBREW LETTER QOF
0xF8 => '#x05E8', # HEBREW LETTER RESH
0xF9 => '#x05E9', # HEBREW LETTER SHIN
0xFA => '#x05EA', # HEBREW LETTER TAV
0xFB => '#x007D', # RIGHT CURLY BRACKET, right-left
0xFC => '#x005D', # RIGHT SQUARE BRACKET, right-left
0xFD => '#x007B', # LEFT CURLY BRACKET, right-left
0xFE => '#x005B', # LEFT SQUARE BRACKET, right-left
0xFF => '#x007C', # VERTICAL LINE, right-left
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleIceland;
# Apple Icelandic
#
# Lookup table for the Apple Icelandic character set.  The value of this
# file is an anonymous hash: each key is a byte value (only 0x80-0xFF are
# listed) and each value is the body of a Unicode numeric character
# reference ('#xHHHH', written without the surrounding '&' and ';').
# NOTE(review): presumably bytes below 0x80 are treated as plain ASCII by
# the code that loads this table -- confirm against the caller.
#
# The entries at 0xA0 and 0xDC-0xE0 carry the Icelandic letters
# (Y WITH ACUTE, ETH, THORN); they are the only entries that differ from
# the Apple Roman table.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
0x82 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0x83 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0x84 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0x85 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86 => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0x88 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0x89 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0x8A => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0x8B => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0x8C => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0x8D => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0x8E => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0x8F => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0x90 => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0x91 => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0x92 => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0x93 => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0x94 => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0x95 => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0x96 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0x97 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0x98 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0x99 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0x9B => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0x9C => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0x9D => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0x9E => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0x9F => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xA0 => '#x00DD', # LATIN CAPITAL LETTER Y WITH ACUTE
0xA1 => '#x00B0', # DEGREE SIGN
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A7', # SECTION SIGN
0xA5 => '#x2022', # BULLET
0xA6 => '#x00B6', # PILCROW SIGN
0xA7 => '#x00DF', # LATIN SMALL LETTER SHARP S
0xA8 => '#x00AE', # REGISTERED SIGN
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x2122', # TRADE MARK SIGN
0xAB => '#x00B4', # ACUTE ACCENT
0xAC => '#x00A8', # DIAERESIS
0xAD => '#x2260', # NOT EQUAL TO
0xAE => '#x00C6', # LATIN CAPITAL LETTER AE
0xAF => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
0xB0 => '#x221E', # INFINITY
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x2264', # LESS-THAN OR EQUAL TO
0xB3 => '#x2265', # GREATER-THAN OR EQUAL TO
0xB4 => '#x00A5', # YEN SIGN
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x2202', # PARTIAL DIFFERENTIAL
0xB7 => '#x2211', # N-ARY SUMMATION
0xB8 => '#x220F', # N-ARY PRODUCT
0xB9 => '#x03C0', # GREEK SMALL LETTER PI
0xBA => '#x222B', # INTEGRAL
0xBB => '#x00AA', # FEMININE ORDINAL INDICATOR
0xBC => '#x00BA', # MASCULINE ORDINAL INDICATOR
0xBD => '#x03A9', # GREEK CAPITAL LETTER OMEGA
0xBE => '#x00E6', # LATIN SMALL LETTER AE
0xBF => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
0xC0 => '#x00BF', # INVERTED QUESTION MARK
0xC1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xC2 => '#x00AC', # NOT SIGN
0xC3 => '#x221A', # SQUARE ROOT
0xC4 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0xC5 => '#x2248', # ALMOST EQUAL TO
0xC6 => '#x2206', # INCREMENT
0xC7 => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8 => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9 => '#x2026', # HORIZONTAL ELLIPSIS
0xCA => '#x00A0', # NO-BREAK SPACE
0xCB => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xCC => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xCD => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xCE => '#x0152', # LATIN CAPITAL LIGATURE OE
0xCF => '#x0153', # LATIN SMALL LIGATURE OE
0xD0 => '#x2013', # EN DASH
0xD1 => '#x2014', # EM DASH
0xD2 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0xD3 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0xD4 => '#x2018', # LEFT SINGLE QUOTATION MARK
0xD5 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0xD6 => '#x00F7', # DIVISION SIGN
0xD7 => '#x25CA', # LOZENGE
0xD8 => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
0xD9 => '#x0178', # LATIN CAPITAL LETTER Y WITH DIAERESIS
0xDA => '#x2044', # FRACTION SLASH
0xDB => '#x20AC', # EURO SIGN
0xDC => '#x00D0', # LATIN CAPITAL LETTER ETH
0xDD => '#x00F0', # LATIN SMALL LETTER ETH
0xDE => '#x00DE', # LATIN CAPITAL LETTER THORN
0xDF => '#x00FE', # LATIN SMALL LETTER THORN
0xE0 => '#x00FD', # LATIN SMALL LETTER Y WITH ACUTE
0xE1 => '#x00B7', # MIDDLE DOT
0xE2 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0xE3 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0xE4 => '#x2030', # PER MILLE SIGN
0xE5 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xE6 => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xE7 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xE8 => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
0xE9 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xEA => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xEB => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
0xEC => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
0xED => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xEE => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xEF => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0 => '#xF8FF', # Apple logo
0xF1 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xF2 => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xF3 => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
0xF4 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xF5 => '#x0131', # LATIN SMALL LETTER DOTLESS I
0xF6 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0xF7 => '#x02DC', # SMALL TILDE
0xF8 => '#x00AF', # MACRON
0xF9 => '#x02D8', # BREVE
0xFA => '#x02D9', # DOT ABOVE
0xFB => '#x02DA', # RING ABOVE
0xFC => '#x00B8', # CEDILLA
0xFD => '#x02DD', # DOUBLE ACUTE ACCENT
0xFE => '#x02DB', # OGONEK
0xFF => '#x02C7', # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleRoman;
# Apple Roman
#
# Lookup table for the Apple Roman character set.  The value of this file
# is an anonymous hash: each key is a byte value (only 0x80-0xFF are
# listed) and each value is the body of a Unicode numeric character
# reference ('#xHHHH', written without the surrounding '&' and ';').
# NOTE(review): presumably bytes below 0x80 are treated as plain ASCII by
# the code that loads this table -- confirm against the caller.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
0x82 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0x83 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0x84 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0x85 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86 => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0x88 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0x89 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0x8A => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0x8B => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0x8C => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0x8D => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0x8E => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0x8F => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0x90 => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0x91 => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0x92 => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0x93 => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0x94 => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0x95 => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0x96 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0x97 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0x98 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0x99 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0x9B => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0x9C => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0x9D => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0x9E => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0x9F => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xA0 => '#x2020', # DAGGER
0xA1 => '#x00B0', # DEGREE SIGN
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A7', # SECTION SIGN
0xA5 => '#x2022', # BULLET
0xA6 => '#x00B6', # PILCROW SIGN
0xA7 => '#x00DF', # LATIN SMALL LETTER SHARP S
0xA8 => '#x00AE', # REGISTERED SIGN
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x2122', # TRADE MARK SIGN
0xAB => '#x00B4', # ACUTE ACCENT
0xAC => '#x00A8', # DIAERESIS
0xAD => '#x2260', # NOT EQUAL TO
0xAE => '#x00C6', # LATIN CAPITAL LETTER AE
0xAF => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
0xB0 => '#x221E', # INFINITY
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x2264', # LESS-THAN OR EQUAL TO
0xB3 => '#x2265', # GREATER-THAN OR EQUAL TO
0xB4 => '#x00A5', # YEN SIGN
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x2202', # PARTIAL DIFFERENTIAL
0xB7 => '#x2211', # N-ARY SUMMATION
0xB8 => '#x220F', # N-ARY PRODUCT
0xB9 => '#x03C0', # GREEK SMALL LETTER PI
0xBA => '#x222B', # INTEGRAL
0xBB => '#x00AA', # FEMININE ORDINAL INDICATOR
0xBC => '#x00BA', # MASCULINE ORDINAL INDICATOR
0xBD => '#x03A9', # GREEK CAPITAL LETTER OMEGA
0xBE => '#x00E6', # LATIN SMALL LETTER AE
0xBF => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
0xC0 => '#x00BF', # INVERTED QUESTION MARK
0xC1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xC2 => '#x00AC', # NOT SIGN
0xC3 => '#x221A', # SQUARE ROOT
0xC4 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0xC5 => '#x2248', # ALMOST EQUAL TO
0xC6 => '#x2206', # INCREMENT
0xC7 => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8 => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9 => '#x2026', # HORIZONTAL ELLIPSIS
0xCA => '#x00A0', # NO-BREAK SPACE
0xCB => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xCC => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xCD => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xCE => '#x0152', # LATIN CAPITAL LIGATURE OE
0xCF => '#x0153', # LATIN SMALL LIGATURE OE
0xD0 => '#x2013', # EN DASH
0xD1 => '#x2014', # EM DASH
0xD2 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0xD3 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0xD4 => '#x2018', # LEFT SINGLE QUOTATION MARK
0xD5 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0xD6 => '#x00F7', # DIVISION SIGN
0xD7 => '#x25CA', # LOZENGE
0xD8 => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
0xD9 => '#x0178', # LATIN CAPITAL LETTER Y WITH DIAERESIS
0xDA => '#x2044', # FRACTION SLASH
0xDB => '#x20AC', # EURO SIGN
0xDC => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0xDD => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xDE => '#xFB01', # LATIN SMALL LIGATURE FI
0xDF => '#xFB02', # LATIN SMALL LIGATURE FL
0xE0 => '#x2021', # DOUBLE DAGGER
0xE1 => '#x00B7', # MIDDLE DOT
0xE2 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0xE3 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0xE4 => '#x2030', # PER MILLE SIGN
0xE5 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xE6 => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xE7 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xE8 => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
0xE9 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xEA => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xEB => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
0xEC => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
0xED => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xEE => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xEF => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0 => '#xF8FF', # Apple logo
0xF1 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xF2 => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xF3 => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
0xF4 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xF5 => '#x0131', # LATIN SMALL LETTER DOTLESS I
0xF6 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0xF7 => '#x02DC', # SMALL TILDE
0xF8 => '#x00AF', # MACRON
0xF9 => '#x02D8', # BREVE
0xFA => '#x02D9', # DOT ABOVE
0xFB => '#x02DA', # RING ABOVE
0xFC => '#x00B8', # CEDILLA
0xFD => '#x02DD', # DOUBLE ACUTE ACCENT
0xFE => '#x02DB', # OGONEK
0xFF => '#x02C7', # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleRomanian;
# Apple Romanian
#
# Lookup table for the Apple Romanian character set.  The value of this
# file is an anonymous hash: each key is a byte value (only 0x80-0xFF are
# listed) and each value is the body of a Unicode numeric character
# reference ('#xHHHH', written without the surrounding '&' and ';').
# A value given as an array reference lists a base letter followed by
# COMBINING COMMA BELOW (#x0326) for a single byte (0xAF, 0xBF, 0xDE, 0xDF).
# NOTE(review): presumably the consumer emits array entries in order and
# adds the '&'/';' delimiters -- confirm against the code that loads this.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
0x82 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0x83 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0x84 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0x85 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86 => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0x88 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0x89 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0x8A => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0x8B => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0x8C => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0x8D => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0x8E => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0x8F => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0x90 => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0x91 => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0x92 => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0x93 => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0x94 => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0x95 => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0x96 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0x97 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0x98 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0x99 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0x9B => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0x9C => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0x9D => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0x9E => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0x9F => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xA0 => '#x2020', # DAGGER
0xA1 => '#x00B0', # DEGREE SIGN
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A7', # SECTION SIGN
0xA5 => '#x2022', # BULLET
0xA6 => '#x00B6', # PILCROW SIGN
0xA7 => '#x00DF', # LATIN SMALL LETTER SHARP S
0xA8 => '#x00AE', # REGISTERED SIGN
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x2122', # TRADE MARK SIGN
0xAB => '#x00B4', # ACUTE ACCENT
0xAC => '#x00A8', # DIAERESIS
0xAD => '#x2260', # NOT EQUAL TO
0xAE => '#x0102', # LATIN CAPITAL LETTER A WITH BREVE
0xAF => ['#x0053', '#x0326'], # LATIN CAPITAL LETTER S + COMBINING COMMA BELOW
0xB0 => '#x221E', # INFINITY
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x2264', # LESS-THAN OR EQUAL TO
0xB3 => '#x2265', # GREATER-THAN OR EQUAL TO
0xB4 => '#x00A5', # YEN SIGN
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x2202', # PARTIAL DIFFERENTIAL
0xB7 => '#x2211', # N-ARY SUMMATION
0xB8 => '#x220F', # N-ARY PRODUCT
0xB9 => '#x03C0', # GREEK SMALL LETTER PI
0xBA => '#x222B', # INTEGRAL
0xBB => '#x00AA', # FEMININE ORDINAL INDICATOR
0xBC => '#x00BA', # MASCULINE ORDINAL INDICATOR
0xBD => '#x03A9', # GREEK CAPITAL LETTER OMEGA
0xBE => '#x0103', # LATIN SMALL LETTER A WITH BREVE
0xBF => ['#x0073','#x0326'], # LATIN SMALL LETTER S + COMBINING COMMA BELOW
0xC0 => '#x00BF', # INVERTED QUESTION MARK
0xC1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xC2 => '#x00AC', # NOT SIGN
0xC3 => '#x221A', # SQUARE ROOT
0xC4 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0xC5 => '#x2248', # ALMOST EQUAL TO
0xC6 => '#x2206', # INCREMENT
0xC7 => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8 => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9 => '#x2026', # HORIZONTAL ELLIPSIS
0xCA => '#x00A0', # NO-BREAK SPACE
0xCB => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xCC => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xCD => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xCE => '#x0152', # LATIN CAPITAL LIGATURE OE
0xCF => '#x0153', # LATIN SMALL LIGATURE OE
0xD0 => '#x2013', # EN DASH
0xD1 => '#x2014', # EM DASH
0xD2 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0xD3 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0xD4 => '#x2018', # LEFT SINGLE QUOTATION MARK
0xD5 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0xD6 => '#x00F7', # DIVISION SIGN
0xD7 => '#x25CA', # LOZENGE
0xD8 => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
0xD9 => '#x0178', # LATIN CAPITAL LETTER Y WITH DIAERESIS
0xDA => '#x2044', # FRACTION SLASH
0xDB => '#x20AC', # EURO SIGN
0xDC => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0xDD => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xDE => ['#x0054','#x0326'], # LATIN CAPITAL LETTER T + COMBINING COMMA BELOW
0xDF => ['#x0074','#x0326'], # LATIN SMALL LETTER T + COMBINING COMMA BELOW
0xE0 => '#x2021', # DOUBLE DAGGER
0xE1 => '#x00B7', # MIDDLE DOT
0xE2 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0xE3 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0xE4 => '#x2030', # PER MILLE SIGN
0xE5 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xE6 => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xE7 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xE8 => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
0xE9 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xEA => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xEB => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
0xEC => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
0xED => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xEE => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xEF => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0 => '#xF8FF', # Apple logo
0xF1 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xF2 => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xF3 => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
0xF4 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xF5 => '#x0131', # LATIN SMALL LETTER DOTLESS I
0xF6 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0xF7 => '#x02DC', # SMALL TILDE
0xF8 => '#x00AF', # MACRON
0xF9 => '#x02D8', # BREVE
0xFA => '#x02D9', # DOT ABOVE
0xFB => '#x02DA', # RING ABOVE
0xFC => '#x00B8', # CEDILLA
0xFD => '#x02DD', # DOUBLE ACUTE ACCENT
0xFE => '#x02DB', # OGONEK
0xFF => '#x02C7', # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleThai;
# Apple Thai
#
# Lookup table for the Apple Thai character set.  The value of this file is
# an anonymous hash: each key is a byte value (0x80 and above; some byte
# values have no entry) and each value is the body of a Unicode numeric
# character reference ('#xHHHH', written without the surrounding '&' and
# ';').  A value given as an array reference pairs a Thai character with a
# second #xF87x reference; the comments describe these as positional
# variants ("low left", "low", "left") of that character.
# NOTE(review): presumably the consumer emits array entries in order and
# adds the '&'/';' delimiters -- confirm against the code that loads this.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0x81 => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0x82 => '#x2026', # HORIZONTAL ELLIPSIS
0x83 => ['#x0E48','#xF875'], # THAI CHARACTER MAI EK, low left position
0x84 => ['#x0E49','#xF875'], # THAI CHARACTER MAI THO, low left position
0x85 => ['#x0E4A','#xF875'], # THAI CHARACTER MAI TRI, low left position
0x86 => ['#x0E4B','#xF875'], # THAI CHARACTER MAI CHATTAWA, low left position
0x87 => ['#x0E4C','#xF875'], # THAI CHARACTER THANTHAKHAT, low left position
0x88 => ['#x0E48','#xF873'], # THAI CHARACTER MAI EK, low position
0x89 => ['#x0E49','#xF873'], # THAI CHARACTER MAI THO, low position
0x8A => ['#x0E4A','#xF873'], # THAI CHARACTER MAI TRI, low position
0x8B => ['#x0E4B','#xF873'], # THAI CHARACTER MAI CHATTAWA, low position
0x8C => ['#x0E4C','#xF873'], # THAI CHARACTER THANTHAKHAT, low position
0x8D => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x8E => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x8F => ['#x0E4D','#xF874'], # THAI CHARACTER NIKHAHIT, left position
0x91 => '#x2022', # BULLET
0x92 => ['#x0E31','#xF874'], # THAI CHARACTER MAI HAN-AKAT, left position
0x93 => ['#x0E47','#xF874'], # THAI CHARACTER MAITAIKHU, left position
0x94 => ['#x0E34','#xF874'], # THAI CHARACTER SARA I, left position
0x95 => ['#x0E35','#xF874'], # THAI CHARACTER SARA II, left position
0x96 => ['#x0E36','#xF874'], # THAI CHARACTER SARA UE, left position
0x97 => ['#x0E37','#xF874'], # THAI CHARACTER SARA UEE, left position
0x98 => ['#x0E48','#xF874'], # THAI CHARACTER MAI EK, left position
0x99 => ['#x0E49','#xF874'], # THAI CHARACTER MAI THO, left position
0x9A => ['#x0E4A','#xF874'], # THAI CHARACTER MAI TRI, left position
0x9B => ['#x0E4B','#xF874'], # THAI CHARACTER MAI CHATTAWA, left position
0x9C => ['#x0E4C','#xF874'], # THAI CHARACTER THANTHAKHAT, left position
0x9D => '#x2018', # LEFT SINGLE QUOTATION MARK
0x9E => '#x2019', # RIGHT SINGLE QUOTATION MARK
0xA1 => '#x0E01', # THAI CHARACTER KO KAI
0xA2 => '#x0E02', # THAI CHARACTER KHO KHAI
0xA3 => '#x0E03', # THAI CHARACTER KHO KHUAT
0xA4 => '#x0E04', # THAI CHARACTER KHO KHWAI
0xA5 => '#x0E05', # THAI CHARACTER KHO KHON
0xA6 => '#x0E06', # THAI CHARACTER KHO RAKHANG
0xA7 => '#x0E07', # THAI CHARACTER NGO NGU
0xA8 => '#x0E08', # THAI CHARACTER CHO CHAN
0xA9 => '#x0E09', # THAI CHARACTER CHO CHING
0xAA => '#x0E0A', # THAI CHARACTER CHO CHANG
0xAB => '#x0E0B', # THAI CHARACTER SO SO
0xAC => '#x0E0C', # THAI CHARACTER CHO CHOE
0xAD => '#x0E0D', # THAI CHARACTER YO YING
0xAE => '#x0E0E', # THAI CHARACTER DO CHADA
0xAF => '#x0E0F', # THAI CHARACTER TO PATAK
0xB0 => '#x0E10', # THAI CHARACTER THO THAN
0xB1 => '#x0E11', # THAI CHARACTER THO NANGMONTHO
0xB2 => '#x0E12', # THAI CHARACTER THO PHUTHAO
0xB3 => '#x0E13', # THAI CHARACTER NO NEN
0xB4 => '#x0E14', # THAI CHARACTER DO DEK
0xB5 => '#x0E15', # THAI CHARACTER TO TAO
0xB6 => '#x0E16', # THAI CHARACTER THO THUNG
0xB7 => '#x0E17', # THAI CHARACTER THO THAHAN
0xB8 => '#x0E18', # THAI CHARACTER THO THONG
0xB9 => '#x0E19', # THAI CHARACTER NO NU
0xBA => '#x0E1A', # THAI CHARACTER BO BAIMAI
0xBB => '#x0E1B', # THAI CHARACTER PO PLA
0xBC => '#x0E1C', # THAI CHARACTER PHO PHUNG
0xBD => '#x0E1D', # THAI CHARACTER FO FA
0xBE => '#x0E1E', # THAI CHARACTER PHO PHAN
0xBF => '#x0E1F', # THAI CHARACTER FO FAN
0xC0 => '#x0E20', # THAI CHARACTER PHO SAMPHAO
0xC1 => '#x0E21', # THAI CHARACTER MO MA
0xC2 => '#x0E22', # THAI CHARACTER YO YAK
0xC3 => '#x0E23', # THAI CHARACTER RO RUA
0xC4 => '#x0E24', # THAI CHARACTER RU
0xC5 => '#x0E25', # THAI CHARACTER LO LING
0xC6 => '#x0E26', # THAI CHARACTER LU
0xC7 => '#x0E27', # THAI CHARACTER WO WAEN
0xC8 => '#x0E28', # THAI CHARACTER SO SALA
0xC9 => '#x0E29', # THAI CHARACTER SO RUSI
0xCA => '#x0E2A', # THAI CHARACTER SO SUA
0xCB => '#x0E2B', # THAI CHARACTER HO HIP
0xCC => '#x0E2C', # THAI CHARACTER LO CHULA
0xCD => '#x0E2D', # THAI CHARACTER O ANG
0xCE => '#x0E2E', # THAI CHARACTER HO NOKHUK
0xCF => '#x0E2F', # THAI CHARACTER PAIYANNOI
0xD0 => '#x0E30', # THAI CHARACTER SARA A
0xD1 => '#x0E31', # THAI CHARACTER MAI HAN-AKAT
0xD2 => '#x0E32', # THAI CHARACTER SARA AA
0xD3 => '#x0E33', # THAI CHARACTER SARA AM
0xD4 => '#x0E34', # THAI CHARACTER SARA I
0xD5 => '#x0E35', # THAI CHARACTER SARA II
0xD6 => '#x0E36', # THAI CHARACTER SARA UE
0xD7 => '#x0E37', # THAI CHARACTER SARA UEE
0xD8 => '#x0E38', # THAI CHARACTER SARA U
0xD9 => '#x0E39', # THAI CHARACTER SARA UU
0xDA => '#x0E3A', # THAI CHARACTER PHINTHU
0xDB => '#xFEFF', # ZERO WIDTH NO-BREAK SPACE
0xDC => '#x200B', # ZERO WIDTH SPACE
0xDD => '#x2013', # EN DASH
0xDE => '#x2014', # EM DASH
0xDF => '#x0E3F', # THAI CURRENCY SYMBOL BAHT
0xE0 => '#x0E40', # THAI CHARACTER SARA E
0xE1 => '#x0E41', # THAI CHARACTER SARA AE
0xE2 => '#x0E42', # THAI CHARACTER SARA O
0xE3 => '#x0E43', # THAI CHARACTER SARA AI MAIMUAN
0xE4 => '#x0E44', # THAI CHARACTER SARA AI MAIMALAI
0xE5 => '#x0E45', # THAI CHARACTER LAKKHANGYAO
0xE6 => '#x0E46', # THAI CHARACTER MAIYAMOK
0xE7 => '#x0E47', # THAI CHARACTER MAITAIKHU
0xE8 => '#x0E48', # THAI CHARACTER MAI EK
0xE9 => '#x0E49', # THAI CHARACTER MAI THO
0xEA => '#x0E4A', # THAI CHARACTER MAI TRI
0xEB => '#x0E4B', # THAI CHARACTER MAI CHATTAWA
0xEC => '#x0E4C', # THAI CHARACTER THANTHAKHAT
0xED => '#x0E4D', # THAI CHARACTER NIKHAHIT
0xEE => '#x2122', # TRADE MARK SIGN
0xEF => '#x0E4F', # THAI CHARACTER FONGMAN
0xF0 => '#x0E50', # THAI DIGIT ZERO
0xF1 => '#x0E51', # THAI DIGIT ONE
0xF2 => '#x0E52', # THAI DIGIT TWO
0xF3 => '#x0E53', # THAI DIGIT THREE
0xF4 => '#x0E54', # THAI DIGIT FOUR
0xF5 => '#x0E55', # THAI DIGIT FIVE
0xF6 => '#x0E56', # THAI DIGIT SIX
0xF7 => '#x0E57', # THAI DIGIT SEVEN
0xF8 => '#x0E58', # THAI DIGIT EIGHT
0xF9 => '#x0E59', # THAI DIGIT NINE
0xFA => '#x00AE', # REGISTERED SIGN
0xFB => '#x00A9', # COPYRIGHT SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::AppleTurkish;
# Apple Turkish
#
# Character mapping table for the Apple Turkish 8-bit charset.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').  Every byte
# from 0x80 through 0xFF has an entry; bytes below 0x80 are not listed.
#
# The values for 0xF0 ('#xF8FF', Apple logo) and 0xF5 ('#xF8A0',
# "undefined1") are code points in Unicode's Private Use Area, so how
# they render depends on the fonts available to the viewer.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
0x82 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0x83 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0x84 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0x85 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86 => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0x88 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0x89 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0x8A => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0x8B => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0x8C => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0x8D => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0x8E => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0x8F => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0x90 => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0x91 => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0x92 => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0x93 => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0x94 => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0x95 => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0x96 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0x97 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0x98 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0x99 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0x9B => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0x9C => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0x9D => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0x9E => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0x9F => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xA0 => '#x2020', # DAGGER
0xA1 => '#x00B0', # DEGREE SIGN
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A7', # SECTION SIGN
0xA5 => '#x2022', # BULLET
0xA6 => '#x00B6', # PILCROW SIGN
0xA7 => '#x00DF', # LATIN SMALL LETTER SHARP S
0xA8 => '#x00AE', # REGISTERED SIGN
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x2122', # TRADE MARK SIGN
0xAB => '#x00B4', # ACUTE ACCENT
0xAC => '#x00A8', # DIAERESIS
0xAD => '#x2260', # NOT EQUAL TO
0xAE => '#x00C6', # LATIN CAPITAL LETTER AE
0xAF => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
0xB0 => '#x221E', # INFINITY
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x2264', # LESS-THAN OR EQUAL TO
0xB3 => '#x2265', # GREATER-THAN OR EQUAL TO
0xB4 => '#x00A5', # YEN SIGN
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x2202', # PARTIAL DIFFERENTIAL
0xB7 => '#x2211', # N-ARY SUMMATION
0xB8 => '#x220F', # N-ARY PRODUCT
0xB9 => '#x03C0', # GREEK SMALL LETTER PI
0xBA => '#x222B', # INTEGRAL
0xBB => '#x00AA', # FEMININE ORDINAL INDICATOR
0xBC => '#x00BA', # MASCULINE ORDINAL INDICATOR
0xBD => '#x03A9', # GREEK CAPITAL LETTER OMEGA
0xBE => '#x00E6', # LATIN SMALL LETTER AE
0xBF => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
0xC0 => '#x00BF', # INVERTED QUESTION MARK
0xC1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xC2 => '#x00AC', # NOT SIGN
0xC3 => '#x221A', # SQUARE ROOT
0xC4 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0xC5 => '#x2248', # ALMOST EQUAL TO
0xC6 => '#x2206', # INCREMENT
0xC7 => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8 => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9 => '#x2026', # HORIZONTAL ELLIPSIS
0xCA => '#x00A0', # NO-BREAK SPACE
0xCB => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xCC => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xCD => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xCE => '#x0152', # LATIN CAPITAL LIGATURE OE
0xCF => '#x0153', # LATIN SMALL LIGATURE OE
0xD0 => '#x2013', # EN DASH
0xD1 => '#x2014', # EM DASH
0xD2 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0xD3 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0xD4 => '#x2018', # LEFT SINGLE QUOTATION MARK
0xD5 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0xD6 => '#x00F7', # DIVISION SIGN
0xD7 => '#x25CA', # LOZENGE
0xD8 => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
0xD9 => '#x0178', # LATIN CAPITAL LETTER Y WITH DIAERESIS
0xDA => '#x011E', # LATIN CAPITAL LETTER G WITH BREVE
0xDB => '#x011F', # LATIN SMALL LETTER G WITH BREVE
0xDC => '#x0130', # LATIN CAPITAL LETTER I WITH DOT ABOVE
0xDD => '#x0131', # LATIN SMALL LETTER DOTLESS I
0xDE => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
0xDF => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
0xE0 => '#x2021', # DOUBLE DAGGER
0xE1 => '#x00B7', # MIDDLE DOT
0xE2 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0xE3 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0xE4 => '#x2030', # PER MILLE SIGN
0xE5 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xE6 => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xE7 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xE8 => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
0xE9 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xEA => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xEB => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
0xEC => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
0xED => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xEE => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xEF => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0 => '#xF8FF', # Apple logo
0xF1 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xF2 => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xF3 => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
0xF4 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xF5 => '#xF8A0', # undefined1
0xF6 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0xF7 => '#x02DC', # SMALL TILDE
0xF8 => '#x00AF', # MACRON
0xF9 => '#x02D8', # BREVE
0xFA => '#x02D9', # DOT ABOVE
0xFB => '#x02DA', # RING ABOVE
0xFC => '#x00B8', # CEDILLA
0xFD => '#x02DD', # DOUBLE ACUTE ACCENT
0xFE => '#x02DB', # OGONEK
0xFF => '#x02C7', # CARON
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1251;
# WinCyrillic
#
# Character mapping table for Windows code page 1251.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').
#
# Bytes with no entry in this table: 0x98, 0xA0, 0xA4, 0xA6, 0xA7, 0xA9,
# 0xAB-0xAE, 0xB0, 0xB1, 0xB5-0xB7 and 0xBB; bytes below 0x80 are not
# listed either.
# NOTE(review): apart from 0x98, the missing bytes are positions where
# code page 1251 holds the same character as ISO-8859-1 (no-break space,
# section sign, copyright sign, ...).  Confirm that the converter handles
# them through another path, and that the entries were not lost.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x0402', # CYRILLIC CAPITAL LETTER DJE
0x81 => '#x0403', # CYRILLIC CAPITAL LETTER GJE
0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0x83 => '#x0453', # CYRILLIC SMALL LETTER GJE
0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0x85 => '#x2026', # HORIZONTAL ELLIPSIS
0x86 => '#x2020', # DAGGER
0x87 => '#x2021', # DOUBLE DAGGER
0x88 => '#x20AC', # EURO SIGN
0x89 => '#x2030', # PER MILLE SIGN
0x8A => '#x0409', # CYRILLIC CAPITAL LETTER LJE
0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0x8C => '#x040A', # CYRILLIC CAPITAL LETTER NJE
0x8D => '#x040C', # CYRILLIC CAPITAL LETTER KJE
0x8E => '#x040B', # CYRILLIC CAPITAL LETTER TSHE
0x8F => '#x040F', # CYRILLIC CAPITAL LETTER DZHE
0x90 => '#x0452', # CYRILLIC SMALL LETTER DJE
0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x95 => '#x2022', # BULLET
0x96 => '#x2013', # EN DASH
0x97 => '#x2014', # EM DASH
0x99 => '#x2122', # TRADE MARK SIGN
0x9A => '#x0459', # CYRILLIC SMALL LETTER LJE
0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0x9C => '#x045A', # CYRILLIC SMALL LETTER NJE
0x9D => '#x045C', # CYRILLIC SMALL LETTER KJE
0x9E => '#x045B', # CYRILLIC SMALL LETTER TSHE
0x9F => '#x045F', # CYRILLIC SMALL LETTER DZHE
0xA1 => '#x040E', # CYRILLIC CAPITAL LETTER SHORT U
0xA2 => '#x045E', # CYRILLIC SMALL LETTER SHORT U
0xA3 => '#x0408', # CYRILLIC CAPITAL LETTER JE
0xA5 => '#x0490', # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
0xA8 => '#x0401', # CYRILLIC CAPITAL LETTER IO
0xAA => '#x0404', # CYRILLIC CAPITAL LETTER UKRAINIAN IE
0xAF => '#x0407', # CYRILLIC CAPITAL LETTER YI
0xB2 => '#x0406', # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
0xB3 => '#x0456', # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
0xB4 => '#x0491', # CYRILLIC SMALL LETTER GHE WITH UPTURN
0xB8 => '#x0451', # CYRILLIC SMALL LETTER IO
0xB9 => '#x2116', # NUMERO SIGN
0xBA => '#x0454', # CYRILLIC SMALL LETTER UKRAINIAN IE
0xBC => '#x0458', # CYRILLIC SMALL LETTER JE
0xBD => '#x0405', # CYRILLIC CAPITAL LETTER DZE
0xBE => '#x0455', # CYRILLIC SMALL LETTER DZE
0xBF => '#x0457', # CYRILLIC SMALL LETTER YI
0xC0 => '#x0410', # CYRILLIC CAPITAL LETTER A
0xC1 => '#x0411', # CYRILLIC CAPITAL LETTER BE
0xC2 => '#x0412', # CYRILLIC CAPITAL LETTER VE
0xC3 => '#x0413', # CYRILLIC CAPITAL LETTER GHE
0xC4 => '#x0414', # CYRILLIC CAPITAL LETTER DE
0xC5 => '#x0415', # CYRILLIC CAPITAL LETTER IE
0xC6 => '#x0416', # CYRILLIC CAPITAL LETTER ZHE
0xC7 => '#x0417', # CYRILLIC CAPITAL LETTER ZE
0xC8 => '#x0418', # CYRILLIC CAPITAL LETTER I
0xC9 => '#x0419', # CYRILLIC CAPITAL LETTER SHORT I
0xCA => '#x041A', # CYRILLIC CAPITAL LETTER KA
0xCB => '#x041B', # CYRILLIC CAPITAL LETTER EL
0xCC => '#x041C', # CYRILLIC CAPITAL LETTER EM
0xCD => '#x041D', # CYRILLIC CAPITAL LETTER EN
0xCE => '#x041E', # CYRILLIC CAPITAL LETTER O
0xCF => '#x041F', # CYRILLIC CAPITAL LETTER PE
0xD0 => '#x0420', # CYRILLIC CAPITAL LETTER ER
0xD1 => '#x0421', # CYRILLIC CAPITAL LETTER ES
0xD2 => '#x0422', # CYRILLIC CAPITAL LETTER TE
0xD3 => '#x0423', # CYRILLIC CAPITAL LETTER U
0xD4 => '#x0424', # CYRILLIC CAPITAL LETTER EF
0xD5 => '#x0425', # CYRILLIC CAPITAL LETTER HA
0xD6 => '#x0426', # CYRILLIC CAPITAL LETTER TSE
0xD7 => '#x0427', # CYRILLIC CAPITAL LETTER CHE
0xD8 => '#x0428', # CYRILLIC CAPITAL LETTER SHA
0xD9 => '#x0429', # CYRILLIC CAPITAL LETTER SHCHA
0xDA => '#x042A', # CYRILLIC CAPITAL LETTER HARD SIGN
0xDB => '#x042B', # CYRILLIC CAPITAL LETTER YERU
0xDC => '#x042C', # CYRILLIC CAPITAL LETTER SOFT SIGN
0xDD => '#x042D', # CYRILLIC CAPITAL LETTER E
0xDE => '#x042E', # CYRILLIC CAPITAL LETTER YU
0xDF => '#x042F', # CYRILLIC CAPITAL LETTER YA
0xE0 => '#x0430', # CYRILLIC SMALL LETTER A
0xE1 => '#x0431', # CYRILLIC SMALL LETTER BE
0xE2 => '#x0432', # CYRILLIC SMALL LETTER VE
0xE3 => '#x0433', # CYRILLIC SMALL LETTER GHE
0xE4 => '#x0434', # CYRILLIC SMALL LETTER DE
0xE5 => '#x0435', # CYRILLIC SMALL LETTER IE
0xE6 => '#x0436', # CYRILLIC SMALL LETTER ZHE
0xE7 => '#x0437', # CYRILLIC SMALL LETTER ZE
0xE8 => '#x0438', # CYRILLIC SMALL LETTER I
0xE9 => '#x0439', # CYRILLIC SMALL LETTER SHORT I
0xEA => '#x043A', # CYRILLIC SMALL LETTER KA
0xEB => '#x043B', # CYRILLIC SMALL LETTER EL
0xEC => '#x043C', # CYRILLIC SMALL LETTER EM
0xED => '#x043D', # CYRILLIC SMALL LETTER EN
0xEE => '#x043E', # CYRILLIC SMALL LETTER O
0xEF => '#x043F', # CYRILLIC SMALL LETTER PE
0xF0 => '#x0440', # CYRILLIC SMALL LETTER ER
0xF1 => '#x0441', # CYRILLIC SMALL LETTER ES
0xF2 => '#x0442', # CYRILLIC SMALL LETTER TE
0xF3 => '#x0443', # CYRILLIC SMALL LETTER U
0xF4 => '#x0444', # CYRILLIC SMALL LETTER EF
0xF5 => '#x0445', # CYRILLIC SMALL LETTER HA
0xF6 => '#x0446', # CYRILLIC SMALL LETTER TSE
0xF7 => '#x0447', # CYRILLIC SMALL LETTER CHE
0xF8 => '#x0448', # CYRILLIC SMALL LETTER SHA
0xF9 => '#x0449', # CYRILLIC SMALL LETTER SHCHA
0xFA => '#x044A', # CYRILLIC SMALL LETTER HARD SIGN
0xFB => '#x044B', # CYRILLIC SMALL LETTER YERU
0xFC => '#x044C', # CYRILLIC SMALL LETTER SOFT SIGN
0xFD => '#x044D', # CYRILLIC SMALL LETTER E
0xFE => '#x044E', # CYRILLIC SMALL LETTER YU
0xFF => '#x044F', # CYRILLIC SMALL LETTER YA
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1253;
# WinGreek
#
# Character mapping table for Windows code page 1253.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').
#
# Bytes with no entry in this table: 0x81, 0x88, 0x8A, 0x8C-0x90, 0x98,
# 0x9A, 0x9C-0xA0, 0xAA, 0xD2 and 0xFF; bytes below 0x80 are not listed
# either.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x20AC', # EURO SIGN
0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0x83 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0x85 => '#x2026', # HORIZONTAL ELLIPSIS
0x86 => '#x2020', # DAGGER
0x87 => '#x2021', # DOUBLE DAGGER
0x89 => '#x2030', # PER MILLE SIGN
0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x95 => '#x2022', # BULLET
0x96 => '#x2013', # EN DASH
0x97 => '#x2014', # EM DASH
0x99 => '#x2122', # TRADE MARK SIGN
0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xA1 => '#x0385', # GREEK DIALYTIKA TONOS
0xA2 => '#x0386', # GREEK CAPITAL LETTER ALPHA WITH TONOS
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A4', # CURRENCY SIGN
0xA5 => '#x00A5', # YEN SIGN
0xA6 => '#x00A6', # BROKEN BAR
0xA7 => '#x00A7', # SECTION SIGN
0xA8 => '#x00A8', # DIAERESIS
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xAC => '#x00AC', # NOT SIGN
0xAD => '#x00AD', # SOFT HYPHEN
0xAE => '#x00AE', # REGISTERED SIGN
0xAF => '#x2015', # HORIZONTAL BAR
0xB0 => '#x00B0', # DEGREE SIGN
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x00B2', # SUPERSCRIPT TWO
0xB3 => '#x00B3', # SUPERSCRIPT THREE
0xB4 => '#x0384', # GREEK TONOS
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x00B6', # PILCROW SIGN
0xB7 => '#x00B7', # MIDDLE DOT
0xB8 => '#x0388', # GREEK CAPITAL LETTER EPSILON WITH TONOS
0xB9 => '#x0389', # GREEK CAPITAL LETTER ETA WITH TONOS
0xBA => '#x038A', # GREEK CAPITAL LETTER IOTA WITH TONOS
0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xBC => '#x038C', # GREEK CAPITAL LETTER OMICRON WITH TONOS
0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
0xBE => '#x038E', # GREEK CAPITAL LETTER UPSILON WITH TONOS
0xBF => '#x038F', # GREEK CAPITAL LETTER OMEGA WITH TONOS
0xC0 => '#x0390', # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
0xC1 => '#x0391', # GREEK CAPITAL LETTER ALPHA
0xC2 => '#x0392', # GREEK CAPITAL LETTER BETA
0xC3 => '#x0393', # GREEK CAPITAL LETTER GAMMA
0xC4 => '#x0394', # GREEK CAPITAL LETTER DELTA
0xC5 => '#x0395', # GREEK CAPITAL LETTER EPSILON
0xC6 => '#x0396', # GREEK CAPITAL LETTER ZETA
0xC7 => '#x0397', # GREEK CAPITAL LETTER ETA
0xC8 => '#x0398', # GREEK CAPITAL LETTER THETA
0xC9 => '#x0399', # GREEK CAPITAL LETTER IOTA
0xCA => '#x039A', # GREEK CAPITAL LETTER KAPPA
0xCB => '#x039B', # GREEK CAPITAL LETTER LAMDA
0xCC => '#x039C', # GREEK CAPITAL LETTER MU
0xCD => '#x039D', # GREEK CAPITAL LETTER NU
0xCE => '#x039E', # GREEK CAPITAL LETTER XI
0xCF => '#x039F', # GREEK CAPITAL LETTER OMICRON
0xD0 => '#x03A0', # GREEK CAPITAL LETTER PI
0xD1 => '#x03A1', # GREEK CAPITAL LETTER RHO
0xD3 => '#x03A3', # GREEK CAPITAL LETTER SIGMA
0xD4 => '#x03A4', # GREEK CAPITAL LETTER TAU
0xD5 => '#x03A5', # GREEK CAPITAL LETTER UPSILON
0xD6 => '#x03A6', # GREEK CAPITAL LETTER PHI
0xD7 => '#x03A7', # GREEK CAPITAL LETTER CHI
0xD8 => '#x03A8', # GREEK CAPITAL LETTER PSI
0xD9 => '#x03A9', # GREEK CAPITAL LETTER OMEGA
0xDA => '#x03AA', # GREEK CAPITAL LETTER IOTA WITH DIALYTIKA
0xDB => '#x03AB', # GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA
0xDC => '#x03AC', # GREEK SMALL LETTER ALPHA WITH TONOS
0xDD => '#x03AD', # GREEK SMALL LETTER EPSILON WITH TONOS
0xDE => '#x03AE', # GREEK SMALL LETTER ETA WITH TONOS
0xDF => '#x03AF', # GREEK SMALL LETTER IOTA WITH TONOS
0xE0 => '#x03B0', # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
0xE1 => '#x03B1', # GREEK SMALL LETTER ALPHA
0xE2 => '#x03B2', # GREEK SMALL LETTER BETA
0xE3 => '#x03B3', # GREEK SMALL LETTER GAMMA
0xE4 => '#x03B4', # GREEK SMALL LETTER DELTA
0xE5 => '#x03B5', # GREEK SMALL LETTER EPSILON
0xE6 => '#x03B6', # GREEK SMALL LETTER ZETA
0xE7 => '#x03B7', # GREEK SMALL LETTER ETA
0xE8 => '#x03B8', # GREEK SMALL LETTER THETA
0xE9 => '#x03B9', # GREEK SMALL LETTER IOTA
0xEA => '#x03BA', # GREEK SMALL LETTER KAPPA
0xEB => '#x03BB', # GREEK SMALL LETTER LAMDA
0xEC => '#x03BC', # GREEK SMALL LETTER MU
0xED => '#x03BD', # GREEK SMALL LETTER NU
0xEE => '#x03BE', # GREEK SMALL LETTER XI
0xEF => '#x03BF', # GREEK SMALL LETTER OMICRON
0xF0 => '#x03C0', # GREEK SMALL LETTER PI
0xF1 => '#x03C1', # GREEK SMALL LETTER RHO
0xF2 => '#x03C2', # GREEK SMALL LETTER FINAL SIGMA
0xF3 => '#x03C3', # GREEK SMALL LETTER SIGMA
0xF4 => '#x03C4', # GREEK SMALL LETTER TAU
0xF5 => '#x03C5', # GREEK SMALL LETTER UPSILON
0xF6 => '#x03C6', # GREEK SMALL LETTER PHI
0xF7 => '#x03C7', # GREEK SMALL LETTER CHI
0xF8 => '#x03C8', # GREEK SMALL LETTER PSI
0xF9 => '#x03C9', # GREEK SMALL LETTER OMEGA
0xFA => '#x03CA', # GREEK SMALL LETTER IOTA WITH DIALYTIKA
0xFB => '#x03CB', # GREEK SMALL LETTER UPSILON WITH DIALYTIKA
0xFC => '#x03CC', # GREEK SMALL LETTER OMICRON WITH TONOS
0xFD => '#x03CD', # GREEK SMALL LETTER UPSILON WITH TONOS
0xFE => '#x03CE', # GREEK SMALL LETTER OMEGA WITH TONOS
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1254;
# WinTurkish
#
# Character mapping table for Windows code page 1254.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').
#
# Bytes with no entry in this table: 0x81, 0x8D-0x90, 0x9D, 0x9E and
# 0xA0; bytes below 0x80 are not listed either.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x20AC', # EURO SIGN
0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0x83 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0x85 => '#x2026', # HORIZONTAL ELLIPSIS
0x86 => '#x2020', # DAGGER
0x87 => '#x2021', # DOUBLE DAGGER
0x88 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0x89 => '#x2030', # PER MILLE SIGN
0x8A => '#x0160', # LATIN CAPITAL LETTER S WITH CARON
0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0x8C => '#x0152', # LATIN CAPITAL LIGATURE OE
0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x95 => '#x2022', # BULLET
0x96 => '#x2013', # EN DASH
0x97 => '#x2014', # EM DASH
0x98 => '#x02DC', # SMALL TILDE
0x99 => '#x2122', # TRADE MARK SIGN
0x9A => '#x0161', # LATIN SMALL LETTER S WITH CARON
0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0x9C => '#x0153', # LATIN SMALL LIGATURE OE
0x9F => '#x0178', # LATIN CAPITAL LETTER Y WITH DIAERESIS
0xA1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A4', # CURRENCY SIGN
0xA5 => '#x00A5', # YEN SIGN
0xA6 => '#x00A6', # BROKEN BAR
0xA7 => '#x00A7', # SECTION SIGN
0xA8 => '#x00A8', # DIAERESIS
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x00AA', # FEMININE ORDINAL INDICATOR
0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xAC => '#x00AC', # NOT SIGN
0xAD => '#x00AD', # SOFT HYPHEN
0xAE => '#x00AE', # REGISTERED SIGN
0xAF => '#x00AF', # MACRON
0xB0 => '#x00B0', # DEGREE SIGN
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x00B2', # SUPERSCRIPT TWO
0xB3 => '#x00B3', # SUPERSCRIPT THREE
0xB4 => '#x00B4', # ACUTE ACCENT
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x00B6', # PILCROW SIGN
0xB7 => '#x00B7', # MIDDLE DOT
0xB8 => '#x00B8', # CEDILLA
0xB9 => '#x00B9', # SUPERSCRIPT ONE
0xBA => '#x00BA', # MASCULINE ORDINAL INDICATOR
0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xBC => '#x00BC', # VULGAR FRACTION ONE QUARTER
0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
0xBE => '#x00BE', # VULGAR FRACTION THREE QUARTERS
0xBF => '#x00BF', # INVERTED QUESTION MARK
0xC0 => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xC3 => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
0xC5 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
0xC6 => '#x00C6', # LATIN CAPITAL LETTER AE
0xC7 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
0xC8 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0xCA => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
0xCC => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
0xCF => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
0xD0 => '#x011E', # LATIN CAPITAL LETTER G WITH BREVE
0xD1 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
0xD2 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xD5 => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
0xD7 => '#x00D7', # MULTIPLICATION SIGN
0xD8 => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
0xD9 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xDB => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
0xDD => '#x0130', # LATIN CAPITAL LETTER I WITH DOT ABOVE
0xDE => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
0xE0 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0xE3 => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
0xE5 => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
0xE6 => '#x00E6', # LATIN SMALL LETTER AE
0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0xE8 => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0xEA => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0xEC => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0xEF => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0xF0 => '#x011F', # LATIN SMALL LETTER G WITH BREVE
0xF1 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
0xF2 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0xF5 => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
0xF7 => '#x00F7', # DIVISION SIGN
0xF8 => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
0xF9 => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xFD => '#x0131', # LATIN SMALL LETTER DOTLESS I
0xFE => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
0xFF => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1255;
# WinHebrew
#
# Character mapping table for Windows code page 1255.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').
#
# Bytes with no entry in this table: 0x81, 0x8A, 0x8C-0x90, 0x9A,
# 0x9C-0xA0, 0xCA, 0xD9-0xDF, 0xFB, 0xFC and 0xFF; bytes below 0x80 are
# not listed either.
#
# The table only maps individual bytes to code points.  The commit log
# for this file states that directional re-ordering for rendering
# bidirectional text is not supported.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x20AC', # EURO SIGN
0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0x83 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0x85 => '#x2026', # HORIZONTAL ELLIPSIS
0x86 => '#x2020', # DAGGER
0x87 => '#x2021', # DOUBLE DAGGER
0x88 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0x89 => '#x2030', # PER MILLE SIGN
0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x95 => '#x2022', # BULLET
0x96 => '#x2013', # EN DASH
0x97 => '#x2014', # EM DASH
0x98 => '#x02DC', # SMALL TILDE
0x99 => '#x2122', # TRADE MARK SIGN
0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xA1 => '#x00A1', # INVERTED EXCLAMATION MARK
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x20AA', # NEW SHEQEL SIGN
0xA5 => '#x00A5', # YEN SIGN
0xA6 => '#x00A6', # BROKEN BAR
0xA7 => '#x00A7', # SECTION SIGN
0xA8 => '#x00A8', # DIAERESIS
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x00D7', # MULTIPLICATION SIGN
0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xAC => '#x00AC', # NOT SIGN
0xAD => '#x00AD', # SOFT HYPHEN
0xAE => '#x00AE', # REGISTERED SIGN
0xAF => '#x00AF', # MACRON
0xB0 => '#x00B0', # DEGREE SIGN
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x00B2', # SUPERSCRIPT TWO
0xB3 => '#x00B3', # SUPERSCRIPT THREE
0xB4 => '#x00B4', # ACUTE ACCENT
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x00B6', # PILCROW SIGN
0xB7 => '#x00B7', # MIDDLE DOT
0xB8 => '#x00B8', # CEDILLA
0xB9 => '#x00B9', # SUPERSCRIPT ONE
0xBA => '#x00F7', # DIVISION SIGN
0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xBC => '#x00BC', # VULGAR FRACTION ONE QUARTER
0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
0xBE => '#x00BE', # VULGAR FRACTION THREE QUARTERS
0xBF => '#x00BF', # INVERTED QUESTION MARK
0xC0 => '#x05B0', # HEBREW POINT SHEVA
0xC1 => '#x05B1', # HEBREW POINT HATAF SEGOL
0xC2 => '#x05B2', # HEBREW POINT HATAF PATAH
0xC3 => '#x05B3', # HEBREW POINT HATAF QAMATS
0xC4 => '#x05B4', # HEBREW POINT HIRIQ
0xC5 => '#x05B5', # HEBREW POINT TSERE
0xC6 => '#x05B6', # HEBREW POINT SEGOL
0xC7 => '#x05B7', # HEBREW POINT PATAH
0xC8 => '#x05B8', # HEBREW POINT QAMATS
0xC9 => '#x05B9', # HEBREW POINT HOLAM
0xCB => '#x05BB', # HEBREW POINT QUBUTS
0xCC => '#x05BC', # HEBREW POINT DAGESH OR MAPIQ
0xCD => '#x05BD', # HEBREW POINT METEG
0xCE => '#x05BE', # HEBREW PUNCTUATION MAQAF
0xCF => '#x05BF', # HEBREW POINT RAFE
0xD0 => '#x05C0', # HEBREW PUNCTUATION PASEQ
0xD1 => '#x05C1', # HEBREW POINT SHIN DOT
0xD2 => '#x05C2', # HEBREW POINT SIN DOT
0xD3 => '#x05C3', # HEBREW PUNCTUATION SOF PASUQ
0xD4 => '#x05F0', # HEBREW LIGATURE YIDDISH DOUBLE VAV
0xD5 => '#x05F1', # HEBREW LIGATURE YIDDISH VAV YOD
0xD6 => '#x05F2', # HEBREW LIGATURE YIDDISH DOUBLE YOD
0xD7 => '#x05F3', # HEBREW PUNCTUATION GERESH
0xD8 => '#x05F4', # HEBREW PUNCTUATION GERSHAYIM
0xE0 => '#x05D0', # HEBREW LETTER ALEF
0xE1 => '#x05D1', # HEBREW LETTER BET
0xE2 => '#x05D2', # HEBREW LETTER GIMEL
0xE3 => '#x05D3', # HEBREW LETTER DALET
0xE4 => '#x05D4', # HEBREW LETTER HE
0xE5 => '#x05D5', # HEBREW LETTER VAV
0xE6 => '#x05D6', # HEBREW LETTER ZAYIN
0xE7 => '#x05D7', # HEBREW LETTER HET
0xE8 => '#x05D8', # HEBREW LETTER TET
0xE9 => '#x05D9', # HEBREW LETTER YOD
0xEA => '#x05DA', # HEBREW LETTER FINAL KAF
0xEB => '#x05DB', # HEBREW LETTER KAF
0xEC => '#x05DC', # HEBREW LETTER LAMED
0xED => '#x05DD', # HEBREW LETTER FINAL MEM
0xEE => '#x05DE', # HEBREW LETTER MEM
0xEF => '#x05DF', # HEBREW LETTER FINAL NUN
0xF0 => '#x05E0', # HEBREW LETTER NUN
0xF1 => '#x05E1', # HEBREW LETTER SAMEKH
0xF2 => '#x05E2', # HEBREW LETTER AYIN
0xF3 => '#x05E3', # HEBREW LETTER FINAL PE
0xF4 => '#x05E4', # HEBREW LETTER PE
0xF5 => '#x05E5', # HEBREW LETTER FINAL TSADI
0xF6 => '#x05E6', # HEBREW LETTER TSADI
0xF7 => '#x05E7', # HEBREW LETTER QOF
0xF8 => '#x05E8', # HEBREW LETTER RESH
0xF9 => '#x05E9', # HEBREW LETTER SHIN
0xFA => '#x05EA', # HEBREW LETTER TAV
0xFD => '#x200E', # LEFT-TO-RIGHT MARK
0xFE => '#x200F', # RIGHT-TO-LEFT MARK
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1256;
# WinArabic
#
# Character mapping table for Windows code page 1256.
#
# The only expression in this file is an anonymous hash.  Each key is a
# byte value and each value is the body of a numeric character reference
# in the form '#xHHHH' (no leading '&', no trailing ';').
#
# Every byte from 0x80 through 0xFF has an entry except 0xA0; bytes
# below 0x80 are not listed.
#
# The table only maps individual bytes to code points.  The commit log
# for this file states that directional re-ordering for rendering
# bidirectional text is not supported.
#
# NOTE(review): presumably the loader takes this hash reference as the
# file's return value and wraps each value as "&...;" -- confirm against
# the code that loads the MHonArc::CharEnt::* tables.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x80 => '#x20AC', # EURO SIGN
0x81 => '#x067E', # ARABIC LETTER PEH
0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
0x83 => '#x0192', # LATIN SMALL LETTER F WITH HOOK
0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
0x85 => '#x2026', # HORIZONTAL ELLIPSIS
0x86 => '#x2020', # DAGGER
0x87 => '#x2021', # DOUBLE DAGGER
0x88 => '#x02C6', # MODIFIER LETTER CIRCUMFLEX ACCENT
0x89 => '#x2030', # PER MILLE SIGN
0x8A => '#x0679', # ARABIC LETTER TTEH
0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0x8C => '#x0152', # LATIN CAPITAL LIGATURE OE
0x8D => '#x0686', # ARABIC LETTER TCHEH
0x8E => '#x0698', # ARABIC LETTER JEH
0x8F => '#x0688', # ARABIC LETTER DDAL
0x90 => '#x06AF', # ARABIC LETTER GAF
0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
0x95 => '#x2022', # BULLET
0x96 => '#x2013', # EN DASH
0x97 => '#x2014', # EM DASH
0x98 => '#x06A9', # ARABIC LETTER KEHEH
0x99 => '#x2122', # TRADE MARK SIGN
0x9A => '#x0691', # ARABIC LETTER RREH
0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0x9C => '#x0153', # LATIN SMALL LIGATURE OE
0x9D => '#x200C', # ZERO WIDTH NON-JOINER
0x9E => '#x200D', # ZERO WIDTH JOINER
0x9F => '#x06BA', # ARABIC LETTER NOON GHUNNA
0xA1 => '#x060C', # ARABIC COMMA
0xA2 => '#x00A2', # CENT SIGN
0xA3 => '#x00A3', # POUND SIGN
0xA4 => '#x00A4', # CURRENCY SIGN
0xA5 => '#x00A5', # YEN SIGN
0xA6 => '#x00A6', # BROKEN BAR
0xA7 => '#x00A7', # SECTION SIGN
0xA8 => '#x00A8', # DIAERESIS
0xA9 => '#x00A9', # COPYRIGHT SIGN
0xAA => '#x06BE', # ARABIC LETTER HEH DOACHASHMEE
0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xAC => '#x00AC', # NOT SIGN
0xAD => '#x00AD', # SOFT HYPHEN
0xAE => '#x00AE', # REGISTERED SIGN
0xAF => '#x00AF', # MACRON
0xB0 => '#x00B0', # DEGREE SIGN
0xB1 => '#x00B1', # PLUS-MINUS SIGN
0xB2 => '#x00B2', # SUPERSCRIPT TWO
0xB3 => '#x00B3', # SUPERSCRIPT THREE
0xB4 => '#x00B4', # ACUTE ACCENT
0xB5 => '#x00B5', # MICRO SIGN
0xB6 => '#x00B6', # PILCROW SIGN
0xB7 => '#x00B7', # MIDDLE DOT
0xB8 => '#x00B8', # CEDILLA
0xB9 => '#x00B9', # SUPERSCRIPT ONE
0xBA => '#x061B', # ARABIC SEMICOLON
0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xBC => '#x00BC', # VULGAR FRACTION ONE QUARTER
0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
0xBE => '#x00BE', # VULGAR FRACTION THREE QUARTERS
0xBF => '#x061F', # ARABIC QUESTION MARK
0xC0 => '#x06C1', # ARABIC LETTER HEH GOAL
0xC1 => '#x0621', # ARABIC LETTER HAMZA
0xC2 => '#x0622', # ARABIC LETTER ALEF WITH MADDA ABOVE
0xC3 => '#x0623', # ARABIC LETTER ALEF WITH HAMZA ABOVE
0xC4 => '#x0624', # ARABIC LETTER WAW WITH HAMZA ABOVE
0xC5 => '#x0625', # ARABIC LETTER ALEF WITH HAMZA BELOW
0xC6 => '#x0626', # ARABIC LETTER YEH WITH HAMZA ABOVE
0xC7 => '#x0627', # ARABIC LETTER ALEF
0xC8 => '#x0628', # ARABIC LETTER BEH
0xC9 => '#x0629', # ARABIC LETTER TEH MARBUTA
0xCA => '#x062A', # ARABIC LETTER TEH
0xCB => '#x062B', # ARABIC LETTER THEH
0xCC => '#x062C', # ARABIC LETTER JEEM
0xCD => '#x062D', # ARABIC LETTER HAH
0xCE => '#x062E', # ARABIC LETTER KHAH
0xCF => '#x062F', # ARABIC LETTER DAL
0xD0 => '#x0630', # ARABIC LETTER THAL
0xD1 => '#x0631', # ARABIC LETTER REH
0xD2 => '#x0632', # ARABIC LETTER ZAIN
0xD3 => '#x0633', # ARABIC LETTER SEEN
0xD4 => '#x0634', # ARABIC LETTER SHEEN
0xD5 => '#x0635', # ARABIC LETTER SAD
0xD6 => '#x0636', # ARABIC LETTER DAD
0xD7 => '#x00D7', # MULTIPLICATION SIGN
0xD8 => '#x0637', # ARABIC LETTER TAH
0xD9 => '#x0638', # ARABIC LETTER ZAH
0xDA => '#x0639', # ARABIC LETTER AIN
0xDB => '#x063A', # ARABIC LETTER GHAIN
0xDC => '#x0640', # ARABIC TATWEEL
0xDD => '#x0641', # ARABIC LETTER FEH
0xDE => '#x0642', # ARABIC LETTER QAF
0xDF => '#x0643', # ARABIC LETTER KAF
0xE0 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0xE1 => '#x0644', # ARABIC LETTER LAM
0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0xE3 => '#x0645', # ARABIC LETTER MEEM
0xE4 => '#x0646', # ARABIC LETTER NOON
0xE5 => '#x0647', # ARABIC LETTER HEH
0xE6 => '#x0648', # ARABIC LETTER WAW
0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
0xE8 => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0xEA => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
0xEC => '#x0649', # ARABIC LETTER ALEF MAKSURA
0xED => '#x064A', # ARABIC LETTER YEH
0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
0xEF => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
0xF0 => '#x064B', # ARABIC FATHATAN
0xF1 => '#x064C', # ARABIC DAMMATAN
0xF2 => '#x064D', # ARABIC KASRATAN
0xF3 => '#x064E', # ARABIC FATHA
0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0xF5 => '#x064F', # ARABIC DAMMA
0xF6 => '#x0650', # ARABIC KASRA
0xF7 => '#x00F7', # DIVISION SIGN
0xF8 => '#x0651', # ARABIC SHADDA
0xF9 => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0xFA => '#x0652', # ARABIC SUKUN
0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
0xFD => '#x200E', # LEFT-TO-RIGHT MARK
0xFE => '#x200F', # RIGHT-TO-LEFT MARK
0xFF => '#x06D2', # ARABIC LETTER YEH BARREE
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1257;
# WinBaltic
#
# This file evaluates to a hash reference keyed by byte value.  Each value
# is the body of a hexadecimal numeric character reference ('#xHHHH', i.e.
# without the leading '&' and the trailing ';').
#
# Every mapping is written below as a [ byte, Unicode code point ] pair;
# the map turns each pair into one "byte => '#xHHHH'" hash entry.  Bytes
# that do not appear in the list get no entry in the hash.
+{
  map { ( $_->[0] => sprintf('#x%04X', $_->[1]) ) } (
    #------------------------------------------------------------------------
    #  Byte  Unicode      Character name
    #------------------------------------------------------------------------
    [ 0x80, 0x20AC ],   # EURO SIGN
    [ 0x82, 0x201A ],   # SINGLE LOW-9 QUOTATION MARK
    [ 0x84, 0x201E ],   # DOUBLE LOW-9 QUOTATION MARK
    [ 0x85, 0x2026 ],   # HORIZONTAL ELLIPSIS
    [ 0x86, 0x2020 ],   # DAGGER
    [ 0x87, 0x2021 ],   # DOUBLE DAGGER
    [ 0x89, 0x2030 ],   # PER MILLE SIGN
    [ 0x8B, 0x2039 ],   # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
    [ 0x8D, 0x00A8 ],   # DIAERESIS
    [ 0x8E, 0x02C7 ],   # CARON
    [ 0x8F, 0x00B8 ],   # CEDILLA
    [ 0x91, 0x2018 ],   # LEFT SINGLE QUOTATION MARK
    [ 0x92, 0x2019 ],   # RIGHT SINGLE QUOTATION MARK
    [ 0x93, 0x201C ],   # LEFT DOUBLE QUOTATION MARK
    [ 0x94, 0x201D ],   # RIGHT DOUBLE QUOTATION MARK
    [ 0x95, 0x2022 ],   # BULLET
    [ 0x96, 0x2013 ],   # EN DASH
    [ 0x97, 0x2014 ],   # EM DASH
    [ 0x99, 0x2122 ],   # TRADE MARK SIGN
    [ 0x9B, 0x203A ],   # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
    [ 0x9D, 0x00AF ],   # MACRON
    [ 0x9E, 0x02DB ],   # OGONEK

    [ 0xA2, 0x00A2 ],   # CENT SIGN
    [ 0xA3, 0x00A3 ],   # POUND SIGN
    [ 0xA4, 0x00A4 ],   # CURRENCY SIGN
    [ 0xA6, 0x00A6 ],   # BROKEN BAR
    [ 0xA7, 0x00A7 ],   # SECTION SIGN
    [ 0xA8, 0x00D8 ],   # LATIN CAPITAL LETTER O WITH STROKE
    [ 0xA9, 0x00A9 ],   # COPYRIGHT SIGN
    [ 0xAA, 0x0156 ],   # LATIN CAPITAL LETTER R WITH CEDILLA
    [ 0xAB, 0x00AB ],   # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    [ 0xAC, 0x00AC ],   # NOT SIGN
    [ 0xAD, 0x00AD ],   # SOFT HYPHEN
    [ 0xAE, 0x00AE ],   # REGISTERED SIGN
    [ 0xAF, 0x00C6 ],   # LATIN CAPITAL LETTER AE

    [ 0xB0, 0x00B0 ],   # DEGREE SIGN
    [ 0xB1, 0x00B1 ],   # PLUS-MINUS SIGN
    [ 0xB2, 0x00B2 ],   # SUPERSCRIPT TWO
    [ 0xB3, 0x00B3 ],   # SUPERSCRIPT THREE
    [ 0xB4, 0x00B4 ],   # ACUTE ACCENT
    [ 0xB5, 0x00B5 ],   # MICRO SIGN
    [ 0xB6, 0x00B6 ],   # PILCROW SIGN
    [ 0xB7, 0x00B7 ],   # MIDDLE DOT
    [ 0xB8, 0x00F8 ],   # LATIN SMALL LETTER O WITH STROKE
    [ 0xB9, 0x00B9 ],   # SUPERSCRIPT ONE
    [ 0xBA, 0x0157 ],   # LATIN SMALL LETTER R WITH CEDILLA
    [ 0xBB, 0x00BB ],   # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    [ 0xBC, 0x00BC ],   # VULGAR FRACTION ONE QUARTER
    [ 0xBD, 0x00BD ],   # VULGAR FRACTION ONE HALF
    [ 0xBE, 0x00BE ],   # VULGAR FRACTION THREE QUARTERS
    [ 0xBF, 0x00E6 ],   # LATIN SMALL LETTER AE

    [ 0xC0, 0x0104 ],   # LATIN CAPITAL LETTER A WITH OGONEK
    [ 0xC1, 0x012E ],   # LATIN CAPITAL LETTER I WITH OGONEK
    [ 0xC2, 0x0100 ],   # LATIN CAPITAL LETTER A WITH MACRON
    [ 0xC3, 0x0106 ],   # LATIN CAPITAL LETTER C WITH ACUTE
    [ 0xC4, 0x00C4 ],   # LATIN CAPITAL LETTER A WITH DIAERESIS
    [ 0xC5, 0x00C5 ],   # LATIN CAPITAL LETTER A WITH RING ABOVE
    [ 0xC6, 0x0118 ],   # LATIN CAPITAL LETTER E WITH OGONEK
    [ 0xC7, 0x0112 ],   # LATIN CAPITAL LETTER E WITH MACRON
    [ 0xC8, 0x010C ],   # LATIN CAPITAL LETTER C WITH CARON
    [ 0xC9, 0x00C9 ],   # LATIN CAPITAL LETTER E WITH ACUTE
    [ 0xCA, 0x0179 ],   # LATIN CAPITAL LETTER Z WITH ACUTE
    [ 0xCB, 0x0116 ],   # LATIN CAPITAL LETTER E WITH DOT ABOVE
    [ 0xCC, 0x0122 ],   # LATIN CAPITAL LETTER G WITH CEDILLA
    [ 0xCD, 0x0136 ],   # LATIN CAPITAL LETTER K WITH CEDILLA
    [ 0xCE, 0x012A ],   # LATIN CAPITAL LETTER I WITH MACRON
    [ 0xCF, 0x013B ],   # LATIN CAPITAL LETTER L WITH CEDILLA

    [ 0xD0, 0x0160 ],   # LATIN CAPITAL LETTER S WITH CARON
    [ 0xD1, 0x0143 ],   # LATIN CAPITAL LETTER N WITH ACUTE
    [ 0xD2, 0x0145 ],   # LATIN CAPITAL LETTER N WITH CEDILLA
    [ 0xD3, 0x00D3 ],   # LATIN CAPITAL LETTER O WITH ACUTE
    [ 0xD4, 0x014C ],   # LATIN CAPITAL LETTER O WITH MACRON
    [ 0xD5, 0x00D5 ],   # LATIN CAPITAL LETTER O WITH TILDE
    [ 0xD6, 0x00D6 ],   # LATIN CAPITAL LETTER O WITH DIAERESIS
    [ 0xD7, 0x00D7 ],   # MULTIPLICATION SIGN
    [ 0xD8, 0x0172 ],   # LATIN CAPITAL LETTER U WITH OGONEK
    [ 0xD9, 0x0141 ],   # LATIN CAPITAL LETTER L WITH STROKE
    [ 0xDA, 0x015A ],   # LATIN CAPITAL LETTER S WITH ACUTE
    [ 0xDB, 0x016A ],   # LATIN CAPITAL LETTER U WITH MACRON
    [ 0xDC, 0x00DC ],   # LATIN CAPITAL LETTER U WITH DIAERESIS
    [ 0xDD, 0x017B ],   # LATIN CAPITAL LETTER Z WITH DOT ABOVE
    [ 0xDE, 0x017D ],   # LATIN CAPITAL LETTER Z WITH CARON
    [ 0xDF, 0x00DF ],   # LATIN SMALL LETTER SHARP S

    [ 0xE0, 0x0105 ],   # LATIN SMALL LETTER A WITH OGONEK
    [ 0xE1, 0x012F ],   # LATIN SMALL LETTER I WITH OGONEK
    [ 0xE2, 0x0101 ],   # LATIN SMALL LETTER A WITH MACRON
    [ 0xE3, 0x0107 ],   # LATIN SMALL LETTER C WITH ACUTE
    [ 0xE4, 0x00E4 ],   # LATIN SMALL LETTER A WITH DIAERESIS
    [ 0xE5, 0x00E5 ],   # LATIN SMALL LETTER A WITH RING ABOVE
    [ 0xE6, 0x0119 ],   # LATIN SMALL LETTER E WITH OGONEK
    [ 0xE7, 0x0113 ],   # LATIN SMALL LETTER E WITH MACRON
    [ 0xE8, 0x010D ],   # LATIN SMALL LETTER C WITH CARON
    [ 0xE9, 0x00E9 ],   # LATIN SMALL LETTER E WITH ACUTE
    [ 0xEA, 0x017A ],   # LATIN SMALL LETTER Z WITH ACUTE
    [ 0xEB, 0x0117 ],   # LATIN SMALL LETTER E WITH DOT ABOVE
    [ 0xEC, 0x0123 ],   # LATIN SMALL LETTER G WITH CEDILLA
    [ 0xED, 0x0137 ],   # LATIN SMALL LETTER K WITH CEDILLA
    [ 0xEE, 0x012B ],   # LATIN SMALL LETTER I WITH MACRON
    [ 0xEF, 0x013C ],   # LATIN SMALL LETTER L WITH CEDILLA

    [ 0xF0, 0x0161 ],   # LATIN SMALL LETTER S WITH CARON
    [ 0xF1, 0x0144 ],   # LATIN SMALL LETTER N WITH ACUTE
    [ 0xF2, 0x0146 ],   # LATIN SMALL LETTER N WITH CEDILLA
    [ 0xF3, 0x00F3 ],   # LATIN SMALL LETTER O WITH ACUTE
    [ 0xF4, 0x014D ],   # LATIN SMALL LETTER O WITH MACRON
    [ 0xF5, 0x00F5 ],   # LATIN SMALL LETTER O WITH TILDE
    [ 0xF6, 0x00F6 ],   # LATIN SMALL LETTER O WITH DIAERESIS
    [ 0xF7, 0x00F7 ],   # DIVISION SIGN
    [ 0xF8, 0x0173 ],   # LATIN SMALL LETTER U WITH OGONEK
    [ 0xF9, 0x0142 ],   # LATIN SMALL LETTER L WITH STROKE
    [ 0xFA, 0x015B ],   # LATIN SMALL LETTER S WITH ACUTE
    [ 0xFB, 0x016B ],   # LATIN SMALL LETTER U WITH MACRON
    [ 0xFC, 0x00FC ],   # LATIN SMALL LETTER U WITH DIAERESIS
    [ 0xFD, 0x017C ],   # LATIN SMALL LETTER Z WITH DOT ABOVE
    [ 0xFE, 0x017E ],   # LATIN SMALL LETTER Z WITH CARON
    [ 0xFF, 0x02D9 ],   # DOT ABOVE
  )
};
--- NEW FILE ---
package MHonArc::CharEnt::CP1258;
# WinVietnamese
#
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# The table is assembled in three layers.  Later entries in the hash
# constructor replace earlier ones that use the same key, so the override
# section deliberately follows the generated defaults.
+{
  #--------------------------------------------------------------------------
  # 1. Defaults for 0xA1 .. 0xFF: the code point equals the byte value.
  #--------------------------------------------------------------------------
  ( map { ( $_ => sprintf('#x%04X', $_) ) } 0xA1 .. 0xFF ),

  #--------------------------------------------------------------------------
  # 2. Positions in 0xA1 .. 0xFF whose code point differs from the byte.
  #--------------------------------------------------------------------------
  0xC3 => '#x0102',   # LATIN CAPITAL LETTER A WITH BREVE
  0xCC => '#x0300',   # COMBINING GRAVE ACCENT
  0xD0 => '#x0110',   # LATIN CAPITAL LETTER D WITH STROKE
  0xD2 => '#x0309',   # COMBINING HOOK ABOVE
  0xD5 => '#x01A0',   # LATIN CAPITAL LETTER O WITH HORN
  0xDD => '#x01AF',   # LATIN CAPITAL LETTER U WITH HORN
  0xDE => '#x0303',   # COMBINING TILDE
  0xE3 => '#x0103',   # LATIN SMALL LETTER A WITH BREVE
  0xEC => '#x0301',   # COMBINING ACUTE ACCENT
  0xF0 => '#x0111',   # LATIN SMALL LETTER D WITH STROKE
  0xF2 => '#x0323',   # COMBINING DOT BELOW
  0xF5 => '#x01A1',   # LATIN SMALL LETTER O WITH HORN
  0xFD => '#x01B0',   # LATIN SMALL LETTER U WITH HORN
  0xFE => '#x20AB',   # DONG SIGN

  #--------------------------------------------------------------------------
  # 3. Mapped positions in 0x80 .. 0x9F (bytes not listed stay unmapped).
  #--------------------------------------------------------------------------
  0x80 => '#x20AC',   # EURO SIGN
  0x82 => '#x201A',   # SINGLE LOW-9 QUOTATION MARK
  0x83 => '#x0192',   # LATIN SMALL LETTER F WITH HOOK
  0x84 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
  0x85 => '#x2026',   # HORIZONTAL ELLIPSIS
  0x86 => '#x2020',   # DAGGER
  0x87 => '#x2021',   # DOUBLE DAGGER
  0x88 => '#x02C6',   # MODIFIER LETTER CIRCUMFLEX ACCENT
  0x89 => '#x2030',   # PER MILLE SIGN
  0x8B => '#x2039',   # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
  0x8C => '#x0152',   # LATIN CAPITAL LIGATURE OE
  0x91 => '#x2018',   # LEFT SINGLE QUOTATION MARK
  0x92 => '#x2019',   # RIGHT SINGLE QUOTATION MARK
  0x93 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
  0x94 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
  0x95 => '#x2022',   # BULLET
  0x96 => '#x2013',   # EN DASH
  0x97 => '#x2014',   # EM DASH
  0x98 => '#x02DC',   # SMALL TILDE
  0x99 => '#x2122',   # TRADE MARK SIGN
  0x9B => '#x203A',   # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
  0x9C => '#x0153',   # LATIN SMALL LIGATURE OE
  0x9F => '#x0178',   # LATIN CAPITAL LETTER Y WITH DIAERESIS
};
--- NEW FILE ---
package MHonArc::CharEnt::GOST19768_87;
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# Every Cyrillic position in this table lies exactly 0x0360 below its
# Unicode code point, so those entries are computed from the byte ranges
# instead of being listed one by one.  Bytes outside the listed ranges get
# no entry.
+{
  0x24 => '#x00A4',     # CURRENCY SIGN

  ( map { ( $_ => sprintf('#x%04X', $_ + 0x0360) ) } (
      0xA1,             # U+0401          CYRILLIC CAPITAL LETTER IO
      0xB0 .. 0xCF,     # U+0410..U+042F  CYRILLIC CAPITAL LETTER A .. YA
      0xD0 .. 0xEF,     # U+0430..U+044F  CYRILLIC SMALL LETTER A .. YA
      0xF1,             # U+0451          CYRILLIC SMALL LETTER IO
  ) ),
};
--- NEW FILE ---
package MHonArc::CharEnt::ISO8859_11;
# Thai
#
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# Both mapped byte ranges sit at a constant distance of 0x0D60 below their
# Unicode code points (0xA1 -> U+0E01, 0xFB -> U+0E5B), so the entries are
# generated rather than spelled out.  Bytes 0xDB .. 0xDE and 0xFC .. 0xFF
# are left without an entry, as is everything below 0xA1.
+{
  map { ( $_ => sprintf('#x%04X', $_ + 0x0D60) ) } (
    # U+0E01 THAI CHARACTER KO KAI .. U+0E3A THAI CHARACTER PHINTHU
    0xA1 .. 0xDA,

    # U+0E3F THAI CURRENCY SYMBOL BAHT .. U+0E5B THAI CHARACTER KHOMUT
    # (includes 0xF0 .. 0xF9 => THAI DIGIT ZERO .. THAI DIGIT NINE)
    0xDF .. 0xFB,
  )
};
--- NEW FILE ---
package MHonArc::CharEnt::ISO8859_13;
# Latin7 (Baltic Rim)
#
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# Construction: every byte 0xA1 .. 0xFF first receives the code point equal
# to its own value; the explicit entries that follow then replace the
# positions where this charset differs (a later key in the hash constructor
# wins over an earlier one).
+{
  ( map { ( $_ => sprintf('#x%04X', $_) ) } 0xA1 .. 0xFF ),

  #--------------------------------------------------------------------------
  # Hex Code  Entity Ref   # Character name (positions differing from above)
  #--------------------------------------------------------------------------
  0xA1 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
  0xA5 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
  0xA8 => '#x00D8',   # LATIN CAPITAL LETTER O WITH STROKE
  0xAA => '#x0156',   # LATIN CAPITAL LETTER R WITH CEDILLA
  0xAF => '#x00C6',   # LATIN CAPITAL LETTER AE
  0xB4 => '#x201C',   # LEFT DOUBLE QUOTATION MARK
  0xB8 => '#x00F8',   # LATIN SMALL LETTER O WITH STROKE
  0xBA => '#x0157',   # LATIN SMALL LETTER R WITH CEDILLA
  0xBF => '#x00E6',   # LATIN SMALL LETTER AE

  0xC0 => '#x0104',   # LATIN CAPITAL LETTER A WITH OGONEK
  0xC1 => '#x012E',   # LATIN CAPITAL LETTER I WITH OGONEK
  0xC2 => '#x0100',   # LATIN CAPITAL LETTER A WITH MACRON
  0xC3 => '#x0106',   # LATIN CAPITAL LETTER C WITH ACUTE
  0xC6 => '#x0118',   # LATIN CAPITAL LETTER E WITH OGONEK
  0xC7 => '#x0112',   # LATIN CAPITAL LETTER E WITH MACRON
  0xC8 => '#x010C',   # LATIN CAPITAL LETTER C WITH CARON
  0xCA => '#x0179',   # LATIN CAPITAL LETTER Z WITH ACUTE
  0xCB => '#x0116',   # LATIN CAPITAL LETTER E WITH DOT ABOVE
  0xCC => '#x0122',   # LATIN CAPITAL LETTER G WITH CEDILLA
  0xCD => '#x0136',   # LATIN CAPITAL LETTER K WITH CEDILLA
  0xCE => '#x012A',   # LATIN CAPITAL LETTER I WITH MACRON
  0xCF => '#x013B',   # LATIN CAPITAL LETTER L WITH CEDILLA

  0xD0 => '#x0160',   # LATIN CAPITAL LETTER S WITH CARON
  0xD1 => '#x0143',   # LATIN CAPITAL LETTER N WITH ACUTE
  0xD2 => '#x0145',   # LATIN CAPITAL LETTER N WITH CEDILLA
  0xD4 => '#x014C',   # LATIN CAPITAL LETTER O WITH MACRON
  0xD8 => '#x0172',   # LATIN CAPITAL LETTER U WITH OGONEK
  0xD9 => '#x0141',   # LATIN CAPITAL LETTER L WITH STROKE
  0xDA => '#x015A',   # LATIN CAPITAL LETTER S WITH ACUTE
  0xDB => '#x016A',   # LATIN CAPITAL LETTER U WITH MACRON
  0xDD => '#x017B',   # LATIN CAPITAL LETTER Z WITH DOT ABOVE
  0xDE => '#x017D',   # LATIN CAPITAL LETTER Z WITH CARON

  0xE0 => '#x0105',   # LATIN SMALL LETTER A WITH OGONEK
  0xE1 => '#x012F',   # LATIN SMALL LETTER I WITH OGONEK
  0xE2 => '#x0101',   # LATIN SMALL LETTER A WITH MACRON
  0xE3 => '#x0107',   # LATIN SMALL LETTER C WITH ACUTE
  0xE6 => '#x0119',   # LATIN SMALL LETTER E WITH OGONEK
  0xE7 => '#x0113',   # LATIN SMALL LETTER E WITH MACRON
  0xE8 => '#x010D',   # LATIN SMALL LETTER C WITH CARON
  0xEA => '#x017A',   # LATIN SMALL LETTER Z WITH ACUTE
  0xEB => '#x0117',   # LATIN SMALL LETTER E WITH DOT ABOVE
  0xEC => '#x0123',   # LATIN SMALL LETTER G WITH CEDILLA
  0xED => '#x0137',   # LATIN SMALL LETTER K WITH CEDILLA
  0xEE => '#x012B',   # LATIN SMALL LETTER I WITH MACRON
  0xEF => '#x013C',   # LATIN SMALL LETTER L WITH CEDILLA

  0xF0 => '#x0161',   # LATIN SMALL LETTER S WITH CARON
  0xF1 => '#x0144',   # LATIN SMALL LETTER N WITH ACUTE
  0xF2 => '#x0146',   # LATIN SMALL LETTER N WITH CEDILLA
  0xF4 => '#x014D',   # LATIN SMALL LETTER O WITH MACRON
  0xF8 => '#x0173',   # LATIN SMALL LETTER U WITH OGONEK
  0xF9 => '#x0142',   # LATIN SMALL LETTER L WITH STROKE
  0xFA => '#x015B',   # LATIN SMALL LETTER S WITH ACUTE
  0xFB => '#x016B',   # LATIN SMALL LETTER U WITH MACRON
  0xFD => '#x017C',   # LATIN SMALL LETTER Z WITH DOT ABOVE
  0xFE => '#x017E',   # LATIN SMALL LETTER Z WITH CARON
  0xFF => '#x2019',   # RIGHT SINGLE QUOTATION MARK
};
--- NEW FILE ---
package MHonArc::CharEnt::ISO8859_14;
# Latin8 (Celtic)
#
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# Construction: bytes 0xA1 .. 0xFF are first given the code point equal to
# their own value; the explicit entries afterwards replace the positions
# that this charset assigns differently (a later key in the hash constructor
# wins over an earlier one).
+{
  ( map { ( $_ => sprintf('#x%04X', $_) ) } 0xA1 .. 0xFF ),

  #--------------------------------------------------------------------------
  # Hex Code  Entity Ref   # Character name (positions differing from above)
  #--------------------------------------------------------------------------
  0xA1 => '#x1E02',   # LATIN CAPITAL LETTER B WITH DOT ABOVE
  0xA2 => '#x1E03',   # LATIN SMALL LETTER B WITH DOT ABOVE
  0xA4 => '#x010A',   # LATIN CAPITAL LETTER C WITH DOT ABOVE
  0xA5 => '#x010B',   # LATIN SMALL LETTER C WITH DOT ABOVE
  0xA6 => '#x1E0A',   # LATIN CAPITAL LETTER D WITH DOT ABOVE
  0xA8 => '#x1E80',   # LATIN CAPITAL LETTER W WITH GRAVE
  0xAA => '#x1E82',   # LATIN CAPITAL LETTER W WITH ACUTE
  0xAB => '#x1E0B',   # LATIN SMALL LETTER D WITH DOT ABOVE
  0xAC => '#x1EF2',   # LATIN CAPITAL LETTER Y WITH GRAVE
  0xAF => '#x0178',   # LATIN CAPITAL LETTER Y WITH DIAERESIS

  0xB0 => '#x1E1E',   # LATIN CAPITAL LETTER F WITH DOT ABOVE
  0xB1 => '#x1E1F',   # LATIN SMALL LETTER F WITH DOT ABOVE
  0xB2 => '#x0120',   # LATIN CAPITAL LETTER G WITH DOT ABOVE
  0xB3 => '#x0121',   # LATIN SMALL LETTER G WITH DOT ABOVE
  0xB4 => '#x1E40',   # LATIN CAPITAL LETTER M WITH DOT ABOVE
  0xB5 => '#x1E41',   # LATIN SMALL LETTER M WITH DOT ABOVE
  0xB7 => '#x1E56',   # LATIN CAPITAL LETTER P WITH DOT ABOVE
  0xB8 => '#x1E81',   # LATIN SMALL LETTER W WITH GRAVE
  0xB9 => '#x1E57',   # LATIN SMALL LETTER P WITH DOT ABOVE
  0xBA => '#x1E83',   # LATIN SMALL LETTER W WITH ACUTE
  0xBB => '#x1E60',   # LATIN CAPITAL LETTER S WITH DOT ABOVE
  0xBC => '#x1EF3',   # LATIN SMALL LETTER Y WITH GRAVE
  0xBD => '#x1E84',   # LATIN CAPITAL LETTER W WITH DIAERESIS
  0xBE => '#x1E85',   # LATIN SMALL LETTER W WITH DIAERESIS
  0xBF => '#x1E61',   # LATIN SMALL LETTER S WITH DOT ABOVE

  0xD0 => '#x0174',   # LATIN CAPITAL LETTER W WITH CIRCUMFLEX
  0xD7 => '#x1E6A',   # LATIN CAPITAL LETTER T WITH DOT ABOVE
  0xDE => '#x0176',   # LATIN CAPITAL LETTER Y WITH CIRCUMFLEX

  0xF0 => '#x0175',   # LATIN SMALL LETTER W WITH CIRCUMFLEX
  0xF7 => '#x1E6B',   # LATIN SMALL LETTER T WITH DOT ABOVE
  0xFE => '#x0177',   # LATIN SMALL LETTER Y WITH CIRCUMFLEX
};
--- NEW FILE ---
package MHonArc::CharEnt::ISO8859_16;
# This file evaluates to a hash reference: byte value => body of a
# hexadecimal numeric character reference ('#xHHHH', no '&' or ';').
#
# Construction: bytes 0xA1 .. 0xFF are first given the code point equal to
# their own value; the explicit entries afterwards replace the positions
# that this charset assigns differently (a later key in the hash constructor
# wins over an earlier one).
+{
  ( map { ( $_ => sprintf('#x%04X', $_) ) } 0xA1 .. 0xFF ),

  #--------------------------------------------------------------------------
  # Hex Code  Entity Ref   # Character name (positions differing from above)
  #--------------------------------------------------------------------------
  0xA1 => '#x0104',   # LATIN CAPITAL LETTER A WITH OGONEK
  0xA2 => '#x0105',   # LATIN SMALL LETTER A WITH OGONEK
  0xA3 => '#x0141',   # LATIN CAPITAL LETTER L WITH STROKE
  0xA4 => '#x20AC',   # EURO SIGN
  0xA5 => '#x201E',   # DOUBLE LOW-9 QUOTATION MARK
  0xA6 => '#x0160',   # LATIN CAPITAL LETTER S WITH CARON
  0xA8 => '#x0161',   # LATIN SMALL LETTER S WITH CARON
  0xAA => '#x0218',   # LATIN CAPITAL LETTER S WITH COMMA BELOW
  0xAC => '#x0179',   # LATIN CAPITAL LETTER Z WITH ACUTE
  0xAE => '#x017A',   # LATIN SMALL LETTER Z WITH ACUTE
  0xAF => '#x017B',   # LATIN CAPITAL LETTER Z WITH DOT ABOVE

  0xB2 => '#x010C',   # LATIN CAPITAL LETTER C WITH CARON
  0xB3 => '#x0142',   # LATIN SMALL LETTER L WITH STROKE
  0xB4 => '#x017D',   # LATIN CAPITAL LETTER Z WITH CARON
  0xB5 => '#x201D',   # RIGHT DOUBLE QUOTATION MARK
  0xB8 => '#x017E',   # LATIN SMALL LETTER Z WITH CARON
  0xB9 => '#x010D',   # LATIN SMALL LETTER C WITH CARON
  0xBA => '#x0219',   # LATIN SMALL LETTER S WITH COMMA BELOW
  0xBC => '#x0152',   # LATIN CAPITAL LIGATURE OE
  0xBD => '#x0153',   # LATIN SMALL LIGATURE OE
  0xBE => '#x0178',   # LATIN CAPITAL LETTER Y WITH DIAERESIS
  0xBF => '#x017C',   # LATIN SMALL LETTER Z WITH DOT ABOVE

  0xC3 => '#x0102',   # LATIN CAPITAL LETTER A WITH BREVE
  0xC5 => '#x0106',   # LATIN CAPITAL LETTER C WITH ACUTE

  0xD0 => '#x0110',   # LATIN CAPITAL LETTER D WITH STROKE
  0xD1 => '#x0143',   # LATIN CAPITAL LETTER N WITH ACUTE
  0xD5 => '#x0150',   # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
  0xD7 => '#x015A',   # LATIN CAPITAL LETTER S WITH ACUTE
  0xD8 => '#x0170',   # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
  0xDD => '#x0118',   # LATIN CAPITAL LETTER E WITH OGONEK
  0xDE => '#x021A',   # LATIN CAPITAL LETTER T WITH COMMA BELOW

  0xE3 => '#x0103',   # LATIN SMALL LETTER A WITH BREVE
  0xE5 => '#x0107',   # LATIN SMALL LETTER C WITH ACUTE

  0xF0 => '#x0111',   # LATIN SMALL LETTER D WITH STROKE
  0xF1 => '#x0144',   # LATIN SMALL LETTER N WITH ACUTE
  0xF5 => '#x0151',   # LATIN SMALL LETTER O WITH DOUBLE ACUTE
  0xF7 => '#x015B',   # LATIN SMALL LETTER S WITH ACUTE
  0xF8 => '#x0171',   # LATIN SMALL LETTER U WITH DOUBLE ACUTE
  0xFD => '#x0119',   # LATIN SMALL LETTER E WITH OGONEK
  0xFE => '#x021B',   # LATIN SMALL LETTER T WITH COMMA BELOW
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_A;

# KOI8-A character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Codes without an entry are
# simply not part of this table.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Symbol -----------------------------------------------------------
    0x24 => '#x00A4',       # CURRENCY SIGN

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFE) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_B;

# KOI8-B character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Codes without an entry are
# simply not part of this table.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Letter IO (small and capital) ------------------------------------
    0xA3 => '#x0451',       # CYRILLIC SMALL LETTER IO
    0xB3 => '#x0401',       # CYRILLIC CAPITAL LETTER IO

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFF) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
    0xFF => '#x042A',       # CYRILLIC CAPITAL LETTER HARD SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_E;

# KOI8-E character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Codes without an entry
# (for example 0xA0, 0xAD and 0xBD) are simply not part of this table.
#
# Every description must stay on the same line as its '#': a wrapped
# comment tail is parsed as Perl code and breaks the file.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Additional Cyrillic small letters (0xA1 .. 0xAF) -----------------
    0xA1 => '#x0452',       # CYRILLIC SMALL LETTER DJE
    0xA2 => '#x0453',       # CYRILLIC SMALL LETTER GJE
    0xA3 => '#x0451',       # CYRILLIC SMALL LETTER IO
    0xA4 => '#x0454',       # CYRILLIC SMALL LETTER UKRAINIAN IE
    0xA5 => '#x0455',       # CYRILLIC SMALL LETTER DZE
    0xA6 => '#x0456',       # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
    0xA7 => '#x0457',       # CYRILLIC SMALL LETTER YI
    0xA8 => '#x0458',       # CYRILLIC SMALL LETTER JE
    0xA9 => '#x0459',       # CYRILLIC SMALL LETTER LJE
    0xAA => '#x045A',       # CYRILLIC SMALL LETTER NJE
    0xAB => '#x045B',       # CYRILLIC SMALL LETTER TSHE
    0xAC => '#x045C',       # CYRILLIC SMALL LETTER KJE
    0xAE => '#x045E',       # CYRILLIC SMALL LETTER SHORT U
    0xAF => '#x045F',       # CYRILLIC SMALL LETTER DZHE

    # -- Numero sign and additional Cyrillic capitals (0xB0 .. 0xBF) ------
    0xB0 => '#x2116',       # NUMERO SIGN
    0xB1 => '#x0402',       # CYRILLIC CAPITAL LETTER DJE
    0xB2 => '#x0403',       # CYRILLIC CAPITAL LETTER GJE
    0xB3 => '#x0401',       # CYRILLIC CAPITAL LETTER IO
    0xB4 => '#x0404',       # CYRILLIC CAPITAL LETTER UKRAINIAN IE
    0xB5 => '#x0405',       # CYRILLIC CAPITAL LETTER DZE
    0xB6 => '#x0406',       # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
    0xB7 => '#x0407',       # CYRILLIC CAPITAL LETTER YI
    0xB8 => '#x0408',       # CYRILLIC CAPITAL LETTER JE
    0xB9 => '#x0409',       # CYRILLIC CAPITAL LETTER LJE
    0xBA => '#x040A',       # CYRILLIC CAPITAL LETTER NJE
    0xBB => '#x040B',       # CYRILLIC CAPITAL LETTER TSHE
    0xBC => '#x040C',       # CYRILLIC CAPITAL LETTER KJE
    0xBE => '#x040E',       # CYRILLIC CAPITAL LETTER SHORT U
    0xBF => '#x040F',       # CYRILLIC CAPITAL LETTER DZHE

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFF) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
    0xFF => '#x042A',       # CYRILLIC CAPITAL LETTER HARD SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_F;

# KOI8-F character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Codes without an entry
# (for example 0xA0) are simply not part of this table.
#
# Every description must stay on the same line as its '#': a wrapped
# comment tail is parsed as Perl code and breaks the file.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Box drawing and block elements (0x80 .. 0x90) --------------------
    0x80 => '#x2500',       # BOX DRAWINGS LIGHT HORIZONTAL
    0x81 => '#x2502',       # BOX DRAWINGS LIGHT VERTICAL
    0x82 => '#x250C',       # BOX DRAWINGS LIGHT DOWN AND RIGHT
    0x83 => '#x2510',       # BOX DRAWINGS LIGHT DOWN AND LEFT
    0x84 => '#x2514',       # BOX DRAWINGS LIGHT UP AND RIGHT
    0x85 => '#x2518',       # BOX DRAWINGS LIGHT UP AND LEFT
    0x86 => '#x251C',       # BOX DRAWINGS LIGHT VERTICAL AND RIGHT
    0x87 => '#x2524',       # BOX DRAWINGS LIGHT VERTICAL AND LEFT
    0x88 => '#x252C',       # BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
    0x89 => '#x2534',       # BOX DRAWINGS LIGHT UP AND HORIZONTAL
    0x8A => '#x253C',       # BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
    0x8B => '#x2580',       # UPPER HALF BLOCK
    0x8C => '#x2584',       # LOWER HALF BLOCK
    0x8D => '#x2588',       # FULL BLOCK
    0x8E => '#x258C',       # LEFT HALF BLOCK
    0x8F => '#x2590',       # RIGHT HALF BLOCK
    0x90 => '#x2591',       # LIGHT SHADE

    # -- Punctuation and symbols (0x91 .. 0x9F) ---------------------------
    0x91 => '#x2018',       # LEFT SINGLE QUOTATION MARK
    0x92 => '#x2019',       # RIGHT SINGLE QUOTATION MARK
    0x93 => '#x201C',       # LEFT DOUBLE QUOTATION MARK
    0x94 => '#x201D',       # RIGHT DOUBLE QUOTATION MARK
    0x95 => '#x2022',       # BULLET
    0x96 => '#x2013',       # EN DASH
    0x97 => '#x2014',       # EM DASH
    0x98 => '#x00A9',       # COPYRIGHT SIGN
    0x99 => '#x2122',       # TRADE MARK SIGN
    0x9A => '#x00A0',       # NO-BREAK SPACE
    0x9B => '#x00BB',       # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    0x9C => '#x00AE',       # REGISTERED SIGN
    0x9D => '#x00AB',       # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    0x9E => '#x00B7',       # MIDDLE DOT
    0x9F => '#x00A4',       # CURRENCY SIGN

    # -- Additional Cyrillic small letters (0xA1 .. 0xAF) -----------------
    0xA1 => '#x0452',       # CYRILLIC SMALL LETTER DJE
    0xA2 => '#x0453',       # CYRILLIC SMALL LETTER GJE
    0xA3 => '#x0451',       # CYRILLIC SMALL LETTER IO
    0xA4 => '#x0454',       # CYRILLIC SMALL LETTER UKRAINIAN IE
    0xA5 => '#x0455',       # CYRILLIC SMALL LETTER DZE
    0xA6 => '#x0456',       # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
    0xA7 => '#x0457',       # CYRILLIC SMALL LETTER YI
    0xA8 => '#x0458',       # CYRILLIC SMALL LETTER JE
    0xA9 => '#x0459',       # CYRILLIC SMALL LETTER LJE
    0xAA => '#x045A',       # CYRILLIC SMALL LETTER NJE
    0xAB => '#x045B',       # CYRILLIC SMALL LETTER TSHE
    0xAC => '#x045C',       # CYRILLIC SMALL LETTER KJE
    0xAD => '#x0491',       # CYRILLIC SMALL LETTER GHE WITH UPTURN
    0xAE => '#x045E',       # CYRILLIC SMALL LETTER SHORT U
    0xAF => '#x045F',       # CYRILLIC SMALL LETTER DZHE

    # -- Numero sign and additional Cyrillic capitals (0xB0 .. 0xBF) ------
    0xB0 => '#x2116',       # NUMERO SIGN
    0xB1 => '#x0402',       # CYRILLIC CAPITAL LETTER DJE
    0xB2 => '#x0403',       # CYRILLIC CAPITAL LETTER GJE
    0xB3 => '#x0401',       # CYRILLIC CAPITAL LETTER IO
    0xB4 => '#x0404',       # CYRILLIC CAPITAL LETTER UKRAINIAN IE
    0xB5 => '#x0405',       # CYRILLIC CAPITAL LETTER DZE
    0xB6 => '#x0406',       # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
    0xB7 => '#x0407',       # CYRILLIC CAPITAL LETTER YI
    0xB8 => '#x0408',       # CYRILLIC CAPITAL LETTER JE
    0xB9 => '#x0409',       # CYRILLIC CAPITAL LETTER LJE
    0xBA => '#x040A',       # CYRILLIC CAPITAL LETTER NJE
    0xBB => '#x040B',       # CYRILLIC CAPITAL LETTER TSHE
    0xBC => '#x040C',       # CYRILLIC CAPITAL LETTER KJE
    0xBD => '#x0490',       # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
    0xBE => '#x040E',       # CYRILLIC CAPITAL LETTER SHORT U
    0xBF => '#x040F',       # CYRILLIC CAPITAL LETTER DZHE

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFF) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
    0xFF => '#x042A',       # CYRILLIC CAPITAL LETTER HARD SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_R;

# KOI8-R character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Every code from 0x80 to 0xFF
# has an entry.
#
# Every description must stay on the same line as its '#': a wrapped
# comment tail is parsed as Perl code and breaks the file.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Light box drawing, blocks and shades (0x80 .. 0x92) --------------
    0x80 => '#x2500',       # BOX DRAWINGS LIGHT HORIZONTAL
    0x81 => '#x2502',       # BOX DRAWINGS LIGHT VERTICAL
    0x82 => '#x250C',       # BOX DRAWINGS LIGHT DOWN AND RIGHT
    0x83 => '#x2510',       # BOX DRAWINGS LIGHT DOWN AND LEFT
    0x84 => '#x2514',       # BOX DRAWINGS LIGHT UP AND RIGHT
    0x85 => '#x2518',       # BOX DRAWINGS LIGHT UP AND LEFT
    0x86 => '#x251C',       # BOX DRAWINGS LIGHT VERTICAL AND RIGHT
    0x87 => '#x2524',       # BOX DRAWINGS LIGHT VERTICAL AND LEFT
    0x88 => '#x252C',       # BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
    0x89 => '#x2534',       # BOX DRAWINGS LIGHT UP AND HORIZONTAL
    0x8A => '#x253C',       # BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
    0x8B => '#x2580',       # UPPER HALF BLOCK
    0x8C => '#x2584',       # LOWER HALF BLOCK
    0x8D => '#x2588',       # FULL BLOCK
    0x8E => '#x258C',       # LEFT HALF BLOCK
    0x8F => '#x2590',       # RIGHT HALF BLOCK
    0x90 => '#x2591',       # LIGHT SHADE
    0x91 => '#x2592',       # MEDIUM SHADE
    0x92 => '#x2593',       # DARK SHADE

    # -- Mathematical and other symbols (0x93 .. 0x9F) --------------------
    0x93 => '#x2320',       # TOP HALF INTEGRAL
    0x94 => '#x25A0',       # BLACK SQUARE
    0x95 => '#x2022',       # BULLET
    0x96 => '#x221A',       # SQUARE ROOT
    0x97 => '#x2248',       # ALMOST EQUAL TO
    0x98 => '#x2264',       # LESS-THAN OR EQUAL TO
    0x99 => '#x2265',       # GREATER-THAN OR EQUAL TO
    0x9A => '#x00A0',       # NO-BREAK SPACE
    0x9B => '#x2321',       # BOTTOM HALF INTEGRAL
    0x9C => '#x00B0',       # DEGREE SIGN
    0x9D => '#x00B2',       # SUPERSCRIPT TWO
    0x9E => '#x00B7',       # MIDDLE DOT
    0x9F => '#x00F7',       # DIVISION SIGN

    # -- Double box drawing, letter IO, copyright (0xA0 .. 0xBF) ----------
    0xA0 => '#x2550',       # BOX DRAWINGS DOUBLE HORIZONTAL
    0xA1 => '#x2551',       # BOX DRAWINGS DOUBLE VERTICAL
    0xA2 => '#x2552',       # BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE
    0xA3 => '#x0451',       # CYRILLIC SMALL LETTER IO
    0xA4 => '#x2553',       # BOX DRAWINGS DOWN DOUBLE AND RIGHT SINGLE
    0xA5 => '#x2554',       # BOX DRAWINGS DOUBLE DOWN AND RIGHT
    0xA6 => '#x2555',       # BOX DRAWINGS DOWN SINGLE AND LEFT DOUBLE
    0xA7 => '#x2556',       # BOX DRAWINGS DOWN DOUBLE AND LEFT SINGLE
    0xA8 => '#x2557',       # BOX DRAWINGS DOUBLE DOWN AND LEFT
    0xA9 => '#x2558',       # BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE
    0xAA => '#x2559',       # BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE
    0xAB => '#x255A',       # BOX DRAWINGS DOUBLE UP AND RIGHT
    0xAC => '#x255B',       # BOX DRAWINGS UP SINGLE AND LEFT DOUBLE
    0xAD => '#x255C',       # BOX DRAWINGS UP DOUBLE AND LEFT SINGLE
    0xAE => '#x255D',       # BOX DRAWINGS DOUBLE UP AND LEFT
    0xAF => '#x255E',       # BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
    0xB0 => '#x255F',       # BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
    0xB1 => '#x2560',       # BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
    0xB2 => '#x2561',       # BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
    0xB3 => '#x0401',       # CYRILLIC CAPITAL LETTER IO
    0xB4 => '#x2562',       # BOX DRAWINGS VERTICAL DOUBLE AND LEFT SINGLE
    0xB5 => '#x2563',       # BOX DRAWINGS DOUBLE VERTICAL AND LEFT
    0xB6 => '#x2564',       # BOX DRAWINGS DOWN SINGLE AND HORIZONTAL DOUBLE
    0xB7 => '#x2565',       # BOX DRAWINGS DOWN DOUBLE AND HORIZONTAL SINGLE
    0xB8 => '#x2566',       # BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
    0xB9 => '#x2567',       # BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
    0xBA => '#x2568',       # BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
    0xBB => '#x2569',       # BOX DRAWINGS DOUBLE UP AND HORIZONTAL
    0xBC => '#x256A',       # BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
    0xBD => '#x256B',       # BOX DRAWINGS VERTICAL DOUBLE AND HORIZONTAL SINGLE
    0xBE => '#x256C',       # BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL
    0xBF => '#x00A9',       # COPYRIGHT SIGN (code assigned by RFC 1489)

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFF) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
    0xFF => '#x042A',       # CYRILLIC CAPITAL LETTER HARD SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI8_U;

# KOI8-U character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Every code from 0x80 to 0xFF
# has an entry.
#
# Every description must stay on the same line as its '#': a wrapped
# comment tail is parsed as Perl code and breaks the file.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Light box drawing, blocks and shades (0x80 .. 0x92) --------------
    0x80 => '#x2500',       # BOX DRAWINGS LIGHT HORIZONTAL
    0x81 => '#x2502',       # BOX DRAWINGS LIGHT VERTICAL
    0x82 => '#x250C',       # BOX DRAWINGS LIGHT DOWN AND RIGHT
    0x83 => '#x2510',       # BOX DRAWINGS LIGHT DOWN AND LEFT
    0x84 => '#x2514',       # BOX DRAWINGS LIGHT UP AND RIGHT
    0x85 => '#x2518',       # BOX DRAWINGS LIGHT UP AND LEFT
    0x86 => '#x251C',       # BOX DRAWINGS LIGHT VERTICAL AND RIGHT
    0x87 => '#x2524',       # BOX DRAWINGS LIGHT VERTICAL AND LEFT
    0x88 => '#x252C',       # BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
    0x89 => '#x2534',       # BOX DRAWINGS LIGHT UP AND HORIZONTAL
    0x8A => '#x253C',       # BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
    0x8B => '#x2580',       # UPPER HALF BLOCK
    0x8C => '#x2584',       # LOWER HALF BLOCK
    0x8D => '#x2588',       # FULL BLOCK
    0x8E => '#x258C',       # LEFT HALF BLOCK
    0x8F => '#x2590',       # RIGHT HALF BLOCK
    0x90 => '#x2591',       # LIGHT SHADE
    0x91 => '#x2592',       # MEDIUM SHADE
    0x92 => '#x2593',       # DARK SHADE

    # -- Mathematical and other symbols (0x93 .. 0x9F) --------------------
    0x93 => '#x2320',       # TOP HALF INTEGRAL
    0x94 => '#x25A0',       # BLACK SQUARE
    0x95 => '#x2022',       # BULLET
    0x96 => '#x221A',       # SQUARE ROOT
    0x97 => '#x2248',       # ALMOST EQUAL TO
    0x98 => '#x2264',       # LESS-THAN OR EQUAL TO
    0x99 => '#x2265',       # GREATER-THAN OR EQUAL TO
    0x9A => '#x00A0',       # NO-BREAK SPACE
    0x9B => '#x2321',       # BOTTOM HALF INTEGRAL
    0x9C => '#x00B0',       # DEGREE SIGN
    0x9D => '#x00B2',       # SUPERSCRIPT TWO
    0x9E => '#x00B7',       # MIDDLE DOT
    0x9F => '#x00F7',       # DIVISION SIGN

    # -- Double box drawing mixed with Cyrillic letters (0xA0 .. 0xBF) ----
    0xA0 => '#x2550',       # BOX DRAWINGS DOUBLE HORIZONTAL
    0xA1 => '#x2551',       # BOX DRAWINGS DOUBLE VERTICAL
    0xA2 => '#x2552',       # BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE
    0xA3 => '#x0451',       # CYRILLIC SMALL LETTER IO
    0xA4 => '#x0454',       # CYRILLIC SMALL LETTER UKRAINIAN IE
    0xA5 => '#x2554',       # BOX DRAWINGS DOUBLE DOWN AND RIGHT
    0xA6 => '#x0456',       # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
    0xA7 => '#x0457',       # CYRILLIC SMALL LETTER YI
    0xA8 => '#x2557',       # BOX DRAWINGS DOUBLE DOWN AND LEFT
    0xA9 => '#x2558',       # BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE
    0xAA => '#x2559',       # BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE
    0xAB => '#x255A',       # BOX DRAWINGS DOUBLE UP AND RIGHT
    0xAC => '#x255B',       # BOX DRAWINGS UP SINGLE AND LEFT DOUBLE
    0xAD => '#x0491',       # CYRILLIC SMALL LETTER GHE WITH UPTURN
    0xAE => '#x255D',       # BOX DRAWINGS DOUBLE UP AND LEFT
    0xAF => '#x255E',       # BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
    0xB0 => '#x255F',       # BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
    0xB1 => '#x2560',       # BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
    0xB2 => '#x2561',       # BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
    0xB3 => '#x0401',       # CYRILLIC CAPITAL LETTER IO
    0xB4 => '#x0404',       # CYRILLIC CAPITAL LETTER UKRAINIAN IE
    0xB5 => '#x2563',       # BOX DRAWINGS DOUBLE VERTICAL AND LEFT
    0xB6 => '#x0406',       # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
    0xB7 => '#x0407',       # CYRILLIC CAPITAL LETTER YI
    0xB8 => '#x2566',       # BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
    0xB9 => '#x2567',       # BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
    0xBA => '#x2568',       # BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
    0xBB => '#x2569',       # BOX DRAWINGS DOUBLE UP AND HORIZONTAL
    0xBC => '#x256A',       # BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
    0xBD => '#x0490',       # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
    0xBE => '#x256C',       # BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL
    0xBF => '#x00A9',       # COPYRIGHT SIGN (code assigned by RFC 2319)

    # -- Cyrillic small letters (0xC0 .. 0xDF) ----------------------------
    0xC0 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0xC1 => '#x0430',       # CYRILLIC SMALL LETTER A
    0xC2 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0xC3 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0xC4 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0xC5 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0xC6 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0xC7 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0xC8 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0xC9 => '#x0438',       # CYRILLIC SMALL LETTER I
    0xCA => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0xCB => '#x043A',       # CYRILLIC SMALL LETTER KA
    0xCC => '#x043B',       # CYRILLIC SMALL LETTER EL
    0xCD => '#x043C',       # CYRILLIC SMALL LETTER EM
    0xCE => '#x043D',       # CYRILLIC SMALL LETTER EN
    0xCF => '#x043E',       # CYRILLIC SMALL LETTER O
    0xD0 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0xD1 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0xD2 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0xD3 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0xD4 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0xD5 => '#x0443',       # CYRILLIC SMALL LETTER U
    0xD6 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0xD7 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0xD8 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0xD9 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0xDA => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0xDB => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0xDC => '#x044D',       # CYRILLIC SMALL LETTER E
    0xDD => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0xDE => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0xDF => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0xE0 .. 0xFF) --------------------------
    0xE0 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0xE1 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0xE2 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0xE3 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0xE4 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0xE5 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0xE6 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0xE7 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0xE8 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0xE9 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0xEA => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0xEB => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0xEC => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0xED => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0xEE => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0xEF => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0xF0 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0xF1 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0xF2 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0xF3 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0xF4 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0xF5 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0xF6 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0xF7 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0xF8 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xF9 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0xFA => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0xFB => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0xFC => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0xFD => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0xFE => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
    0xFF => '#x042A',       # CYRILLIC CAPITAL LETTER HARD SIGN
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI_0;

# KOI-0 character table.
#
# The last expression of this file is a reference to an anonymous hash.
# Keys are character codes; each value is the body of a hexadecimal
# numeric character reference ('#xHHHH').  Codes without an entry are
# simply not part of this table.
+{
    #----------------------------------------------------------------------
    # Code     Entity ref     Description
    #----------------------------------------------------------------------

    # -- Symbol -----------------------------------------------------------
    0x24 => '#x00A4',       # CURRENCY SIGN

    # -- Cyrillic small letters (0x40 .. 0x5F) ----------------------------
    0x40 => '#x044E',       # CYRILLIC SMALL LETTER YU
    0x41 => '#x0430',       # CYRILLIC SMALL LETTER A
    0x42 => '#x0431',       # CYRILLIC SMALL LETTER BE
    0x43 => '#x0446',       # CYRILLIC SMALL LETTER TSE
    0x44 => '#x0434',       # CYRILLIC SMALL LETTER DE
    0x45 => '#x0435',       # CYRILLIC SMALL LETTER IE
    0x46 => '#x0444',       # CYRILLIC SMALL LETTER EF
    0x47 => '#x0433',       # CYRILLIC SMALL LETTER GHE
    0x48 => '#x0445',       # CYRILLIC SMALL LETTER HA
    0x49 => '#x0438',       # CYRILLIC SMALL LETTER I
    0x4A => '#x0439',       # CYRILLIC SMALL LETTER SHORT I
    0x4B => '#x043A',       # CYRILLIC SMALL LETTER KA
    0x4C => '#x043B',       # CYRILLIC SMALL LETTER EL
    0x4D => '#x043C',       # CYRILLIC SMALL LETTER EM
    0x4E => '#x043D',       # CYRILLIC SMALL LETTER EN
    0x4F => '#x043E',       # CYRILLIC SMALL LETTER O
    0x50 => '#x043F',       # CYRILLIC SMALL LETTER PE
    0x51 => '#x044F',       # CYRILLIC SMALL LETTER YA
    0x52 => '#x0440',       # CYRILLIC SMALL LETTER ER
    0x53 => '#x0441',       # CYRILLIC SMALL LETTER ES
    0x54 => '#x0442',       # CYRILLIC SMALL LETTER TE
    0x55 => '#x0443',       # CYRILLIC SMALL LETTER U
    0x56 => '#x0436',       # CYRILLIC SMALL LETTER ZHE
    0x57 => '#x0432',       # CYRILLIC SMALL LETTER VE
    0x58 => '#x044C',       # CYRILLIC SMALL LETTER SOFT SIGN
    0x59 => '#x044B',       # CYRILLIC SMALL LETTER YERU
    0x5A => '#x0437',       # CYRILLIC SMALL LETTER ZE
    0x5B => '#x0448',       # CYRILLIC SMALL LETTER SHA
    0x5C => '#x044D',       # CYRILLIC SMALL LETTER E
    0x5D => '#x0449',       # CYRILLIC SMALL LETTER SHCHA
    0x5E => '#x0447',       # CYRILLIC SMALL LETTER CHE
    0x5F => '#x044A',       # CYRILLIC SMALL LETTER HARD SIGN

    # -- Cyrillic capital letters (0x60 .. 0x7E) --------------------------
    0x60 => '#x042E',       # CYRILLIC CAPITAL LETTER YU
    0x61 => '#x0410',       # CYRILLIC CAPITAL LETTER A
    0x62 => '#x0411',       # CYRILLIC CAPITAL LETTER BE
    0x63 => '#x0426',       # CYRILLIC CAPITAL LETTER TSE
    0x64 => '#x0414',       # CYRILLIC CAPITAL LETTER DE
    0x65 => '#x0415',       # CYRILLIC CAPITAL LETTER IE
    0x66 => '#x0424',       # CYRILLIC CAPITAL LETTER EF
    0x67 => '#x0413',       # CYRILLIC CAPITAL LETTER GHE
    0x68 => '#x0425',       # CYRILLIC CAPITAL LETTER HA
    0x69 => '#x0418',       # CYRILLIC CAPITAL LETTER I
    0x6A => '#x0419',       # CYRILLIC CAPITAL LETTER SHORT I
    0x6B => '#x041A',       # CYRILLIC CAPITAL LETTER KA
    0x6C => '#x041B',       # CYRILLIC CAPITAL LETTER EL
    0x6D => '#x041C',       # CYRILLIC CAPITAL LETTER EM
    0x6E => '#x041D',       # CYRILLIC CAPITAL LETTER EN
    0x6F => '#x041E',       # CYRILLIC CAPITAL LETTER O
    0x70 => '#x041F',       # CYRILLIC CAPITAL LETTER PE
    0x71 => '#x042F',       # CYRILLIC CAPITAL LETTER YA
    0x72 => '#x0420',       # CYRILLIC CAPITAL LETTER ER
    0x73 => '#x0421',       # CYRILLIC CAPITAL LETTER ES
    0x74 => '#x0422',       # CYRILLIC CAPITAL LETTER TE
    0x75 => '#x0423',       # CYRILLIC CAPITAL LETTER U
    0x76 => '#x0416',       # CYRILLIC CAPITAL LETTER ZHE
    0x77 => '#x0412',       # CYRILLIC CAPITAL LETTER VE
    0x78 => '#x042C',       # CYRILLIC CAPITAL LETTER SOFT SIGN
    0x79 => '#x042B',       # CYRILLIC CAPITAL LETTER YERU
    0x7A => '#x0417',       # CYRILLIC CAPITAL LETTER ZE
    0x7B => '#x0428',       # CYRILLIC CAPITAL LETTER SHA
    0x7C => '#x042D',       # CYRILLIC CAPITAL LETTER E
    0x7D => '#x0429',       # CYRILLIC CAPITAL LETTER SHCHA
    0x7E => '#x0427',       # CYRILLIC CAPITAL LETTER CHE
};
--- NEW FILE ---
package MHonArc::CharEnt::KOI_7;
# Character-code to entity-reference map for the charset this package is
# named after (KOI_7).
#
# The file evaluates to a single anonymous hash:
#   key   - character code (written in hex below)
#   value - name of a Unicode numeric character reference, '#xHHHH',
#           stored without the surrounding '&' and ';'
#
# Only 0x24 and 0x60-0x7E are listed.  The range 0x60-0x7E carries the
# Cyrillic capital letters; no small letters are defined in this table.
# NOTE(review): how the caller treats codes that have no entry is not
# visible from this file -- presumably they are passed through unchanged.
#
# The leading unary '+' makes Perl parse the '{' as an anonymous hash
# constructor rather than as the start of a bare block.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x24 => '#x00A4', # CURRENCY SIGN
0x60 => '#x042E', # CYRILLIC CAPITAL LETTER YU
0x61 => '#x0410', # CYRILLIC CAPITAL LETTER A
0x62 => '#x0411', # CYRILLIC CAPITAL LETTER BE
0x63 => '#x0426', # CYRILLIC CAPITAL LETTER TSE
0x64 => '#x0414', # CYRILLIC CAPITAL LETTER DE
0x65 => '#x0415', # CYRILLIC CAPITAL LETTER IE
0x66 => '#x0424', # CYRILLIC CAPITAL LETTER EF
0x67 => '#x0413', # CYRILLIC CAPITAL LETTER GHE
0x68 => '#x0425', # CYRILLIC CAPITAL LETTER HA
0x69 => '#x0418', # CYRILLIC CAPITAL LETTER I
0x6A => '#x0419', # CYRILLIC CAPITAL LETTER SHORT I
0x6B => '#x041A', # CYRILLIC CAPITAL LETTER KA
0x6C => '#x041B', # CYRILLIC CAPITAL LETTER EL
0x6D => '#x041C', # CYRILLIC CAPITAL LETTER EM
0x6E => '#x041D', # CYRILLIC CAPITAL LETTER EN
0x6F => '#x041E', # CYRILLIC CAPITAL LETTER O
0x70 => '#x041F', # CYRILLIC CAPITAL LETTER PE
0x71 => '#x042F', # CYRILLIC CAPITAL LETTER YA
0x72 => '#x0420', # CYRILLIC CAPITAL LETTER ER
0x73 => '#x0421', # CYRILLIC CAPITAL LETTER ES
0x74 => '#x0422', # CYRILLIC CAPITAL LETTER TE
0x75 => '#x0423', # CYRILLIC CAPITAL LETTER U
0x76 => '#x0416', # CYRILLIC CAPITAL LETTER ZHE
0x77 => '#x0412', # CYRILLIC CAPITAL LETTER VE
0x78 => '#x042C', # CYRILLIC CAPITAL LETTER SOFT SIGN
0x79 => '#x042B', # CYRILLIC CAPITAL LETTER YERU
0x7A => '#x0417', # CYRILLIC CAPITAL LETTER ZE
0x7B => '#x0428', # CYRILLIC CAPITAL LETTER SHA
0x7C => '#x042D', # CYRILLIC CAPITAL LETTER E
0x7D => '#x0429', # CYRILLIC CAPITAL LETTER SHCHA
0x7E => '#x0427', # CYRILLIC CAPITAL LETTER CHE
};
--- NEW FILE ---
package MHonArc::CharEnt::VISCII;
# Vietnamese
#
# Character-code to entity-reference map for the VISCII charset.
#
# The file evaluates to a single anonymous hash:
#   key   - VISCII character code (written in hex below)
#   value - name of a Unicode numeric character reference, '#xHHHH',
#           stored without the surrounding '&' and ';'
#
# Besides 0x80-0xFF, VISCII places six capital letters on codes in the
# control range (0x02, 0x05, 0x06, 0x14, 0x19, 0x1E); they are listed first.
#
# Every entry must stay on ONE physical line: the description is a Perl
# comment, so a wrapped continuation line would be parsed as code.
#
# The leading unary '+' makes Perl parse the '{' as an anonymous hash
# constructor rather than as the start of a bare block.
+{
#--------------------------------------------------------------------------
# Hex Code Entity Ref # ISO external entity and description
#--------------------------------------------------------------------------
0x02 => '#x1EB2', # LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE
0x05 => '#x1EB4', # LATIN CAPITAL LETTER A WITH BREVE AND TILDE
0x06 => '#x1EAA', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE
0x14 => '#x1EF6', # LATIN CAPITAL LETTER Y WITH HOOK ABOVE
0x19 => '#x1EF8', # LATIN CAPITAL LETTER Y WITH TILDE
0x1E => '#x1EF4', # LATIN CAPITAL LETTER Y WITH DOT BELOW
0x80 => '#x1EA0', # LATIN CAPITAL LETTER A WITH DOT BELOW
0x81 => '#x1EAE', # LATIN CAPITAL LETTER A WITH BREVE AND ACUTE
0x82 => '#x1EB0', # LATIN CAPITAL LETTER A WITH BREVE AND GRAVE
0x83 => '#x1EB6', # LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW
0x84 => '#x1EA4', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE
0x85 => '#x1EA6', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE
0x86 => '#x1EA8', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
0x87 => '#x1EAC', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW
0x88 => '#x1EBC', # LATIN CAPITAL LETTER E WITH TILDE
0x89 => '#x1EB8', # LATIN CAPITAL LETTER E WITH DOT BELOW
0x8A => '#x1EBE', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND ACUTE
0x8B => '#x1EC0', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND GRAVE
0x8C => '#x1EC2', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
0x8D => '#x1EC4', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND TILDE
0x8E => '#x1EC6', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND DOT BELOW
0x8F => '#x1ED0', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND ACUTE
0x90 => '#x1ED2', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND GRAVE
0x91 => '#x1ED4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
0x92 => '#x1ED6', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND TILDE
0x93 => '#x1ED8', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND DOT BELOW
0x94 => '#x1EE2', # LATIN CAPITAL LETTER O WITH HORN AND DOT BELOW
0x95 => '#x1EDA', # LATIN CAPITAL LETTER O WITH HORN AND ACUTE
0x96 => '#x1EDC', # LATIN CAPITAL LETTER O WITH HORN AND GRAVE
0x97 => '#x1EDE', # LATIN CAPITAL LETTER O WITH HORN AND HOOK ABOVE
0x98 => '#x1ECA', # LATIN CAPITAL LETTER I WITH DOT BELOW
0x99 => '#x1ECE', # LATIN CAPITAL LETTER O WITH HOOK ABOVE
0x9A => '#x1ECC', # LATIN CAPITAL LETTER O WITH DOT BELOW
0x9B => '#x1EC8', # LATIN CAPITAL LETTER I WITH HOOK ABOVE
0x9C => '#x1EE6', # LATIN CAPITAL LETTER U WITH HOOK ABOVE
0x9D => '#x0168', # LATIN CAPITAL LETTER U WITH TILDE
0x9E => '#x1EE4', # LATIN CAPITAL LETTER U WITH DOT BELOW
0x9F => '#x1EF2', # LATIN CAPITAL LETTER Y WITH GRAVE
0xA0 => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
0xA1 => '#x1EAF', # LATIN SMALL LETTER A WITH BREVE AND ACUTE
0xA2 => '#x1EB1', # LATIN SMALL LETTER A WITH BREVE AND GRAVE
0xA3 => '#x1EB7', # LATIN SMALL LETTER A WITH BREVE AND DOT BELOW
0xA4 => '#x1EA5', # LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE
0xA5 => '#x1EA7', # LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE
0xA6 => '#x1EA9', # LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
0xA7 => '#x1EAD', # LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW
0xA8 => '#x1EBD', # LATIN SMALL LETTER E WITH TILDE
0xA9 => '#x1EB9', # LATIN SMALL LETTER E WITH DOT BELOW
0xAA => '#x1EBF', # LATIN SMALL LETTER E WITH CIRCUMFLEX AND ACUTE
0xAB => '#x1EC1', # LATIN SMALL LETTER E WITH CIRCUMFLEX AND GRAVE
0xAC => '#x1EC3', # LATIN SMALL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
0xAD => '#x1EC5', # LATIN SMALL LETTER E WITH CIRCUMFLEX AND TILDE
0xAE => '#x1EC7', # LATIN SMALL LETTER E WITH CIRCUMFLEX AND DOT BELOW
0xAF => '#x1ED1', # LATIN SMALL LETTER O WITH CIRCUMFLEX AND ACUTE
0xB0 => '#x1ED3', # LATIN SMALL LETTER O WITH CIRCUMFLEX AND GRAVE
0xB1 => '#x1ED5', # LATIN SMALL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
0xB2 => '#x1ED7', # LATIN SMALL LETTER O WITH CIRCUMFLEX AND TILDE
0xB3 => '#x1EE0', # LATIN CAPITAL LETTER O WITH HORN AND TILDE
0xB4 => '#x01A0', # LATIN CAPITAL LETTER O WITH HORN
0xB5 => '#x1ED9', # LATIN SMALL LETTER O WITH CIRCUMFLEX AND DOT BELOW
0xB6 => '#x1EDD', # LATIN SMALL LETTER O WITH HORN AND GRAVE
0xB7 => '#x1EDF', # LATIN SMALL LETTER O WITH HORN AND HOOK ABOVE
0xB8 => '#x1ECB', # LATIN SMALL LETTER I WITH DOT BELOW
0xB9 => '#x1EF0', # LATIN CAPITAL LETTER U WITH HORN AND DOT BELOW
0xBA => '#x1EE8', # LATIN CAPITAL LETTER U WITH HORN AND ACUTE
0xBB => '#x1EEA', # LATIN CAPITAL LETTER U WITH HORN AND GRAVE
0xBC => '#x1EEC', # LATIN CAPITAL LETTER U WITH HORN AND HOOK ABOVE
0xBD => '#x01A1', # LATIN SMALL LETTER O WITH HORN
0xBE => '#x1EDB', # LATIN SMALL LETTER O WITH HORN AND ACUTE
0xBF => '#x01AF', # LATIN CAPITAL LETTER U WITH HORN
0xC0 => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
0xC3 => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
0xC4 => '#x1EA2', # LATIN CAPITAL LETTER A WITH HOOK ABOVE
0xC5 => '#x0102', # LATIN CAPITAL LETTER A WITH BREVE
0xC6 => '#x1EB3', # LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE
0xC7 => '#x1EB5', # LATIN SMALL LETTER A WITH BREVE AND TILDE
0xC8 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
0xCA => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
0xCB => '#x1EBA', # LATIN CAPITAL LETTER E WITH HOOK ABOVE
0xCC => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
0xCE => '#x0128', # LATIN CAPITAL LETTER I WITH TILDE
0xCF => '#x1EF3', # LATIN SMALL LETTER Y WITH GRAVE
0xD0 => '#x0110', # LATIN CAPITAL LETTER D WITH STROKE
0xD1 => '#x1EE9', # LATIN SMALL LETTER U WITH HORN AND ACUTE
0xD2 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xD5 => '#x1EA1', # LATIN SMALL LETTER A WITH DOT BELOW
0xD6 => '#x1EF7', # LATIN SMALL LETTER Y WITH HOOK ABOVE
0xD7 => '#x1EEB', # LATIN SMALL LETTER U WITH HORN AND GRAVE
0xD8 => '#x1EED', # LATIN SMALL LETTER U WITH HORN AND HOOK ABOVE
0xD9 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
0xDB => '#x1EF9', # LATIN SMALL LETTER Y WITH TILDE
0xDC => '#x1EF5', # LATIN SMALL LETTER Y WITH DOT BELOW
0xDD => '#x00DD', # LATIN CAPITAL LETTER Y WITH ACUTE
0xDE => '#x1EE1', # LATIN SMALL LETTER O WITH HORN AND TILDE
0xDF => '#x01B0', # LATIN SMALL LETTER U WITH HORN
0xE0 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
0xE3 => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
0xE4 => '#x1EA3', # LATIN SMALL LETTER A WITH HOOK ABOVE
0xE5 => '#x0103', # LATIN SMALL LETTER A WITH BREVE
0xE6 => '#x1EEF', # LATIN SMALL LETTER U WITH HORN AND TILDE
0xE7 => '#x1EAB', # LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE
0xE8 => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
0xEA => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
0xEB => '#x1EBB', # LATIN SMALL LETTER E WITH HOOK ABOVE
0xEC => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
0xEE => '#x0129', # LATIN SMALL LETTER I WITH TILDE
0xEF => '#x1EC9', # LATIN SMALL LETTER I WITH HOOK ABOVE
0xF0 => '#x0111', # LATIN SMALL LETTER D WITH STROKE
0xF1 => '#x1EF1', # LATIN SMALL LETTER U WITH HORN AND DOT BELOW
0xF2 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
0xF5 => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
0xF6 => '#x1ECF', # LATIN SMALL LETTER O WITH HOOK ABOVE
0xF7 => '#x1ECD', # LATIN SMALL LETTER O WITH DOT BELOW
0xF8 => '#x1EE5', # LATIN SMALL LETTER U WITH DOT BELOW
0xF9 => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
0xFB => '#x0169', # LATIN SMALL LETTER U WITH TILDE
0xFC => '#x1EE7', # LATIN SMALL LETTER U WITH HOOK ABOVE
0xFD => '#x00FD', # LATIN SMALL LETTER Y WITH ACUTE
0xFE => '#x1EE3', # LATIN SMALL LETTER O WITH HORN AND DOT BELOW
0xFF => '#x1EEE', # LATIN CAPITAL LETTER U WITH HORN AND TILDE
};
Index: CP1250.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/CP1250.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** CP1250.pm 5 Sep 2001 14:16:03 -0000 1.1
--- CP1250.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,168 ----
## Windows-1250: WinLatin2
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0x80 => '#x20AC', # EURO SIGN
+ 0x82 => '#x201A', # SINGLE LOW-9 QUOTATION MARK
+ 0x84 => '#x201E', # DOUBLE LOW-9 QUOTATION MARK
+ 0x85 => '#x2026', # HORIZONTAL ELLIPSIS
+ 0x86 => '#x2020', # DAGGER
+ 0x87 => '#x2021', # DOUBLE DAGGER
+ 0x89 => '#x2030', # PER MILLE SIGN
+ 0x8A => '#x0160', # LATIN CAPITAL LETTER S WITH CARON
+ 0x8B => '#x2039', # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
+ 0x8C => '#x015A', # LATIN CAPITAL LETTER S WITH ACUTE
+ 0x8D => '#x0164', # LATIN CAPITAL LETTER T WITH CARON
+ 0x8E => '#x017D', # LATIN CAPITAL LETTER Z WITH CARON
+ 0x8F => '#x0179', # LATIN CAPITAL LETTER Z WITH ACUTE
+ 0x91 => '#x2018', # LEFT SINGLE QUOTATION MARK
+ 0x92 => '#x2019', # RIGHT SINGLE QUOTATION MARK
+ 0x93 => '#x201C', # LEFT DOUBLE QUOTATION MARK
+ 0x94 => '#x201D', # RIGHT DOUBLE QUOTATION MARK
+ 0x95 => '#x2022', # BULLET
+ 0x96 => '#x2013', # EN DASH
+ 0x97 => '#x2014', # EM DASH
+ 0x99 => '#x2122', # TRADE MARK SIGN
+ 0x9A => '#x0161', # LATIN SMALL LETTER S WITH CARON
+ 0x9B => '#x203A', # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
+ 0x9C => '#x015B', # LATIN SMALL LETTER S WITH ACUTE
+ 0x9D => '#x0165', # LATIN SMALL LETTER T WITH CARON
+ 0x9E => '#x017E', # LATIN SMALL LETTER Z WITH CARON
+ 0x9F => '#x017A', # LATIN SMALL LETTER Z WITH ACUTE
+ 0xA1 => '#x02C7', # CARON
+ 0xA2 => '#x02D8', # BREVE
+ 0xA3 => '#x0141', # LATIN CAPITAL LETTER L WITH STROKE
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA5 => '#x0104', # LATIN CAPITAL LETTER A WITH OGONEK
+ 0xA6 => '#x00A6', # BROKEN BAR
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x00A9', # COPYRIGHT SIGN
+ 0xAA => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
+ 0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xAC => '#x00AC', # NOT SIGN
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x00AE', # REGISTERED SIGN
+ 0xAF => '#x017B', # LATIN CAPITAL LETTER Z WITH DOT ABOVE
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x00B1', # PLUS-MINUS SIGN
+ 0xB2 => '#x02DB', # OGONEK
+ 0xB3 => '#x0142', # LATIN SMALL LETTER L WITH STROKE
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x00B5', # MICRO SIGN
+ 0xB6 => '#x00B6', # PILCROW SIGN
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x0105', # LATIN SMALL LETTER A WITH OGONEK
+ 0xBA => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
+ 0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xBC => '#x013D', # LATIN CAPITAL LETTER L WITH CARON
+ 0xBD => '#x02DD', # DOUBLE ACUTE ACCENT
+ 0xBE => '#x013E', # LATIN SMALL LETTER L WITH CARON
+ 0xBF => '#x017C', # LATIN SMALL LETTER Z WITH DOT ABOVE
+ 0xC0 => '#x0154', # LATIN CAPITAL LETTER R WITH ACUTE
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC3 => '#x0102', # LATIN CAPITAL LETTER A WITH BREVE
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x0139', # LATIN CAPITAL LETTER L WITH ACUTE
+ 0xC6 => '#x0106', # LATIN CAPITAL LETTER C WITH ACUTE
+ 0xC7 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
+ 0xC8 => '#x010C', # LATIN CAPITAL LETTER C WITH CARON
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x0118', # LATIN CAPITAL LETTER E WITH OGONEK
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x011A', # LATIN CAPITAL LETTER E WITH CARON
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x010E', # LATIN CAPITAL LETTER D WITH CARON
+ 0xD0 => '#x0110', # LATIN CAPITAL LETTER D WITH STROKE
+ 0xD1 => '#x0143', # LATIN CAPITAL LETTER N WITH ACUTE
+ 0xD2 => '#x0147', # LATIN CAPITAL LETTER N WITH CARON
+ 0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x0150', # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x00D7', # MULTIPLICATION SIGN
+ 0xD8 => '#x0158', # LATIN CAPITAL LETTER R WITH CARON
+ 0xD9 => '#x016E', # LATIN CAPITAL LETTER U WITH RING ABOVE
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x0170', # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x00DD', # LATIN CAPITAL LETTER Y WITH ACUTE
+ 0xDE => '#x0162', # LATIN CAPITAL LETTER T WITH CEDILLA
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
+ 0xE0 => '#x0155', # LATIN SMALL LETTER R WITH ACUTE
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE3 => '#x0103', # LATIN SMALL LETTER A WITH BREVE
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x013A', # LATIN SMALL LETTER L WITH ACUTE
+ 0xE6 => '#x0107', # LATIN SMALL LETTER C WITH ACUTE
+ 0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
+ 0xE8 => '#x010D', # LATIN SMALL LETTER C WITH CARON
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x0119', # LATIN SMALL LETTER E WITH OGONEK
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x011B', # LATIN SMALL LETTER E WITH CARON
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x010F', # LATIN SMALL LETTER D WITH CARON
+ 0xF0 => '#x0111', # LATIN SMALL LETTER D WITH STROKE
+ 0xF1 => '#x0144', # LATIN SMALL LETTER N WITH ACUTE
+ 0xF2 => '#x0148', # LATIN SMALL LETTER N WITH CARON
+ 0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x0151', # LATIN SMALL LETTER O WITH DOUBLE ACUTE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x00F7', # DIVISION SIGN
+ 0xF8 => '#x0159', # LATIN SMALL LETTER R WITH CARON
+ 0xF9 => '#x016F', # LATIN SMALL LETTER U WITH RING ABOVE
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x0171', # LATIN SMALL LETTER U WITH DOUBLE ACUTE
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x00FD', # LATIN SMALL LETTER Y WITH ACUTE
+ 0xFE => '#x0163', # LATIN SMALL LETTER T WITH CEDILLA
+ 0xFF => '#x02D9', # DOT ABOVE
+ };
+ __END__
+
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_10.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_10.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_10.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_10.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,140 ----
## ISO-8859-10: Latin-6
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x0104', # LATIN CAPITAL LETTER A WITH OGONEK
+ 0xA2 => '#x0112', # LATIN CAPITAL LETTER E WITH MACRON
+ 0xA3 => '#x0122', # LATIN CAPITAL LETTER G WITH CEDILLA
+ 0xA4 => '#x012A', # LATIN CAPITAL LETTER I WITH MACRON
+ 0xA5 => '#x0128', # LATIN CAPITAL LETTER I WITH TILDE
+ 0xA6 => '#x0136', # LATIN CAPITAL LETTER K WITH CEDILLA
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x013B', # LATIN CAPITAL LETTER L WITH CEDILLA
+ 0xA9 => '#x0110', # LATIN CAPITAL LETTER D WITH STROKE
+ 0xAA => '#x0160', # LATIN CAPITAL LETTER S WITH CARON
+ 0xAB => '#x0166', # LATIN CAPITAL LETTER T WITH STROKE
+ 0xAC => '#x017D', # LATIN CAPITAL LETTER Z WITH CARON
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x016A', # LATIN CAPITAL LETTER U WITH MACRON
+ 0xAF => '#x014A', # LATIN CAPITAL LETTER ENG
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x0105', # LATIN SMALL LETTER A WITH OGONEK
+ 0xB2 => '#x0113', # LATIN SMALL LETTER E WITH MACRON
+ 0xB3 => '#x0123', # LATIN SMALL LETTER G WITH CEDILLA
+ 0xB4 => '#x012B', # LATIN SMALL LETTER I WITH MACRON
+ 0xB5 => '#x0129', # LATIN SMALL LETTER I WITH TILDE
+ 0xB6 => '#x0137', # LATIN SMALL LETTER K WITH CEDILLA
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x013C', # LATIN SMALL LETTER L WITH CEDILLA
+ 0xB9 => '#x0111', # LATIN SMALL LETTER D WITH STROKE
+ 0xBA => '#x0161', # LATIN SMALL LETTER S WITH CARON
+ 0xBB => '#x0167', # LATIN SMALL LETTER T WITH STROKE
+ 0xBC => '#x017E', # LATIN SMALL LETTER Z WITH CARON
+ 0xBD => '#x2015', # HORIZONTAL BAR
+ 0xBE => '#x016B', # LATIN SMALL LETTER U WITH MACRON
+ 0xBF => '#x014B', # LATIN SMALL LETTER ENG
+ 0xC0 => '#x0100', # LATIN CAPITAL LETTER A WITH MACRON
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC3 => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
+ 0xC6 => '#x00C6', # LATIN CAPITAL LETTER AE
+ 0xC7 => '#x012E', # LATIN CAPITAL LETTER I WITH OGONEK
+ 0xC8 => '#x010C', # LATIN CAPITAL LETTER C WITH CARON
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x0118', # LATIN CAPITAL LETTER E WITH OGONEK
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x0116', # LATIN CAPITAL LETTER E WITH DOT ABOVE
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
+ 0xD0 => '#x00D0', # LATIN CAPITAL LETTER ETH (Icelandic)
+ 0xD1 => '#x0145', # LATIN CAPITAL LETTER N WITH CEDILLA
+ 0xD2 => '#x014C', # LATIN CAPITAL LETTER O WITH MACRON
+ 0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x0168', # LATIN CAPITAL LETTER U WITH TILDE
+ 0xD8 => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
+ 0xD9 => '#x0172', # LATIN CAPITAL LETTER U WITH OGONEK
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x00DD', # LATIN CAPITAL LETTER Y WITH ACUTE
+ 0xDE => '#x00DE', # LATIN CAPITAL LETTER THORN (Icelandic)
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S (German)
+ 0xE0 => '#x0101', # LATIN SMALL LETTER A WITH MACRON
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE3 => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
+ 0xE6 => '#x00E6', # LATIN SMALL LETTER AE
+ 0xE7 => '#x012F', # LATIN SMALL LETTER I WITH OGONEK
+ 0xE8 => '#x010D', # LATIN SMALL LETTER C WITH CARON
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x0119', # LATIN SMALL LETTER E WITH OGONEK
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x0117', # LATIN SMALL LETTER E WITH DOT ABOVE
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
+ 0xF0 => '#x00F0', # LATIN SMALL LETTER ETH (Icelandic)
+ 0xF1 => '#x0146', # LATIN SMALL LETTER N WITH CEDILLA
+ 0xF2 => '#x014D', # LATIN SMALL LETTER O WITH MACRON
+ 0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x0169', # LATIN SMALL LETTER U WITH TILDE
+ 0xF8 => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
+ 0xF9 => '#x0173', # LATIN SMALL LETTER U WITH OGONEK
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x00FD', # LATIN SMALL LETTER Y WITH ACUTE
+ 0xFE => '#x00FE', # LATIN SMALL LETTER THORN (Icelandic)
+ 0xFF => '#x0138', # LATIN SMALL LETTER KRA
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_15.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_15.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_15.pm 13 Apr 2002 00:58:11 -0000 1.1
--- ISO8859_15.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 60,68 ****
0xB2, 'sup2', # ISOnum : SUPERSCRIPT TWO
0xB3, 'sup3', # ISOnum : SUPERSCRIPT THREE
! 0xB4, 'Zcaron', # ISOlat9: ZCARON
0xB5, 'micro', # ISOnum : MICRO SIGN
0xB6, 'para', # ISOnum : PILCROW SIGN
0xB7, 'middot', # ISOnum : MIDDLE DOT
! 0xB8, 'zcaron', # ISOlat9: ZCARON SMALL
0xB9, 'sup1', # ISOnum : SUPERSCRIPT ONE
0xBA, 'ordm', # ISOnum : MASCULINE ORDINAL INDICATOR
--- 60,70 ----
0xB2, 'sup2', # ISOnum : SUPERSCRIPT TWO
0xB3, 'sup3', # ISOnum : SUPERSCRIPT THREE
! # 0xB4, 'Zcaron', # ISOlat9: ZCARON
! 0xB4, '#x017D', # ISOlat9: ZCARON
0xB5, 'micro', # ISOnum : MICRO SIGN
0xB6, 'para', # ISOnum : PILCROW SIGN
0xB7, 'middot', # ISOnum : MIDDLE DOT
! # 0xB8, 'zcaron', # ISOlat9: ZCARON SMALL
! 0xB8, '#x017E', # ISOlat9: ZCARON SMALL
0xB9, 'sup1', # ISOnum : SUPERSCRIPT ONE
0xBA, 'ordm', # ISOnum : MASCULINE ORDINAL INDICATOR
Index: ISO8859_2.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_2.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_2.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_2.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,140 ----
## ISO-8859-2: Latin-2
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x0104', # LATIN CAPITAL LETTER A WITH OGONEK
+ 0xA2 => '#x02D8', # BREVE
+ 0xA3 => '#x0141', # LATIN CAPITAL LETTER L WITH STROKE
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA5 => '#x013D', # LATIN CAPITAL LETTER L WITH CARON
+ 0xA6 => '#x015A', # LATIN CAPITAL LETTER S WITH ACUTE
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x0160', # LATIN CAPITAL LETTER S WITH CARON
+ 0xAA => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
+ 0xAB => '#x0164', # LATIN CAPITAL LETTER T WITH CARON
+ 0xAC => '#x0179', # LATIN CAPITAL LETTER Z WITH ACUTE
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x017D', # LATIN CAPITAL LETTER Z WITH CARON
+ 0xAF => '#x017B', # LATIN CAPITAL LETTER Z WITH DOT ABOVE
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x0105', # LATIN SMALL LETTER A WITH OGONEK
+ 0xB2 => '#x02DB', # OGONEK
+ 0xB3 => '#x0142', # LATIN SMALL LETTER L WITH STROKE
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x013E', # LATIN SMALL LETTER L WITH CARON
+ 0xB6 => '#x015B', # LATIN SMALL LETTER S WITH ACUTE
+ 0xB7 => '#x02C7', # CARON
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x0161', # LATIN SMALL LETTER S WITH CARON
+ 0xBA => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
+ 0xBB => '#x0165', # LATIN SMALL LETTER T WITH CARON
+ 0xBC => '#x017A', # LATIN SMALL LETTER Z WITH ACUTE
+ 0xBD => '#x02DD', # DOUBLE ACUTE ACCENT
+ 0xBE => '#x017E', # LATIN SMALL LETTER Z WITH CARON
+ 0xBF => '#x017C', # LATIN SMALL LETTER Z WITH DOT ABOVE
+ 0xC0 => '#x0154', # LATIN CAPITAL LETTER R WITH ACUTE
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC3 => '#x0102', # LATIN CAPITAL LETTER A WITH BREVE
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x0139', # LATIN CAPITAL LETTER L WITH ACUTE
+ 0xC6 => '#x0106', # LATIN CAPITAL LETTER C WITH ACUTE
+ 0xC7 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
+ 0xC8 => '#x010C', # LATIN CAPITAL LETTER C WITH CARON
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x0118', # LATIN CAPITAL LETTER E WITH OGONEK
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x011A', # LATIN CAPITAL LETTER E WITH CARON
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x010E', # LATIN CAPITAL LETTER D WITH CARON
+ 0xD0 => '#x0110', # LATIN CAPITAL LETTER D WITH STROKE
+ 0xD1 => '#x0143', # LATIN CAPITAL LETTER N WITH ACUTE
+ 0xD2 => '#x0147', # LATIN CAPITAL LETTER N WITH CARON
+ 0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x0150', # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x00D7', # MULTIPLICATION SIGN
+ 0xD8 => '#x0158', # LATIN CAPITAL LETTER R WITH CARON
+ 0xD9 => '#x016E', # LATIN CAPITAL LETTER U WITH RING ABOVE
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x0170', # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x00DD', # LATIN CAPITAL LETTER Y WITH ACUTE
+ 0xDE => '#x0162', # LATIN CAPITAL LETTER T WITH CEDILLA
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
+ 0xE0 => '#x0155', # LATIN SMALL LETTER R WITH ACUTE
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE3 => '#x0103', # LATIN SMALL LETTER A WITH BREVE
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x013A', # LATIN SMALL LETTER L WITH ACUTE
+ 0xE6 => '#x0107', # LATIN SMALL LETTER C WITH ACUTE
+ 0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
+ 0xE8 => '#x010D', # LATIN SMALL LETTER C WITH CARON
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x0119', # LATIN SMALL LETTER E WITH OGONEK
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x011B', # LATIN SMALL LETTER E WITH CARON
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x010F', # LATIN SMALL LETTER D WITH CARON
+ 0xF0 => '#x0111', # LATIN SMALL LETTER D WITH STROKE
+ 0xF1 => '#x0144', # LATIN SMALL LETTER N WITH ACUTE
+ 0xF2 => '#x0148', # LATIN SMALL LETTER N WITH CARON
+ 0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x0151', # LATIN SMALL LETTER O WITH DOUBLE ACUTE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x00F7', # DIVISION SIGN
+ 0xF8 => '#x0159', # LATIN SMALL LETTER R WITH CARON
+ 0xF9 => '#x016F', # LATIN SMALL LETTER U WITH RING ABOVE
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x0171', # LATIN SMALL LETTER U WITH DOUBLE ACUTE
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x00FD', # LATIN SMALL LETTER Y WITH ACUTE
+ 0xFE => '#x0163', # LATIN SMALL LETTER T WITH CEDILLA
+ 0xFF => '#x02D9', # DOT ABOVE
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_3.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_3.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_3.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_3.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,133 ----
## ISO-8859-3: Latin-3
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x0126', # LATIN CAPITAL LETTER H WITH STROKE
+ 0xA2 => '#x02D8', # BREVE
+ 0xA3 => '#x00A3', # POUND SIGN
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA6 => '#x0124', # LATIN CAPITAL LETTER H WITH CIRCUMFLEX
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x0130', # LATIN CAPITAL LETTER I WITH DOT ABOVE
+ 0xAA => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
+ 0xAB => '#x011E', # LATIN CAPITAL LETTER G WITH BREVE
+ 0xAC => '#x0134', # LATIN CAPITAL LETTER J WITH CIRCUMFLEX
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAF => '#x017B', # LATIN CAPITAL LETTER Z WITH DOT ABOVE
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x0127', # LATIN SMALL LETTER H WITH STROKE
+ 0xB2 => '#x00B2', # SUPERSCRIPT TWO
+ 0xB3 => '#x00B3', # SUPERSCRIPT THREE
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x00B5', # MICRO SIGN
+ 0xB6 => '#x0125', # LATIN SMALL LETTER H WITH CIRCUMFLEX
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x0131', # LATIN SMALL LETTER DOTLESS I
+ 0xBA => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
+ 0xBB => '#x011F', # LATIN SMALL LETTER G WITH BREVE
+ 0xBC => '#x0135', # LATIN SMALL LETTER J WITH CIRCUMFLEX
+ 0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
+ 0xBF => '#x017C', # LATIN SMALL LETTER Z WITH DOT ABOVE
+ 0xC0 => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x010A', # LATIN CAPITAL LETTER C WITH DOT ABOVE
+ 0xC6 => '#x0108', # LATIN CAPITAL LETTER C WITH CIRCUMFLEX
+ 0xC7 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
+ 0xC8 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
+ 0xD1 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
+ 0xD2 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
+ 0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x0120', # LATIN CAPITAL LETTER G WITH DOT ABOVE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x00D7', # MULTIPLICATION SIGN
+ 0xD8 => '#x011C', # LATIN CAPITAL LETTER G WITH CIRCUMFLEX
+ 0xD9 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x016C', # LATIN CAPITAL LETTER U WITH BREVE
+ 0xDE => '#x015C', # LATIN CAPITAL LETTER S WITH CIRCUMFLEX
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
+ 0xE0 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x010B', # LATIN SMALL LETTER C WITH DOT ABOVE
+ 0xE6 => '#x0109', # LATIN SMALL LETTER C WITH CIRCUMFLEX
+ 0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
+ 0xE8 => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
+ 0xF1 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
+ 0xF2 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
+ 0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x0121', # LATIN SMALL LETTER G WITH DOT ABOVE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x00F7', # DIVISION SIGN
+ 0xF8 => '#x011D', # LATIN SMALL LETTER G WITH CIRCUMFLEX
+ 0xF9 => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x016D', # LATIN SMALL LETTER U WITH BREVE
+ 0xFE => '#x015D', # LATIN SMALL LETTER S WITH CIRCUMFLEX
+ 0xFF => '#x02D9', # DOT ABOVE
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_4.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_4.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_4.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_4.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,140 ----
## ISO-8859-4: Latin-4
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x0104', # LATIN CAPITAL LETTER A WITH OGONEK
+ 0xA2 => '#x0138', # LATIN SMALL LETTER KRA
+ 0xA3 => '#x0156', # LATIN CAPITAL LETTER R WITH CEDILLA
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA5 => '#x0128', # LATIN CAPITAL LETTER I WITH TILDE
+ 0xA6 => '#x013B', # LATIN CAPITAL LETTER L WITH CEDILLA
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x0160', # LATIN CAPITAL LETTER S WITH CARON
+ 0xAA => '#x0112', # LATIN CAPITAL LETTER E WITH MACRON
+ 0xAB => '#x0122', # LATIN CAPITAL LETTER G WITH CEDILLA
+ 0xAC => '#x0166', # LATIN CAPITAL LETTER T WITH STROKE
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x017D', # LATIN CAPITAL LETTER Z WITH CARON
+ 0xAF => '#x00AF', # MACRON
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x0105', # LATIN SMALL LETTER A WITH OGONEK
+ 0xB2 => '#x02DB', # OGONEK
+ 0xB3 => '#x0157', # LATIN SMALL LETTER R WITH CEDILLA
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x0129', # LATIN SMALL LETTER I WITH TILDE
+ 0xB6 => '#x013C', # LATIN SMALL LETTER L WITH CEDILLA
+ 0xB7 => '#x02C7', # CARON
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x0161', # LATIN SMALL LETTER S WITH CARON
+ 0xBA => '#x0113', # LATIN SMALL LETTER E WITH MACRON
+ 0xBB => '#x0123', # LATIN SMALL LETTER G WITH CEDILLA
+ 0xBC => '#x0167', # LATIN SMALL LETTER T WITH STROKE
+ 0xBD => '#x014A', # LATIN CAPITAL LETTER ENG
+ 0xBE => '#x017E', # LATIN SMALL LETTER Z WITH CARON
+ 0xBF => '#x014B', # LATIN SMALL LETTER ENG
+ 0xC0 => '#x0100', # LATIN CAPITAL LETTER A WITH MACRON
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC3 => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
+ 0xC6 => '#x00C6', # LATIN CAPITAL LETTER AE
+ 0xC7 => '#x012E', # LATIN CAPITAL LETTER I WITH OGONEK
+ 0xC8 => '#x010C', # LATIN CAPITAL LETTER C WITH CARON
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x0118', # LATIN CAPITAL LETTER E WITH OGONEK
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x0116', # LATIN CAPITAL LETTER E WITH DOT ABOVE
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x012A', # LATIN CAPITAL LETTER I WITH MACRON
+ 0xD0 => '#x0110', # LATIN CAPITAL LETTER D WITH STROKE
+ 0xD1 => '#x0145', # LATIN CAPITAL LETTER N WITH CEDILLA
+ 0xD2 => '#x014C', # LATIN CAPITAL LETTER O WITH MACRON
+ 0xD3 => '#x0136', # LATIN CAPITAL LETTER K WITH CEDILLA
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x00D7', # MULTIPLICATION SIGN
+ 0xD8 => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
+ 0xD9 => '#x0172', # LATIN CAPITAL LETTER U WITH OGONEK
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x0168', # LATIN CAPITAL LETTER U WITH TILDE
+ 0xDE => '#x016A', # LATIN CAPITAL LETTER U WITH MACRON
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
+ 0xE0 => '#x0101', # LATIN SMALL LETTER A WITH MACRON
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE3 => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
+ 0xE6 => '#x00E6', # LATIN SMALL LETTER AE
+ 0xE7 => '#x012F', # LATIN SMALL LETTER I WITH OGONEK
+ 0xE8 => '#x010D', # LATIN SMALL LETTER C WITH CARON
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x0119', # LATIN SMALL LETTER E WITH OGONEK
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x0117', # LATIN SMALL LETTER E WITH DOT ABOVE
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x012B', # LATIN SMALL LETTER I WITH MACRON
+ 0xF0 => '#x0111', # LATIN SMALL LETTER D WITH STROKE
+ 0xF1 => '#x0146', # LATIN SMALL LETTER N WITH CEDILLA
+ 0xF2 => '#x014D', # LATIN SMALL LETTER O WITH MACRON
+ 0xF3 => '#x0137', # LATIN SMALL LETTER K WITH CEDILLA
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x00F7', # DIVISION SIGN
+ 0xF8 => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
+ 0xF9 => '#x0173', # LATIN SMALL LETTER U WITH OGONEK
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x0169', # LATIN SMALL LETTER U WITH TILDE
+ 0xFE => '#x016B', # LATIN SMALL LETTER U WITH MACRON
+ 0xFF => '#x02D9', # DOT ABOVE
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_5.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_5.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_5.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_5.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,138 ----
## ISO-8859-5: Cyrillic
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x0401', # CYRILLIC CAPITAL LETTER IO
+ 0xA2 => '#x0402', # CYRILLIC CAPITAL LETTER DJE
+ 0xA3 => '#x0403', # CYRILLIC CAPITAL LETTER GJE
+ 0xA4 => '#x0404', # CYRILLIC CAPITAL LETTER UKRAINIAN IE
+ 0xA5 => '#x0405', # CYRILLIC CAPITAL LETTER DZE
+ 0xA6 => '#x0406', # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
+ 0xA7 => '#x0407', # CYRILLIC CAPITAL LETTER YI
+ 0xA8 => '#x0408', # CYRILLIC CAPITAL LETTER JE
+ 0xA9 => '#x0409', # CYRILLIC CAPITAL LETTER LJE
+ 0xAA => '#x040A', # CYRILLIC CAPITAL LETTER NJE
+ 0xAB => '#x040B', # CYRILLIC CAPITAL LETTER TSHE
+ 0xAC => '#x040C', # CYRILLIC CAPITAL LETTER KJE
+ 0xAE => '#x040E', # CYRILLIC CAPITAL LETTER SHORT U
+ 0xAF => '#x040F', # CYRILLIC CAPITAL LETTER DZHE
+ 0xB0 => '#x0410', # CYRILLIC CAPITAL LETTER A
+ 0xB1 => '#x0411', # CYRILLIC CAPITAL LETTER BE
+ 0xB2 => '#x0412', # CYRILLIC CAPITAL LETTER VE
+ 0xB3 => '#x0413', # CYRILLIC CAPITAL LETTER GHE
+ 0xB4 => '#x0414', # CYRILLIC CAPITAL LETTER DE
+ 0xB5 => '#x0415', # CYRILLIC CAPITAL LETTER IE
+ 0xB6 => '#x0416', # CYRILLIC CAPITAL LETTER ZHE
+ 0xB7 => '#x0417', # CYRILLIC CAPITAL LETTER ZE
+ 0xB8 => '#x0418', # CYRILLIC CAPITAL LETTER I
+ 0xB9 => '#x0419', # CYRILLIC CAPITAL LETTER SHORT I
+ 0xBA => '#x041A', # CYRILLIC CAPITAL LETTER KA
+ 0xBB => '#x041B', # CYRILLIC CAPITAL LETTER EL
+ 0xBC => '#x041C', # CYRILLIC CAPITAL LETTER EM
+ 0xBD => '#x041D', # CYRILLIC CAPITAL LETTER EN
+ 0xBE => '#x041E', # CYRILLIC CAPITAL LETTER O
+ 0xBF => '#x041F', # CYRILLIC CAPITAL LETTER PE
+ 0xC0 => '#x0420', # CYRILLIC CAPITAL LETTER ER
+ 0xC1 => '#x0421', # CYRILLIC CAPITAL LETTER ES
+ 0xC2 => '#x0422', # CYRILLIC CAPITAL LETTER TE
+ 0xC3 => '#x0423', # CYRILLIC CAPITAL LETTER U
+ 0xC4 => '#x0424', # CYRILLIC CAPITAL LETTER EF
+ 0xC5 => '#x0425', # CYRILLIC CAPITAL LETTER HA
+ 0xC6 => '#x0426', # CYRILLIC CAPITAL LETTER TSE
+ 0xC7 => '#x0427', # CYRILLIC CAPITAL LETTER CHE
+ 0xC8 => '#x0428', # CYRILLIC CAPITAL LETTER SHA
+ 0xC9 => '#x0429', # CYRILLIC CAPITAL LETTER SHCHA
+ 0xCA => '#x042A', # CYRILLIC CAPITAL LETTER HARD SIGN
+ 0xCB => '#x042B', # CYRILLIC CAPITAL LETTER YERU
+ 0xCC => '#x042C', # CYRILLIC CAPITAL LETTER SOFT SIGN
+ 0xCD => '#x042D', # CYRILLIC CAPITAL LETTER E
+ 0xCE => '#x042E', # CYRILLIC CAPITAL LETTER YU
+ 0xCF => '#x042F', # CYRILLIC CAPITAL LETTER YA
+ 0xD0 => '#x0430', # CYRILLIC SMALL LETTER A
+ 0xD1 => '#x0431', # CYRILLIC SMALL LETTER BE
+ 0xD2 => '#x0432', # CYRILLIC SMALL LETTER VE
+ 0xD3 => '#x0433', # CYRILLIC SMALL LETTER GHE
+ 0xD4 => '#x0434', # CYRILLIC SMALL LETTER DE
+ 0xD5 => '#x0435', # CYRILLIC SMALL LETTER IE
+ 0xD6 => '#x0436', # CYRILLIC SMALL LETTER ZHE
+ 0xD7 => '#x0437', # CYRILLIC SMALL LETTER ZE
+ 0xD8 => '#x0438', # CYRILLIC SMALL LETTER I
+ 0xD9 => '#x0439', # CYRILLIC SMALL LETTER SHORT I
+ 0xDA => '#x043A', # CYRILLIC SMALL LETTER KA
+ 0xDB => '#x043B', # CYRILLIC SMALL LETTER EL
+ 0xDC => '#x043C', # CYRILLIC SMALL LETTER EM
+ 0xDD => '#x043D', # CYRILLIC SMALL LETTER EN
+ 0xDE => '#x043E', # CYRILLIC SMALL LETTER O
+ 0xDF => '#x043F', # CYRILLIC SMALL LETTER PE
+ 0xE0 => '#x0440', # CYRILLIC SMALL LETTER ER
+ 0xE1 => '#x0441', # CYRILLIC SMALL LETTER ES
+ 0xE2 => '#x0442', # CYRILLIC SMALL LETTER TE
+ 0xE3 => '#x0443', # CYRILLIC SMALL LETTER U
+ 0xE4 => '#x0444', # CYRILLIC SMALL LETTER EF
+ 0xE5 => '#x0445', # CYRILLIC SMALL LETTER HA
+ 0xE6 => '#x0446', # CYRILLIC SMALL LETTER TSE
+ 0xE7 => '#x0447', # CYRILLIC SMALL LETTER CHE
+ 0xE8 => '#x0448', # CYRILLIC SMALL LETTER SHA
+ 0xE9 => '#x0449', # CYRILLIC SMALL LETTER SHCHA
+ 0xEA => '#x044A', # CYRILLIC SMALL LETTER HARD SIGN
+ 0xEB => '#x044B', # CYRILLIC SMALL LETTER YERU
+ 0xEC => '#x044C', # CYRILLIC SMALL LETTER SOFT SIGN
+ 0xED => '#x044D', # CYRILLIC SMALL LETTER E
+ 0xEE => '#x044E', # CYRILLIC SMALL LETTER YU
+ 0xEF => '#x044F', # CYRILLIC SMALL LETTER YA
+ 0xF0 => '#x2116', # NUMERO SIGN
+ 0xF1 => '#x0451', # CYRILLIC SMALL LETTER IO
+ 0xF2 => '#x0452', # CYRILLIC SMALL LETTER DJE
+ 0xF3 => '#x0453', # CYRILLIC SMALL LETTER GJE
+ 0xF4 => '#x0454', # CYRILLIC SMALL LETTER UKRAINIAN IE
+ 0xF5 => '#x0455', # CYRILLIC SMALL LETTER DZE
+ 0xF6 => '#x0456', # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
+ 0xF7 => '#x0457', # CYRILLIC SMALL LETTER YI
+ 0xF8 => '#x0458', # CYRILLIC SMALL LETTER JE
+ 0xF9 => '#x0459', # CYRILLIC SMALL LETTER LJE
+ 0xFA => '#x045A', # CYRILLIC SMALL LETTER NJE
+ 0xFB => '#x045B', # CYRILLIC SMALL LETTER TSHE
+ 0xFC => '#x045C', # CYRILLIC SMALL LETTER KJE
+ 0xFE => '#x045E', # CYRILLIC SMALL LETTER SHORT U
+ 0xFF => '#x045F', # CYRILLIC SMALL LETTER DZHE
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_6.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_6.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_6.pm 19 Aug 2001 09:53:55 -0000 1.1
--- ISO8859_6.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,41 ****
## ISO-8859-6: Arabic
##---------------------------------------------------------------------------
## Note: There is no ISO entities for arabic characters. Some of
## the following are non-standard entity references. 'ISOarbc'
## is used as the entity defining the Arabic entities.
-
+{
#--------------------------------------------------------------------------
--- 34,98 ----
## ISO-8859-6: Arabic
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xAC => '#x060C', # ARABIC COMMA
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xBB => '#x061B', # ARABIC SEMICOLON
+ 0xBF => '#x061F', # ARABIC QUESTION MARK
+ 0xC1 => '#x0621', # ARABIC LETTER HAMZA
+ 0xC2 => '#x0622', # ARABIC LETTER ALEF WITH MADDA ABOVE
+ 0xC3 => '#x0623', # ARABIC LETTER ALEF WITH HAMZA ABOVE
+ 0xC4 => '#x0624', # ARABIC LETTER WAW WITH HAMZA ABOVE
+ 0xC5 => '#x0625', # ARABIC LETTER ALEF WITH HAMZA BELOW
+ 0xC6 => '#x0626', # ARABIC LETTER YEH WITH HAMZA ABOVE
+ 0xC7 => '#x0627', # ARABIC LETTER ALEF
+ 0xC8 => '#x0628', # ARABIC LETTER BEH
+ 0xC9 => '#x0629', # ARABIC LETTER TEH MARBUTA
+ 0xCA => '#x062A', # ARABIC LETTER TEH
+ 0xCB => '#x062B', # ARABIC LETTER THEH
+ 0xCC => '#x062C', # ARABIC LETTER JEEM
+ 0xCD => '#x062D', # ARABIC LETTER HAH
+ 0xCE => '#x062E', # ARABIC LETTER KHAH
+ 0xCF => '#x062F', # ARABIC LETTER DAL
+ 0xD0 => '#x0630', # ARABIC LETTER THAL
+ 0xD1 => '#x0631', # ARABIC LETTER REH
+ 0xD2 => '#x0632', # ARABIC LETTER ZAIN
+ 0xD3 => '#x0633', # ARABIC LETTER SEEN
+ 0xD4 => '#x0634', # ARABIC LETTER SHEEN
+ 0xD5 => '#x0635', # ARABIC LETTER SAD
+ 0xD6 => '#x0636', # ARABIC LETTER DAD
+ 0xD7 => '#x0637', # ARABIC LETTER TAH
+ 0xD8 => '#x0638', # ARABIC LETTER ZAH
+ 0xD9 => '#x0639', # ARABIC LETTER AIN
+ 0xDA => '#x063A', # ARABIC LETTER GHAIN
+ 0xE0 => '#x0640', # ARABIC TATWEEL
+ 0xE1 => '#x0641', # ARABIC LETTER FEH
+ 0xE2 => '#x0642', # ARABIC LETTER QAF
+ 0xE3 => '#x0643', # ARABIC LETTER KAF
+ 0xE4 => '#x0644', # ARABIC LETTER LAM
+ 0xE5 => '#x0645', # ARABIC LETTER MEEM
+ 0xE6 => '#x0646', # ARABIC LETTER NOON
+ 0xE7 => '#x0647', # ARABIC LETTER HEH
+ 0xE8 => '#x0648', # ARABIC LETTER WAW
+ 0xE9 => '#x0649', # ARABIC LETTER ALEF MAKSURA
+ 0xEA => '#x064A', # ARABIC LETTER YEH
+ 0xEB => '#x064B', # ARABIC FATHATAN
+ 0xEC => '#x064C', # ARABIC DAMMATAN
+ 0xED => '#x064D', # ARABIC KASRATAN
+ 0xEE => '#x064E', # ARABIC FATHA
+ 0xEF => '#x064F', # ARABIC DAMMA
+ 0xF0 => '#x0650', # ARABIC KASRA
+ 0xF1 => '#x0651', # ARABIC SHADDA
+ 0xF2 => '#x0652', # ARABIC SUKUN
+ };
+
+ __END__
+ # SGML-based map
## Note: There is no ISO entities for arabic characters. Some of
## the following are non-standard entity references. 'ISOarbc'
## is used as the entity defining the Arabic entities.
+{
#--------------------------------------------------------------------------
Index: ISO8859_7.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_7.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_7.pm 19 Aug 2001 09:53:56 -0000 1.1
--- ISO8859_7.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,134 ----
## ISO-8859-7: Greek
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x2018', # LEFT SINGLE QUOTATION MARK
+ 0xA2 => '#x2019', # RIGHT SINGLE QUOTATION MARK
+ 0xA3 => '#x00A3', # POUND SIGN
+ 0xA6 => '#x00A6', # BROKEN BAR
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x00A9', # COPYRIGHT SIGN
+ 0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xAC => '#x00AC', # NOT SIGN
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAF => '#x2015', # HORIZONTAL BAR
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x00B1', # PLUS-MINUS SIGN
+ 0xB2 => '#x00B2', # SUPERSCRIPT TWO
+ 0xB3 => '#x00B3', # SUPERSCRIPT THREE
+ 0xB4 => '#x0384', # GREEK TONOS
+ 0xB5 => '#x0385', # GREEK DIALYTIKA TONOS
+ 0xB6 => '#x0386', # GREEK CAPITAL LETTER ALPHA WITH TONOS
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x0388', # GREEK CAPITAL LETTER EPSILON WITH TONOS
+ 0xB9 => '#x0389', # GREEK CAPITAL LETTER ETA WITH TONOS
+ 0xBA => '#x038A', # GREEK CAPITAL LETTER IOTA WITH TONOS
+ 0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xBC => '#x038C', # GREEK CAPITAL LETTER OMICRON WITH TONOS
+ 0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
+ 0xBE => '#x038E', # GREEK CAPITAL LETTER UPSILON WITH TONOS
+ 0xBF => '#x038F', # GREEK CAPITAL LETTER OMEGA WITH TONOS
+ 0xC0 => '#x0390', # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
+ 0xC1 => '#x0391', # GREEK CAPITAL LETTER ALPHA
+ 0xC2 => '#x0392', # GREEK CAPITAL LETTER BETA
+ 0xC3 => '#x0393', # GREEK CAPITAL LETTER GAMMA
+ 0xC4 => '#x0394', # GREEK CAPITAL LETTER DELTA
+ 0xC5 => '#x0395', # GREEK CAPITAL LETTER EPSILON
+ 0xC6 => '#x0396', # GREEK CAPITAL LETTER ZETA
+ 0xC7 => '#x0397', # GREEK CAPITAL LETTER ETA
+ 0xC8 => '#x0398', # GREEK CAPITAL LETTER THETA
+ 0xC9 => '#x0399', # GREEK CAPITAL LETTER IOTA
+ 0xCA => '#x039A', # GREEK CAPITAL LETTER KAPPA
+ 0xCB => '#x039B', # GREEK CAPITAL LETTER LAMDA
+ 0xCC => '#x039C', # GREEK CAPITAL LETTER MU
+ 0xCD => '#x039D', # GREEK CAPITAL LETTER NU
+ 0xCE => '#x039E', # GREEK CAPITAL LETTER XI
+ 0xCF => '#x039F', # GREEK CAPITAL LETTER OMICRON
+ 0xD0 => '#x03A0', # GREEK CAPITAL LETTER PI
+ 0xD1 => '#x03A1', # GREEK CAPITAL LETTER RHO
+ 0xD3 => '#x03A3', # GREEK CAPITAL LETTER SIGMA
+ 0xD4 => '#x03A4', # GREEK CAPITAL LETTER TAU
+ 0xD5 => '#x03A5', # GREEK CAPITAL LETTER UPSILON
+ 0xD6 => '#x03A6', # GREEK CAPITAL LETTER PHI
+ 0xD7 => '#x03A7', # GREEK CAPITAL LETTER CHI
+ 0xD8 => '#x03A8', # GREEK CAPITAL LETTER PSI
+ 0xD9 => '#x03A9', # GREEK CAPITAL LETTER OMEGA
+ 0xDA => '#x03AA', # GREEK CAPITAL LETTER IOTA WITH DIALYTIKA
+ 0xDB => '#x03AB', # GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA
+ 0xDC => '#x03AC', # GREEK SMALL LETTER ALPHA WITH TONOS
+ 0xDD => '#x03AD', # GREEK SMALL LETTER EPSILON WITH TONOS
+ 0xDE => '#x03AE', # GREEK SMALL LETTER ETA WITH TONOS
+ 0xDF => '#x03AF', # GREEK SMALL LETTER IOTA WITH TONOS
+ 0xE0 => '#x03B0', # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
+ 0xE1 => '#x03B1', # GREEK SMALL LETTER ALPHA
+ 0xE2 => '#x03B2', # GREEK SMALL LETTER BETA
+ 0xE3 => '#x03B3', # GREEK SMALL LETTER GAMMA
+ 0xE4 => '#x03B4', # GREEK SMALL LETTER DELTA
+ 0xE5 => '#x03B5', # GREEK SMALL LETTER EPSILON
+ 0xE6 => '#x03B6', # GREEK SMALL LETTER ZETA
+ 0xE7 => '#x03B7', # GREEK SMALL LETTER ETA
+ 0xE8 => '#x03B8', # GREEK SMALL LETTER THETA
+ 0xE9 => '#x03B9', # GREEK SMALL LETTER IOTA
+ 0xEA => '#x03BA', # GREEK SMALL LETTER KAPPA
+ 0xEB => '#x03BB', # GREEK SMALL LETTER LAMDA
+ 0xEC => '#x03BC', # GREEK SMALL LETTER MU
+ 0xED => '#x03BD', # GREEK SMALL LETTER NU
+ 0xEE => '#x03BE', # GREEK SMALL LETTER XI
+ 0xEF => '#x03BF', # GREEK SMALL LETTER OMICRON
+ 0xF0 => '#x03C0', # GREEK SMALL LETTER PI
+ 0xF1 => '#x03C1', # GREEK SMALL LETTER RHO
+ 0xF2 => '#x03C2', # GREEK SMALL LETTER FINAL SIGMA
+ 0xF3 => '#x03C3', # GREEK SMALL LETTER SIGMA
+ 0xF4 => '#x03C4', # GREEK SMALL LETTER TAU
+ 0xF5 => '#x03C5', # GREEK SMALL LETTER UPSILON
+ 0xF6 => '#x03C6', # GREEK SMALL LETTER PHI
+ 0xF7 => '#x03C7', # GREEK SMALL LETTER CHI
+ 0xF8 => '#x03C8', # GREEK SMALL LETTER PSI
+ 0xF9 => '#x03C9', # GREEK SMALL LETTER OMEGA
+ 0xFA => '#x03CA', # GREEK SMALL LETTER IOTA WITH DIALYTIKA
+ 0xFB => '#x03CB', # GREEK SMALL LETTER UPSILON WITH DIALYTIKA
+ 0xFC => '#x03CC', # GREEK SMALL LETTER OMICRON WITH TONOS
+ 0xFD => '#x03CD', # GREEK SMALL LETTER UPSILON WITH TONOS
+ 0xFE => '#x03CE', # GREEK SMALL LETTER OMEGA WITH TONOS
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
Index: ISO8859_8.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_8.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_8.pm 19 Aug 2001 09:53:56 -0000 1.1
--- ISO8859_8.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,37 ****
--- 34,105 ----
## ISO-8859-8: Hebrew
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA2 => '#x00A2', # CENT SIGN
+ 0xA3 => '#x00A3', # POUND SIGN
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA5 => '#x00A5', # YEN SIGN
+ 0xA6 => '#x00A6', # BROKEN BAR
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x00A9', # COPYRIGHT SIGN
+ 0xAA => '#x00D7', # MULTIPLICATION SIGN
+ 0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xAC => '#x00AC', # NOT SIGN
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x00AE', # REGISTERED SIGN
+ 0xAF => '#x00AF', # MACRON
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x00B1', # PLUS-MINUS SIGN
+ 0xB2 => '#x00B2', # SUPERSCRIPT TWO
+ 0xB3 => '#x00B3', # SUPERSCRIPT THREE
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x00B5', # MICRO SIGN
+ 0xB6 => '#x00B6', # PILCROW SIGN
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x00B9', # SUPERSCRIPT ONE
+ 0xBA => '#x00F7', # DIVISION SIGN
+ 0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xBC => '#x00BC', # VULGAR FRACTION ONE QUARTER
+ 0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
+ 0xBE => '#x00BE', # VULGAR FRACTION THREE QUARTERS
+ 0xDF => '#x2017', # DOUBLE LOW LINE
+ 0xE0 => '#x05D0', # HEBREW LETTER ALEF
+ 0xE1 => '#x05D1', # HEBREW LETTER BET
+ 0xE2 => '#x05D2', # HEBREW LETTER GIMEL
+ 0xE3 => '#x05D3', # HEBREW LETTER DALET
+ 0xE4 => '#x05D4', # HEBREW LETTER HE
+ 0xE5 => '#x05D5', # HEBREW LETTER VAV
+ 0xE6 => '#x05D6', # HEBREW LETTER ZAYIN
+ 0xE7 => '#x05D7', # HEBREW LETTER HET
+ 0xE8 => '#x05D8', # HEBREW LETTER TET
+ 0xE9 => '#x05D9', # HEBREW LETTER YOD
+ 0xEA => '#x05DA', # HEBREW LETTER FINAL KAF
+ 0xEB => '#x05DB', # HEBREW LETTER KAF
+ 0xEC => '#x05DC', # HEBREW LETTER LAMED
+ 0xED => '#x05DD', # HEBREW LETTER FINAL MEM
+ 0xEE => '#x05DE', # HEBREW LETTER MEM
+ 0xEF => '#x05DF', # HEBREW LETTER FINAL NUN
+ 0xF0 => '#x05E0', # HEBREW LETTER NUN
+ 0xF1 => '#x05E1', # HEBREW LETTER SAMEKH
+ 0xF2 => '#x05E2', # HEBREW LETTER AYIN
+ 0xF3 => '#x05E3', # HEBREW LETTER FINAL PE
+ 0xF4 => '#x05E4', # HEBREW LETTER PE
+ 0xF5 => '#x05E5', # HEBREW LETTER FINAL TSADI
+ 0xF6 => '#x05E6', # HEBREW LETTER TSADI
+ 0xF7 => '#x05E7', # HEBREW LETTER QOF
+ 0xF8 => '#x05E8', # HEBREW LETTER RESH
+ 0xF9 => '#x05E9', # HEBREW LETTER SHIN
+ 0xFA => '#x05EA', # HEBREW LETTER TAV
+ 0xFD => '#x200E', # LEFT-TO-RIGHT MARK
+ 0xFE => '#x200F', # RIGHT-TO-LEFT MARK
+ };
+
+ __END__
+
+ ## SGML-based map
## Note: There is no ISO entities for hebrew characters. ISOamso
## defines a few characters, but they are for math purposes.
Index: ISO8859_9.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/ISO8859_9.pm,v
retrieving revision 1.1
retrieving revision 1.2
diff -C2 -r1.1 -r1.2
*** ISO8859_9.pm 19 Aug 2001 09:53:56 -0000 1.1
--- ISO8859_9.pm 17 Nov 2002 03:38:53 -0000 1.2
***************
*** 34,38 ****
--- 34,140 ----
## ISO-8859-9: Latin-5
##---------------------------------------------------------------------------
+ +{
+ #--------------------------------------------------------------------------
+ # Hex Code Entity Ref # ISO external entity and description
+ #--------------------------------------------------------------------------
+ 0xA1 => '#x00A1', # INVERTED EXCLAMATION MARK
+ 0xA2 => '#x00A2', # CENT SIGN
+ 0xA3 => '#x00A3', # POUND SIGN
+ 0xA4 => '#x00A4', # CURRENCY SIGN
+ 0xA5 => '#x00A5', # YEN SIGN
+ 0xA6 => '#x00A6', # BROKEN BAR
+ 0xA7 => '#x00A7', # SECTION SIGN
+ 0xA8 => '#x00A8', # DIAERESIS
+ 0xA9 => '#x00A9', # COPYRIGHT SIGN
+ 0xAA => '#x00AA', # FEMININE ORDINAL INDICATOR
+ 0xAB => '#x00AB', # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xAC => '#x00AC', # NOT SIGN
+ 0xAD => '#x00AD', # SOFT HYPHEN
+ 0xAE => '#x00AE', # REGISTERED SIGN
+ 0xAF => '#x00AF', # MACRON
+ 0xB0 => '#x00B0', # DEGREE SIGN
+ 0xB1 => '#x00B1', # PLUS-MINUS SIGN
+ 0xB2 => '#x00B2', # SUPERSCRIPT TWO
+ 0xB3 => '#x00B3', # SUPERSCRIPT THREE
+ 0xB4 => '#x00B4', # ACUTE ACCENT
+ 0xB5 => '#x00B5', # MICRO SIGN
+ 0xB6 => '#x00B6', # PILCROW SIGN
+ 0xB7 => '#x00B7', # MIDDLE DOT
+ 0xB8 => '#x00B8', # CEDILLA
+ 0xB9 => '#x00B9', # SUPERSCRIPT ONE
+ 0xBA => '#x00BA', # MASCULINE ORDINAL INDICATOR
+ 0xBB => '#x00BB', # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+ 0xBC => '#x00BC', # VULGAR FRACTION ONE QUARTER
+ 0xBD => '#x00BD', # VULGAR FRACTION ONE HALF
+ 0xBE => '#x00BE', # VULGAR FRACTION THREE QUARTERS
+ 0xBF => '#x00BF', # INVERTED QUESTION MARK
+ 0xC0 => '#x00C0', # LATIN CAPITAL LETTER A WITH GRAVE
+ 0xC1 => '#x00C1', # LATIN CAPITAL LETTER A WITH ACUTE
+ 0xC2 => '#x00C2', # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ 0xC3 => '#x00C3', # LATIN CAPITAL LETTER A WITH TILDE
+ 0xC4 => '#x00C4', # LATIN CAPITAL LETTER A WITH DIAERESIS
+ 0xC5 => '#x00C5', # LATIN CAPITAL LETTER A WITH RING ABOVE
+ 0xC6 => '#x00C6', # LATIN CAPITAL LETTER AE
+ 0xC7 => '#x00C7', # LATIN CAPITAL LETTER C WITH CEDILLA
+ 0xC8 => '#x00C8', # LATIN CAPITAL LETTER E WITH GRAVE
+ 0xC9 => '#x00C9', # LATIN CAPITAL LETTER E WITH ACUTE
+ 0xCA => '#x00CA', # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+ 0xCB => '#x00CB', # LATIN CAPITAL LETTER E WITH DIAERESIS
+ 0xCC => '#x00CC', # LATIN CAPITAL LETTER I WITH GRAVE
+ 0xCD => '#x00CD', # LATIN CAPITAL LETTER I WITH ACUTE
+ 0xCE => '#x00CE', # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ 0xCF => '#x00CF', # LATIN CAPITAL LETTER I WITH DIAERESIS
+ 0xD0 => '#x011E', # LATIN CAPITAL LETTER G WITH BREVE
+ 0xD1 => '#x00D1', # LATIN CAPITAL LETTER N WITH TILDE
+ 0xD2 => '#x00D2', # LATIN CAPITAL LETTER O WITH GRAVE
+ 0xD3 => '#x00D3', # LATIN CAPITAL LETTER O WITH ACUTE
+ 0xD4 => '#x00D4', # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ 0xD5 => '#x00D5', # LATIN CAPITAL LETTER O WITH TILDE
+ 0xD6 => '#x00D6', # LATIN CAPITAL LETTER O WITH DIAERESIS
+ 0xD7 => '#x00D7', # MULTIPLICATION SIGN
+ 0xD8 => '#x00D8', # LATIN CAPITAL LETTER O WITH STROKE
+ 0xD9 => '#x00D9', # LATIN CAPITAL LETTER U WITH GRAVE
+ 0xDA => '#x00DA', # LATIN CAPITAL LETTER U WITH ACUTE
+ 0xDB => '#x00DB', # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+ 0xDC => '#x00DC', # LATIN CAPITAL LETTER U WITH DIAERESIS
+ 0xDD => '#x0130', # LATIN CAPITAL LETTER I WITH DOT ABOVE
+ 0xDE => '#x015E', # LATIN CAPITAL LETTER S WITH CEDILLA
+ 0xDF => '#x00DF', # LATIN SMALL LETTER SHARP S
+ 0xE0 => '#x00E0', # LATIN SMALL LETTER A WITH GRAVE
+ 0xE1 => '#x00E1', # LATIN SMALL LETTER A WITH ACUTE
+ 0xE2 => '#x00E2', # LATIN SMALL LETTER A WITH CIRCUMFLEX
+ 0xE3 => '#x00E3', # LATIN SMALL LETTER A WITH TILDE
+ 0xE4 => '#x00E4', # LATIN SMALL LETTER A WITH DIAERESIS
+ 0xE5 => '#x00E5', # LATIN SMALL LETTER A WITH RING ABOVE
+ 0xE6 => '#x00E6', # LATIN SMALL LETTER AE
+ 0xE7 => '#x00E7', # LATIN SMALL LETTER C WITH CEDILLA
+ 0xE8 => '#x00E8', # LATIN SMALL LETTER E WITH GRAVE
+ 0xE9 => '#x00E9', # LATIN SMALL LETTER E WITH ACUTE
+ 0xEA => '#x00EA', # LATIN SMALL LETTER E WITH CIRCUMFLEX
+ 0xEB => '#x00EB', # LATIN SMALL LETTER E WITH DIAERESIS
+ 0xEC => '#x00EC', # LATIN SMALL LETTER I WITH GRAVE
+ 0xED => '#x00ED', # LATIN SMALL LETTER I WITH ACUTE
+ 0xEE => '#x00EE', # LATIN SMALL LETTER I WITH CIRCUMFLEX
+ 0xEF => '#x00EF', # LATIN SMALL LETTER I WITH DIAERESIS
+ 0xF0 => '#x011F', # LATIN SMALL LETTER G WITH BREVE
+ 0xF1 => '#x00F1', # LATIN SMALL LETTER N WITH TILDE
+ 0xF2 => '#x00F2', # LATIN SMALL LETTER O WITH GRAVE
+ 0xF3 => '#x00F3', # LATIN SMALL LETTER O WITH ACUTE
+ 0xF4 => '#x00F4', # LATIN SMALL LETTER O WITH CIRCUMFLEX
+ 0xF5 => '#x00F5', # LATIN SMALL LETTER O WITH TILDE
+ 0xF6 => '#x00F6', # LATIN SMALL LETTER O WITH DIAERESIS
+ 0xF7 => '#x00F7', # DIVISION SIGN
+ 0xF8 => '#x00F8', # LATIN SMALL LETTER O WITH STROKE
+ 0xF9 => '#x00F9', # LATIN SMALL LETTER U WITH GRAVE
+ 0xFA => '#x00FA', # LATIN SMALL LETTER U WITH ACUTE
+ 0xFB => '#x00FB', # LATIN SMALL LETTER U WITH CIRCUMFLEX
+ 0xFC => '#x00FC', # LATIN SMALL LETTER U WITH DIAERESIS
+ 0xFD => '#x0131', # LATIN SMALL LETTER DOTLESS I
+ 0xFE => '#x015F', # LATIN SMALL LETTER S WITH CEDILLA
+ 0xFF => '#x00FF', # LATIN SMALL LETTER Y WITH DIAERESIS
+ };
+ __END__
+ # SGML-based map
+{
#--------------------------------------------------------------------------
---------------------------------------------------------------------
To sign-off this list, send email to majordomo(_at_)mhonarc(_dot_)org with the
message text UNSUBSCRIBE MHONARC-DEV