mhonarc-commits
[Top] [All Lists]

CVS: mhonarc/MHonArc/lib/MHonArc/CharEnt HP_ROMAN8.pm,NONE,1.1 AppleRomania...

2002-12-17 22:39:04
Update of /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt
In directory subversions:/tmp/cvs-serv25303/CharEnt

Modified Files:
	AppleRomanian.pm KOI8_U.pm 
Added Files:
	HP_ROMAN8.pm 
Log Message:
* MHonArc::UTF8 redesigned: Auto-checks for Encode and Unicode::MapUTF8.
  Also utf8 support code added for perl installations that do not
  have either module installed.

  Wrapper modules are provided for each implementation, so, in theory,
  they can be referenced directly, but MHonArc::UTF8 is designed to
  be used directly for CHARSETCONVERTERS and TEXTCLIPFUNC resources.

* Text encoding functions for MHonArc::UTF8::* modules have been
  added to support soon-to-be TEXTENCODE and TEXTENCODERFUNC resources
  for utf8 encoding of all text entities.

* Added MHonArc::{Char,CharMaps} and MHonArc::Char::{JP,KR} to encapsulate
  common code.

* Added MHonArc::Encode to support soon-to-be TEXTENCODE and
  TEXTENCODERFUNC resources for arbitrary character encoding of all
  text entities.  Requires either the Encode or Unicode::MapUTF8 module
  to be installed.

* Added hp-roman8 support.

* Added mapping of copyright symbol in koi8-u.


--- NEW FILE ---

package MHonArc::CharEnt::HP_ROMAN8;

# Character map for the HP Roman-8 (hp-roman8) character set.
#
# The last statement of this file is an anonymous hash reference, so that
# hash is the value produced when the file is evaluated (e.g. via do/require).
# Each key is one raw high-half HP Roman-8 character; each value is the
# replacement for it, identified by the Unicode character name in the
# trailing comment.  Entries are listed in ascending key order.
#
# NOTE(review): how the rest of MHonArc loads and consumes this table is not
# visible from this file -- confirm against the CharEnt loader.

+{
  #--------------------------------------------------------------------------
  # Raw Text    Entity Ref      # Description
  #--------------------------------------------------------------------------
    '¡' =>	'À',	# LATIN CAPITAL LETTER A WITH GRAVE
    '¢' =>	'Â',	# LATIN CAPITAL LETTER A WITH CIRCUMFLEX
    '£' =>	'È',	# LATIN CAPITAL LETTER E WITH GRAVE
    '¤' =>	'Ê',	# LATIN CAPITAL LETTER E WITH CIRCUMFLEX
    '¥' =>	'Ë',	# LATIN CAPITAL LETTER E WITH DIAERESIS
    '¦' =>	'Î',	# LATIN CAPITAL LETTER I WITH CIRCUMFLEX
    '§' =>	'Ï',	# LATIN CAPITAL LETTER I WITH DIAERESIS
    '¨' =>	'´',	# ACUTE ACCENT
    '©' =>	'ˋ',	# MODIFIER LETTER GRAVE ACCENT
    'ª' =>	'ˆ',	# MODIFIER LETTER CIRCUMFLEX ACCENT
    '«' =>	'¨',	# DIAERESIS
    '¬' =>	'˜',	# SMALL TILDE
    '­' =>	'Ù',	# LATIN CAPITAL LETTER U WITH GRAVE
    '®' =>	'Û',	# LATIN CAPITAL LETTER U WITH CIRCUMFLEX
    '¯' =>	'₤',	# LIRA SIGN
    '°' =>	'¯',	# MACRON
    '±' =>	'Ý',	# LATIN CAPITAL LETTER Y WITH ACUTE
    '²' =>	'ý',	# LATIN SMALL LETTER Y WITH ACUTE
    '³' =>	'°',	# DEGREE SIGN
    '´' =>	'Ç',	# LATIN CAPITAL LETTER C WITH CEDILLA
    'µ' =>	'ç',	# LATIN SMALL LETTER C WITH CEDILLA
    '¶' =>	'Ñ',	# LATIN CAPITAL LETTER N WITH TILDE
    '·' =>	'ñ',	# LATIN SMALL LETTER N WITH TILDE
    '¸' =>	'¡',	# INVERTED EXCLAMATION MARK
    '¹' =>	'¿',	# INVERTED QUESTION MARK
    'º' =>	'¤',	# CURRENCY SIGN
    '»' =>	'£',	# POUND SIGN
    '¼' =>	'¥',	# YEN SIGN
    '½' =>	'§',	# SECTION SIGN
    '¾' =>	'ƒ',	# LATIN SMALL LETTER F WITH HOOK
    '¿' =>	'¢',	# CENT SIGN
    'À' =>	'â',	# LATIN SMALL LETTER A WITH CIRCUMFLEX
    'Á' =>	'ê',	# LATIN SMALL LETTER E WITH CIRCUMFLEX
    'Â' =>	'ô',	# LATIN SMALL LETTER O WITH CIRCUMFLEX
    'Ã' =>	'û',	# LATIN SMALL LETTER U WITH CIRCUMFLEX
    'Ä' =>	'á',	# LATIN SMALL LETTER A WITH ACUTE
    'Å' =>	'é',	# LATIN SMALL LETTER E WITH ACUTE
    'Æ' =>	'ó',	# LATIN SMALL LETTER O WITH ACUTE
    'Ç' =>	'ú',	# LATIN SMALL LETTER U WITH ACUTE
    'È' =>	'à',	# LATIN SMALL LETTER A WITH GRAVE
    'É' =>	'è',	# LATIN SMALL LETTER E WITH GRAVE
    'Ê' =>	'ò',	# LATIN SMALL LETTER O WITH GRAVE
    'Ë' =>	'ù',	# LATIN SMALL LETTER U WITH GRAVE
    'Ì' =>	'ä',	# LATIN SMALL LETTER A WITH DIAERESIS
    'Í' =>	'ë',	# LATIN SMALL LETTER E WITH DIAERESIS
    'Î' =>	'ö',	# LATIN SMALL LETTER O WITH DIAERESIS
    'Ï' =>	'ü',	# LATIN SMALL LETTER U WITH DIAERESIS
    'Ð' =>	'Å',	# LATIN CAPITAL LETTER A WITH RING ABOVE
    'Ñ' =>	'î',	# LATIN SMALL LETTER I WITH CIRCUMFLEX
    'Ò' =>	'Ø',	# LATIN CAPITAL LETTER O WITH STROKE
    'Ó' =>	'Æ',	# LATIN CAPITAL LETTER AE
    'Ô' =>	'å',	# LATIN SMALL LETTER A WITH RING ABOVE
    'Õ' =>	'í',	# LATIN SMALL LETTER I WITH ACUTE
    'Ö' =>	'ø',	# LATIN SMALL LETTER O WITH STROKE
    '×' =>	'æ',	# LATIN SMALL LETTER AE
    'Ø' =>	'Ä',	# LATIN CAPITAL LETTER A WITH DIAERESIS
    'Ù' =>	'ì',	# LATIN SMALL LETTER I WITH GRAVE
    'Ú' =>	'Ö',	# LATIN CAPITAL LETTER O WITH DIAERESIS
    'Û' =>	'Ü',	# LATIN CAPITAL LETTER U WITH DIAERESIS
    'Ü' =>	'É',	# LATIN CAPITAL LETTER E WITH ACUTE
    'Ý' =>	'ï',	# LATIN SMALL LETTER I WITH DIAERESIS
    'Þ' =>	'ß',	# LATIN SMALL LETTER SHARP S
    'ß' =>	'Ô',	# LATIN CAPITAL LETTER O WITH CIRCUMFLEX
    'à' =>	'Á',	# LATIN CAPITAL LETTER A WITH ACUTE
    'á' =>	'Ã',	# LATIN CAPITAL LETTER A WITH TILDE
    'â' =>	'ã',	# LATIN SMALL LETTER A WITH TILDE
    'ã' =>	'Ð',	# LATIN CAPITAL LETTER ETH
    'ä' =>	'ð',	# LATIN SMALL LETTER ETH
    'å' =>	'Í',	# LATIN CAPITAL LETTER I WITH ACUTE
    'æ' =>	'Ì',	# LATIN CAPITAL LETTER I WITH GRAVE
    'ç' =>	'Ó',	# LATIN CAPITAL LETTER O WITH ACUTE
    'è' =>	'Ò',	# LATIN CAPITAL LETTER O WITH GRAVE
    'é' =>	'Õ',	# LATIN CAPITAL LETTER O WITH TILDE
    'ê' =>	'õ',	# LATIN SMALL LETTER O WITH TILDE
    'ë' =>	'Š',	# LATIN CAPITAL LETTER S WITH CARON
    'ì' =>	'š',	# LATIN SMALL LETTER S WITH CARON
    'í' =>	'Ú',	# LATIN CAPITAL LETTER U WITH ACUTE
    'î' =>	'Ÿ',	# LATIN CAPITAL LETTER Y WITH DIAERESIS
    # 0xEF is where HP Roman-8 places y-diaeresis; this entry was missing,
    # leaving that byte unmapped.
    'ï' =>	'ÿ',	# LATIN SMALL LETTER Y WITH DIAERESIS
    'ð' =>	'Þ',	# LATIN CAPITAL LETTER THORN
    'ñ' =>	'þ',	# LATIN SMALL LETTER THORN
    'ò' =>	'·',	# MIDDLE DOT
    'ó' =>	'µ',	# MICRO SIGN
    'ô' =>	'¶',	# PILCROW SIGN
    'õ' =>	'¾',	# VULGAR FRACTION THREE QUARTERS
    'ö' =>	'—',	# EM DASH
    '÷' =>	'¼',	# VULGAR FRACTION ONE QUARTER
    'ø' =>	'½',	# VULGAR FRACTION ONE HALF
    'ù' =>	'ª',	# FEMININE ORDINAL INDICATOR
    'ú' =>	'º',	# MASCULINE ORDINAL INDICATOR
    'û' =>	'«',	# LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    'ü' =>	'■',	# BLACK SQUARE
    'ý' =>	'»',	# RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    'þ' =>	'±',	# PLUS-MINUS SIGN
    # 0xFF is unassigned in the RFC 1345 hp-roman8 table; this pre-existing
    # entry is retained so input containing that byte is handled as before.
    'ÿ' =>	'ÿ',	# LATIN SMALL LETTER Y WITH DIAERESIS
};

Index: AppleRomanian.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/AppleRomanian.pm,v
retrieving revision 1.2
retrieving revision 1.3
diff -C2 -r1.2 -r1.3
*** AppleRomanian.pm	3 Dec 2002 06:00:55 -0000	1.2
--- AppleRomanian.pm	18 Dec 2002 05:38:43 -0000	1.3
***************
*** 54,58 ****
      '­' =>	'≠',	# NOT EQUAL TO
      '®' =>	'Ă',	# LATIN CAPITAL LETTER A WITH BREVE
!     '¯' =>	'S', '̦',	# LATIN CAPITAL LETTER S + COMBINING COMMA BELOW
      '°' =>	'∞',	# INFINITY
      '±' =>	'±',	# PLUS-MINUS SIGN
--- 54,58 ----
      '­' =>	'≠',	# NOT EQUAL TO
      '®' =>	'Ă',	# LATIN CAPITAL LETTER A WITH BREVE
!     '¯' =>	'Ș',	# LATIN CAPITAL LETTER S + COMBINING COMMA BELOW
      '°' =>	'∞',	# INFINITY
      '±' =>	'±',	# PLUS-MINUS SIGN

Index: KOI8_U.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt/KOI8_U.pm,v
retrieving revision 1.2
retrieving revision 1.3
diff -C2 -r1.2 -r1.3
*** KOI8_U.pm	3 Dec 2002 06:00:57 -0000	1.2
--- KOI8_U.pm	18 Dec 2002 05:38:43 -0000	1.3
***************
*** 1,8 ****
  
! package MHonArc::CharEnt::KOI8_U;
  
  +{
    #--------------------------------------------------------------------------
!   # Hex Code    Entity Ref      # ISO external entity and description
    #--------------------------------------------------------------------------
      '€' =>	'─',	# BOX DRAWINGS LIGHT HORIZONTAL
--- 1,8 ----
  
! package MHonArc::CharEnt::KOI_8;
  
  +{
    #--------------------------------------------------------------------------
!   # Raw Text    Entity Ref      # Description
    #--------------------------------------------------------------------------
      '€' =>	'─',	# BOX DRAWINGS LIGHT HORIZONTAL
***************
*** 69,72 ****
--- 69,73 ----
      '½' =>	'Ґ',	# CYRILLIC CAPITAL LETTER GHE WITH UPTURN
      '¾' =>	'╬',	# BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL
+     '¿' =>	'©',	# COPYRIGHT SIGN
      'À' =>	'ю',	# CYRILLIC SMALL LETTER YU
      'Á' =>	'а',	# CYRILLIC SMALL LETTER A

---------------------------------------------------------------------
To sign-off this list, send email to majordomo(_at_)mhonarc(_dot_)org with the
message text UNSUBSCRIBE MHONARC-DEV