mhonarc-commits
[Top] [All Lists]

CVS: mhonarc/MHonArc/lib/MHonArc CharEnt.pm,1.3,1.4

2002-11-16 20:39:29
Update of /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc
In directory subversions:/tmp/cvs-serv25158/lib/MHonArc

Modified Files:
	CharEnt.pm 
Log Message:
* Added CHARSETALIASES resource to define aliases for official
  charset names.
* MHonArc::CharEnt:
  + Several charset mappings added to MHonArc::CharEnt with the
    default value for CHARSETCONVERTERS updated to reflect the new
    mappings: various Cyrillic sets, VISCII, Apple-based charsets, etc.
    Sets that require bidirectional rendering (Hebrew, Arabic) are included,
    but directional re-ordering for rendering is currently not supported.
  . Some existing mappings have been updated to use Unicode numeric
    character entity references (&#xHHHH;) instead of standard SGML
    character entity references (e.g. &AElig;).  Most, if not all,
    web browsers only support the set of SGML entity references
    defined in the HTML 4.0 specification.

    All existing tables should now generate entity references
    recognized by all HTML 4.0 compliant browsers.


Index: CharEnt.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt.pm,v
retrieving revision 1.3
retrieving revision 1.4
diff -C2 -r1.3 -r1.4
*** CharEnt.pm	13 Apr 2002 00:58:09 -0000	1.3
--- CharEnt.pm	17 Nov 2002 03:38:53 -0000	1.4
***************
*** 66,102 ****
  
  my %CharsetMaps = (
!     'iso-8859-1'  =>	'MHonArc/CharEnt/ISO8859_1.pm',
!     'iso-8859-2'  =>	'MHonArc/CharEnt/ISO8859_2.pm',
!     'iso-8859-3'  =>	'MHonArc/CharEnt/ISO8859_3.pm',
!     'iso-8859-4'  =>	'MHonArc/CharEnt/ISO8859_4.pm',
!     'iso-8859-5'  =>	'MHonArc/CharEnt/ISO8859_5.pm',
!     'iso-8859-6'  =>	'MHonArc/CharEnt/ISO8859_6.pm',
!     'iso-8859-7'  =>	'MHonArc/CharEnt/ISO8859_7.pm',
!     'iso-8859-8'  =>	'MHonArc/CharEnt/ISO8859_8.pm',
!     'iso-8859-9'  =>	'MHonArc/CharEnt/ISO8859_9.pm',
!     'iso-8859-10' =>	'MHonArc/CharEnt/ISO8859_10.pm',
!     'iso-8859-15' =>	'MHonArc/CharEnt/ISO8859_15.pm',
!     'latin1'      =>	'MHonArc/CharEnt/ISO8859_1.pm',
!     'latin2'      =>	'MHonArc/CharEnt/ISO8859_2.pm',
!     'latin3'      =>	'MHonArc/CharEnt/ISO8859_3.pm',
!     'latin4'      =>	'MHonArc/CharEnt/ISO8859_4.pm',
!     'latin5'      =>	'MHonArc/CharEnt/ISO8859_9.pm',
!     'latin6'      =>	'MHonArc/CharEnt/ISO8859_10.pm',
!     'latin9'      =>	'MHonArc/CharEnt/ISO8859_15.pm',
!     'windows-1250'=>	'MHonArc/CharEnt/CP1250.pm',
!     'windows-1252'=>	'MHonArc/CharEnt/CP1252.pm',
  );
  
  my %ReverseCharsetMaps = (
!     'iso-8859-1'  =>	'MHonArc/CharEnt/ISO8859_1R.pm',
!     'iso-8859-3'  =>	'MHonArc/CharEnt/ISO8859_3R.pm',
!     'iso-8859-7'  =>	'MHonArc/CharEnt/ISO8859_7R.pm',
!     'iso-8859-8'  =>	'MHonArc/CharEnt/ISO8859_8R.pm',
!     'iso-8859-9'  =>	'MHonArc/CharEnt/ISO8859_9R.pm',
!     'iso-8859-15' =>	'MHonArc/CharEnt/ISO8859_15R.pm',
!     'latin1'      =>	'MHonArc/CharEnt/ISO8859_1R.pm',
!     'latin3'      =>	'MHonArc/CharEnt/ISO8859_3R.pm',
!     'latin5'      =>	'MHonArc/CharEnt/ISO8859_9R.pm',
!     'latin9'      =>	'MHonArc/CharEnt/ISO8859_15R.pm',
  );
  
--- 66,123 ----
  
  my %CharsetMaps = (
!     'iso-8859-1'     =>	'MHonArc/CharEnt/ISO8859_1.pm',
!     'iso-8859-2'     =>	'MHonArc/CharEnt/ISO8859_2.pm',
!     'iso-8859-3'     =>	'MHonArc/CharEnt/ISO8859_3.pm',
!     'iso-8859-4'     =>	'MHonArc/CharEnt/ISO8859_4.pm',
!     'iso-8859-5'     =>	'MHonArc/CharEnt/ISO8859_5.pm',
!     'iso-8859-6'     =>	'MHonArc/CharEnt/ISO8859_6.pm',
!     'iso-8859-7'     =>	'MHonArc/CharEnt/ISO8859_7.pm',
!     'iso-8859-8'     =>	'MHonArc/CharEnt/ISO8859_8.pm',
!     'iso-8859-9'     =>	'MHonArc/CharEnt/ISO8859_9.pm',
!     'iso-8859-10'    =>	'MHonArc/CharEnt/ISO8859_10.pm',
!     'iso-8859-11'    =>	'MHonArc/CharEnt/ISO8859_11.pm',
!     'iso-8859-13'    =>	'MHonArc/CharEnt/ISO8859_13.pm',
!     'iso-8859-14'    =>	'MHonArc/CharEnt/ISO8859_14.pm',
!     'iso-8859-15'    =>	'MHonArc/CharEnt/ISO8859_15.pm',
!     'iso-8859-16'    =>	'MHonArc/CharEnt/ISO8859_16.pm',
!     'cp1250'	     =>	'MHonArc/CharEnt/CP1250.pm',
!     'cp1251'	     =>	'MHonArc/CharEnt/CP1251.pm',
!     'cp1252'	     =>	'MHonArc/CharEnt/CP1252.pm',
!     'cp1253'	     =>	'MHonArc/CharEnt/CP1253.pm',
!     'cp1254'	     =>	'MHonArc/CharEnt/CP1254.pm',
!     'cp1255'	     =>	'MHonArc/CharEnt/CP1255.pm',
!     'cp1256'	     =>	'MHonArc/CharEnt/CP1256.pm',
!     'cp1257'	     =>	'MHonArc/CharEnt/CP1257.pm',
!     'cp1258'	     =>	'MHonArc/CharEnt/CP1258.pm',
!     'koi-0'	     =>	'MHonArc/CharEnt/KOI_0.pm',
!     'koi-7'	     =>	'MHonArc/CharEnt/KOI_7.pm',
!     'koi8-a'	     =>	'MHonArc/CharEnt/KOI8_A.pm',
!     'koi8-b'	     =>	'MHonArc/CharEnt/KOI8_B.pm',
!     'koi8-e'	     =>	'MHonArc/CharEnt/KOI8_E.pm',
!     'koi8-f'	     =>	'MHonArc/CharEnt/KOI8_F.pm',
!     'koi8-r'	     =>	'MHonArc/CharEnt/KOI8_R.pm',
!     'koi8-u'	     =>	'MHonArc/CharEnt/KOI8_U.pm',
!     'gost19768-87'   =>	'MHonArc/CharEnt/GOST19768_87.pm',
!     'viscii'	     =>	'MHonArc/CharEnt/VISCII.pm',
!     'apple-arabic'   =>	'MHonArc/CharEnt/AppleArabic.pm',
!     'apple-centeuro' =>	'MHonArc/CharEnt/AppleCenteuro.pm',
!     'apple-croatian' =>	'MHonArc/CharEnt/AppleCroatian.pm',
!     'apple-cyrillic' =>	'MHonArc/CharEnt/AppleCyrillic.pm',
!     'apple-greek'    =>	'MHonArc/CharEnt/AppleGreek.pm',
!     'apple-hebrew'   =>	'MHonArc/CharEnt/AppleHebrew.pm',
!     'apple-iceland'  =>	'MHonArc/CharEnt/AppleIceland.pm',
!     'apple-romanian' =>	'MHonArc/CharEnt/AppleRomanian.pm',
!     'apple-roman'    =>	'MHonArc/CharEnt/AppleRoman.pm',
!     'apple-thai'     =>	'MHonArc/CharEnt/AppleThai.pm',
!     'apple-turkish'  =>	'MHonArc/CharEnt/AppleTurkish.pm',
  );
  
  my %ReverseCharsetMaps = (
!     'iso-8859-1'     =>	'MHonArc/CharEnt/ISO8859_1R.pm',
!     'iso-8859-3'     =>	'MHonArc/CharEnt/ISO8859_3R.pm',
!     'iso-8859-7'     =>	'MHonArc/CharEnt/ISO8859_7R.pm',
!     'iso-8859-8'     =>	'MHonArc/CharEnt/ISO8859_8R.pm',
!     'iso-8859-9'     =>	'MHonArc/CharEnt/ISO8859_9R.pm',
!     'iso-8859-15'    =>	'MHonArc/CharEnt/ISO8859_15R.pm',
  );
  
***************
*** 135,139 ****
  	    $ret .= pack("C", $char);
  	} elsif ($map->{$char}) {
! 	    $ret .= join('', '&', $map->{$char}, ';');
  	} elsif ($ASCIIMap{$char}) {
  	    $ret .= join('', '&', $ASCIIMap{$char}, ';');
--- 156,162 ----
  	    $ret .= pack("C", $char);
  	} elsif ($map->{$char}) {
! 	    $ret .= ref($map->{$char}) ?
! 			join('', map { '&'.$_.';' } @{$map->{$char}}) :
! 			join('', '&', $map->{$char}, ';');
  	} elsif ($ASCIIMap{$char}) {
  	    $ret .= join('', '&', $ASCIIMap{$char}, ';');
***************
*** 203,206 ****
--- 226,230 ----
  	  $map = _load_charmap($charset);
        }
+       # XXX: Does not handle list values!
        $map = $ent2char_maps{$charset} = { reverse %$map };
  
***************
*** 220,222 ****
  ##---------------------------------------------------------------------------##
  1;
- 
--- 244,245 ----

---------------------------------------------------------------------
To sign-off this list, send email to majordomo(_at_)mhonarc(_dot_)org with the
message text UNSUBSCRIBE MHONARC-DEV