Update of /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc
In directory subversions:/tmp/cvs-serv25158/lib/MHonArc
Modified Files:
CharEnt.pm
Log Message:
* Added CHARSETALIASES resource to define aliases for official
charset names.
* MHonArc::CharEnt:
+ Several charset mappings added to MHonArc::CharEnt with the
default value for CHARSETCONVERTERS updated to reflect the new
mappings: various Cyrillic sets, VISCII, Apple-based charsets, etc.
Sets that have bidirectional rendering (Hebrew, Arabic) exist,
but directional reordering for rendering is currently not supported.
. Some existing mappings have been updated to use Unicode numeric
character entity references (&#xHHHH;) instead of standard SGML
character entity references (e.g. &AElig;). Most, if not all,
web browsers only support the set of SGML entity references
defined in the HTML 4.0 specification.
All existing tables should now generate entity references
recognized by all HTML 4.0 compliant browsers.
Index: CharEnt.pm
===================================================================
RCS file: /cvsroot/mhonarc/mhonarc/MHonArc/lib/MHonArc/CharEnt.pm,v
retrieving revision 1.3
retrieving revision 1.4
diff -C2 -r1.3 -r1.4
*** CharEnt.pm 13 Apr 2002 00:58:09 -0000 1.3
--- CharEnt.pm 17 Nov 2002 03:38:53 -0000 1.4
***************
*** 66,102 ****
my %CharsetMaps = (
! 'iso-8859-1' => 'MHonArc/CharEnt/ISO8859_1.pm',
! 'iso-8859-2' => 'MHonArc/CharEnt/ISO8859_2.pm',
! 'iso-8859-3' => 'MHonArc/CharEnt/ISO8859_3.pm',
! 'iso-8859-4' => 'MHonArc/CharEnt/ISO8859_4.pm',
! 'iso-8859-5' => 'MHonArc/CharEnt/ISO8859_5.pm',
! 'iso-8859-6' => 'MHonArc/CharEnt/ISO8859_6.pm',
! 'iso-8859-7' => 'MHonArc/CharEnt/ISO8859_7.pm',
! 'iso-8859-8' => 'MHonArc/CharEnt/ISO8859_8.pm',
! 'iso-8859-9' => 'MHonArc/CharEnt/ISO8859_9.pm',
! 'iso-8859-10' => 'MHonArc/CharEnt/ISO8859_10.pm',
! 'iso-8859-15' => 'MHonArc/CharEnt/ISO8859_15.pm',
! 'latin1' => 'MHonArc/CharEnt/ISO8859_1.pm',
! 'latin2' => 'MHonArc/CharEnt/ISO8859_2.pm',
! 'latin3' => 'MHonArc/CharEnt/ISO8859_3.pm',
! 'latin4' => 'MHonArc/CharEnt/ISO8859_4.pm',
! 'latin5' => 'MHonArc/CharEnt/ISO8859_9.pm',
! 'latin6' => 'MHonArc/CharEnt/ISO8859_10.pm',
! 'latin9' => 'MHonArc/CharEnt/ISO8859_15.pm',
! 'windows-1250'=> 'MHonArc/CharEnt/CP1250.pm',
! 'windows-1252'=> 'MHonArc/CharEnt/CP1252.pm',
);
my %ReverseCharsetMaps = (
! 'iso-8859-1' => 'MHonArc/CharEnt/ISO8859_1R.pm',
! 'iso-8859-3' => 'MHonArc/CharEnt/ISO8859_3R.pm',
! 'iso-8859-7' => 'MHonArc/CharEnt/ISO8859_7R.pm',
! 'iso-8859-8' => 'MHonArc/CharEnt/ISO8859_8R.pm',
! 'iso-8859-9' => 'MHonArc/CharEnt/ISO8859_9R.pm',
! 'iso-8859-15' => 'MHonArc/CharEnt/ISO8859_15R.pm',
! 'latin1' => 'MHonArc/CharEnt/ISO8859_1R.pm',
! 'latin3' => 'MHonArc/CharEnt/ISO8859_3R.pm',
! 'latin5' => 'MHonArc/CharEnt/ISO8859_9R.pm',
! 'latin9' => 'MHonArc/CharEnt/ISO8859_15R.pm',
);
--- 66,123 ----
my %CharsetMaps = (
! 'iso-8859-1' => 'MHonArc/CharEnt/ISO8859_1.pm',
! 'iso-8859-2' => 'MHonArc/CharEnt/ISO8859_2.pm',
! 'iso-8859-3' => 'MHonArc/CharEnt/ISO8859_3.pm',
! 'iso-8859-4' => 'MHonArc/CharEnt/ISO8859_4.pm',
! 'iso-8859-5' => 'MHonArc/CharEnt/ISO8859_5.pm',
! 'iso-8859-6' => 'MHonArc/CharEnt/ISO8859_6.pm',
! 'iso-8859-7' => 'MHonArc/CharEnt/ISO8859_7.pm',
! 'iso-8859-8' => 'MHonArc/CharEnt/ISO8859_8.pm',
! 'iso-8859-9' => 'MHonArc/CharEnt/ISO8859_9.pm',
! 'iso-8859-10' => 'MHonArc/CharEnt/ISO8859_10.pm',
! 'iso-8859-11' => 'MHonArc/CharEnt/ISO8859_11.pm',
! 'iso-8859-13' => 'MHonArc/CharEnt/ISO8859_13.pm',
! 'iso-8859-14' => 'MHonArc/CharEnt/ISO8859_14.pm',
! 'iso-8859-15' => 'MHonArc/CharEnt/ISO8859_15.pm',
! 'iso-8859-16' => 'MHonArc/CharEnt/ISO8859_16.pm',
! 'cp1250' => 'MHonArc/CharEnt/CP1250.pm',
! 'cp1251' => 'MHonArc/CharEnt/CP1251.pm',
! 'cp1252' => 'MHonArc/CharEnt/CP1252.pm',
! 'cp1253' => 'MHonArc/CharEnt/CP1253.pm',
! 'cp1254' => 'MHonArc/CharEnt/CP1254.pm',
! 'cp1255' => 'MHonArc/CharEnt/CP1255.pm',
! 'cp1256' => 'MHonArc/CharEnt/CP1256.pm',
! 'cp1257' => 'MHonArc/CharEnt/CP1257.pm',
! 'cp1258' => 'MHonArc/CharEnt/CP1258.pm',
! 'koi-0' => 'MHonArc/CharEnt/KOI_0.pm',
! 'koi-7' => 'MHonArc/CharEnt/KOI_7.pm',
! 'koi8-a' => 'MHonArc/CharEnt/KOI8_A.pm',
! 'koi8-b' => 'MHonArc/CharEnt/KOI8_B.pm',
! 'koi8-e' => 'MHonArc/CharEnt/KOI8_E.pm',
! 'koi8-f' => 'MHonArc/CharEnt/KOI8_F.pm',
! 'koi8-r' => 'MHonArc/CharEnt/KOI8_R.pm',
! 'koi8-u' => 'MHonArc/CharEnt/KOI8_U.pm',
! 'gost19768-87' => 'MHonArc/CharEnt/GOST19768_87.pm',
! 'viscii' => 'MHonArc/CharEnt/VISCII.pm',
! 'apple-arabic' => 'MHonArc/CharEnt/AppleArabic.pm',
! 'apple-centeuro' => 'MHonArc/CharEnt/AppleCenteuro.pm',
! 'apple-croatian' => 'MHonArc/CharEnt/AppleCroatian.pm',
! 'apple-cyrillic' => 'MHonArc/CharEnt/AppleCyrillic.pm',
! 'apple-greek' => 'MHonArc/CharEnt/AppleGreek.pm',
! 'apple-hebrew' => 'MHonArc/CharEnt/AppleHebrew.pm',
! 'apple-iceland' => 'MHonArc/CharEnt/AppleIceland.pm',
! 'apple-romanian' => 'MHonArc/CharEnt/AppleRomanian.pm',
! 'apple-roman' => 'MHonArc/CharEnt/AppleRoman.pm',
! 'apple-thai' => 'MHonArc/CharEnt/AppleThai.pm',
! 'apple-turkish' => 'MHonArc/CharEnt/AppleTurkish.pm',
);
my %ReverseCharsetMaps = (
! 'iso-8859-1' => 'MHonArc/CharEnt/ISO8859_1R.pm',
! 'iso-8859-3' => 'MHonArc/CharEnt/ISO8859_3R.pm',
! 'iso-8859-7' => 'MHonArc/CharEnt/ISO8859_7R.pm',
! 'iso-8859-8' => 'MHonArc/CharEnt/ISO8859_8R.pm',
! 'iso-8859-9' => 'MHonArc/CharEnt/ISO8859_9R.pm',
! 'iso-8859-15' => 'MHonArc/CharEnt/ISO8859_15R.pm',
);
***************
*** 135,139 ****
$ret .= pack("C", $char);
} elsif ($map->{$char}) {
! $ret .= join('', '&', $map->{$char}, ';');
} elsif ($ASCIIMap{$char}) {
$ret .= join('', '&', $ASCIIMap{$char}, ';');
--- 156,162 ----
$ret .= pack("C", $char);
} elsif ($map->{$char}) {
! $ret .= ref($map->{$char}) ?
! join('', map { '&'.$_.';' } @{$map->{$char}}) :
! join('', '&', $map->{$char}, ';');
} elsif ($ASCIIMap{$char}) {
$ret .= join('', '&', $ASCIIMap{$char}, ';');
***************
*** 203,206 ****
--- 226,230 ----
$map = _load_charmap($charset);
}
+ # XXX: Does not handle list values!
$map = $ent2char_maps{$charset} = { reverse %$map };
***************
*** 220,222 ****
##---------------------------------------------------------------------------##
1;
-
--- 244,245 ----
---------------------------------------------------------------------
To sign-off this list, send email to majordomo(_at_)mhonarc(_dot_)org with the
message text UNSUBSCRIBE MHONARC-DEV