Initial Commit
This commit is contained in:
69
database/perl/lib/Encode/KR.pm
Normal file
69
database/perl/lib/Encode/KR.pm
Normal file
@@ -0,0 +1,69 @@
|
||||
package Encode::KR;
|
||||
BEGIN {
|
||||
if ( ord("A") == 193 ) {
|
||||
die "Encode::KR not supported on EBCDIC\n";
|
||||
}
|
||||
}
|
||||
use strict;
|
||||
use warnings;
|
||||
use Encode;
|
||||
our $VERSION = do { my @r = ( q$Revision: 2.3 $ =~ /\d+/g ); sprintf "%d." . "%02d" x $#r, @r };
|
||||
use XSLoader;
|
||||
XSLoader::load( __PACKAGE__, $VERSION );
|
||||
|
||||
use Encode::KR::2022_KR;
|
||||
|
||||
1;
|
||||
__END__
|
||||
|
||||
=head1 NAME
|
||||
|
||||
Encode::KR - Korean Encodings
|
||||
|
||||
=head1 SYNOPSIS
|
||||
|
||||
use Encode qw/encode decode/;
|
||||
$euc_kr = encode("euc-kr", $utf8); # loads Encode::KR implicitly
|
||||
$utf8 = decode("euc-kr", $euc_kr); # ditto
|
||||
|
||||
=head1 DESCRIPTION
|
||||
|
||||
This module implements Korean charset encodings. Encodings supported
|
||||
are as follows.
|
||||
|
||||
|
||||
Canonical Alias Description
|
||||
--------------------------------------------------------------------
|
||||
euc-kr /\beuc.*kr$/i EUC (Extended Unix Character)
|
||||
/\bkr.*euc$/i
|
||||
ksc5601-raw Korean standard code set (as is)
|
||||
cp949 /(?:x-)?uhc$/i
|
||||
/(?:x-)?windows-949$/i
|
||||
/\bks_c_5601-1987$/i
|
||||
Code Page 949 (EUC-KR + 8,822
|
||||
(additional Hangul syllables)
|
||||
MacKorean EUC-KR + Apple Vendor Mappings
|
||||
johab JOHAB A supplementary encoding defined in
|
||||
Annex 3 of KS X 1001:1998
|
||||
iso-2022-kr iso-2022-kr [RFC1557]
|
||||
--------------------------------------------------------------------
|
||||
|
||||
To find how to use this module in detail, see L<Encode>.
|
||||
|
||||
=head1 BUGS
|
||||
|
||||
When you see C<charset=ks_c_5601-1987> on mails and web pages, they really
|
||||
mean "cp949" encodings. To fix that, the following aliases are set;
|
||||
|
||||
qr/(?:x-)?uhc$/i => '"cp949"'
|
||||
qr/(?:x-)?windows-949$/i => '"cp949"'
|
||||
qr/ks_c_5601-1987$/i => '"cp949"'
|
||||
|
||||
The ASCII region (0x00-0x7f) is preserved for all encodings, even
|
||||
though this conflicts with mappings by the Unicode Consortium.
|
||||
|
||||
=head1 SEE ALSO
|
||||
|
||||
L<Encode>
|
||||
|
||||
=cut
|
||||
Reference in New Issue
Block a user