Commit | Line | Data |
---|---|---|
5129552c JH |
1 | package Encode::Byte; |
2 | use Encode; | |
48e3bbdd | 3 | our $VERSION = do { my @r = (q$Revision: 1.0 $ =~ /\d+/g); sprintf "%d."."%02d" x $#r, @r }; |
5129552c JH |
4 | |
5 | use XSLoader; | |
6 | XSLoader::load('Encode::Byte',$VERSION); | |
7 | ||
8 | 1; | |
9 | __END__ | |
48e3bbdd | 10 | |
5129552c JH |
11 | =head1 NAME |
12 | ||
13 | Encode::Byte - Single Byte Encodings | |
14 | ||
15 | =head1 SYNOPSIS | |
16 | ||
17 | use Encode qw/encode decode/; | |
18 | $latin1 = encode("iso-8859-1", $utf8); # loads Encode::Byte implicitly | |
19 | $utf8 = decode("iso-8859-1", $latin1); # ditto | |
20 | ||
21 | =head1 ABSTRACT | |
22 | ||
23 | This module implements various single-byte encodings. In most cases it uses | |
24 | \x80-\xff (upper half) to map non-ASCII characters. The supported encodings | |
25 | are as follows. | |
26 | ||
27 | Canonical Alias Description | |
28 | -------------------------------------------------------------------- | |
48e3bbdd NIS |
29 | # ISO 8859 series |
30 | (iso-8859-1 is built in) | |
31 | iso-8859-2 latin2 [ISO] | |
32 | iso-8859-3 latin3 [ISO] | |
33 | iso-8859-4 latin4 [ISO] | |
34 | iso-8859-5 [ISO] | |
35 | iso-8859-6 [ISO] | |
36 | iso-8859-7 [ISO] | |
37 | iso-8859-8 [ISO] | |
38 | iso-8859-9 latin5 [ISO] | |
39 | iso-8859-10 latin6 [ISO] | |
5129552c JH |
40 | iso-8859-11 |
41 | (iso-8859-12 is nonexistent) | |
48e3bbdd NIS |
42 | iso-8859-13 latin7 [ISO] |
43 | iso-8859-14 latin8 [ISO] | |
44 | iso-8859-15 latin9 [ISO] | |
45 | iso-8859-16 latin10 [ISO] | |
46 | ||
47 | # Cyrillic | |
48 | koi8-f | |
49 | koi8-r [RFC1489] | |
50 | koi8-u [RFC2319] | |
51 | ||
52 | # Vietnamese | |
53 | viscii | |
54 | ||
55 | # all cp* are also available as ibm-*, ms-*, and windows-* | |
56 | # also see L<http://msdn.microsoft.com/workshop/author/dhtml/reference/charsets/charset4.asp> | |
57 | cp1250 WinLatin2 | |
58 | cp1251 WinCyrillic | |
59 | cp1252 WinLatin1 | |
60 | cp1253 WinGreek | |
61 | cp1254 WinTurkish | |
62 | cp1255 WinHebrew | |
63 | cp1256 WinArabic | |
64 | cp1257 WinBaltic | |
65 | cp1258 WinVietnamese | |
66 | ||
67 | # Macintosh | |
68 | # Also see L<http://developer.apple.com/technotes/tn/tn1150.html> | |
69 | MacCentralEurRoman | |
70 | MacCroatian | |
71 | MacRoman | |
72 | MacCyrillic | |
73 | MacRomanian | |
74 | MacSami | |
75 | MacGreek | |
76 | MacThai | |
77 | MacIcelandic | |
78 | MacTurkish | |
79 | MacUkrainian | |
80 | ||
81 | # More vendor encodings | |
82 | nextstep | |
83 | gsm0338 # used in GSM handsets | |
84 | hp-roman8 | |
5129552c JH |
85 | |
86 | =head1 DESCRIPTION | |
87 | ||
88 | To find out how to use this module in detail, see L<Encode>. | |
89 | ||
90 | =head1 SEE ALSO | |
91 | ||
92 | L<Encode> | |
93 | ||
94 | =cut |