This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
NetWare updates from C Aditya.
[perl5.git] / ext / Encode / t / guess.t
CommitLineData
af1f55d9
JH
1BEGIN {
2 if ($ENV{'PERL_CORE'}){
3 chdir 't';
4 unshift @INC, '../lib';
5 }
6 require Config; import Config;
7 if ($Config{'extensions'} !~ /\bEncode\b/) {
8 print "1..0 # Skip: Encode was not built\n";
9 exit 0;
10 }
11 $| = 1;
12}
13
14use strict;
15use File::Basename;
16use File::Spec;
17use Encode qw(decode encode find_encoding _utf8_off);
18
19#use Test::More qw(no_plan);
7e19fb92 20use Test::More tests => 17;
af1f55d9
JH
21use_ok("Encode::Guess");
22{
23 no warnings;
24 $Encode::Guess::DEBUG = shift || 0;
25}
26
27my $ascii = join('' => map {chr($_)}(0x21..0x7e));
28my $latin1 = join('' => map {chr($_)}(0xa1..0xfe));
29my $utf8on = join('' => map {chr($_)}(0x3000..0x30fe));
30my $utf8off = $utf8on; _utf8_off($utf8off);
7e19fb92
JH
31my $utf16 = encode('UTF-16', $utf8on);
32my $utf32 = encode('UTF-32', $utf8on);
af1f55d9 33
7e19fb92
JH
34is(guess_encoding($ascii)->name, 'ascii', 'ascii');
35like(guess_encoding($latin1), qr/No appropriate encoding/io, 'no ascii');
36is(guess_encoding($latin1, 'latin1')->name, 'iso-8859-1', 'iso-8859-1');
37is(guess_encoding($utf8on)->name, 'utf8', 'utf8 w/ flag');
38is(guess_encoding($utf8off)->name, 'utf8', 'utf8 w/o flag');
39is(guess_encoding($utf16)->name, 'UTF-16', 'UTF-16');
40is(guess_encoding($utf32)->name, 'UTF-32', 'UTF-32');
af1f55d9
JH
41
42my $jisx0201 = File::Spec->catfile(dirname(__FILE__), 'jisx0201.utf');
43my $jisx0208 = File::Spec->catfile(dirname(__FILE__), 'jisx0208.utf');
44my $jisx0212 = File::Spec->catfile(dirname(__FILE__), 'jisx0212.utf');
45
46open my $fh, $jisx0208 or die "$jisx0208: $!";
47$utf8off = join('' => <$fh>);
48close $fh;
49$utf8on = decode('utf8', $utf8off);
7e19fb92 50
af1f55d9
JH
51my @jp = qw(7bit-jis shiftjis euc-jp);
52
7e19fb92 53Encode::Guess->set_suspects(@jp);
af1f55d9
JH
54
55for my $jp (@jp){
56 my $test = encode($jp, $utf8on);
7e19fb92 57 is(guess_encoding($test)->name, $jp, "JP:$jp");
af1f55d9 58}
7e19fb92 59
af1f55d9
JH
60is (decode('Guess', encode('euc-jp', $utf8on)), $utf8on, "decode('Guess')");
61eval{ encode('Guess', $utf8on) };
10c5ecbb 62like($@, qr/not defined/io, "no encode()");
7e19fb92
JH
63
64my %CJKT =
65 (
66 'euc-cn' => File::Spec->catfile(dirname(__FILE__), 'gb2312.utf'),
67 'euc-jp' => File::Spec->catfile(dirname(__FILE__), 'jisx0208.utf'),
68 'euc-kr' => File::Spec->catfile(dirname(__FILE__), 'ksc5601.utf'),
69 'big5-eten' => File::Spec->catfile(dirname(__FILE__), 'big5-eten.utf'),
70);
71
72Encode::Guess->set_suspects(keys %CJKT);
73
74for my $name (keys %CJKT){
75 open my $fh, $CJKT{$name} or die "$CJKT{$name}: $!";
76 $utf8off = join('' => <$fh>);
77 close $fh;
78
79 my $test = encode($name, decode('utf8', $utf8off));
80 is(guess_encoding($test)->name, $name, "CJKT:$name");
81}
82
af1f55d9 83__END__;