2010-06-04 05:12:19 -04:00
|
|
|
#!/usr/bin/env perl
|
2008-12-04 17:25:12 -05:00
|
|
|
|
|
|
|
use strict;
|
|
|
|
use warnings;
|
|
|
|
|
2009-09-05 16:54:05 -04:00
|
|
|
use WgetFeature qw(iri);
|
2008-12-04 17:25:12 -05:00
|
|
|
use HTTPTest;
|
|
|
|
|
|
|
|
# " Kon'nichiwa <dot> Japan
|
|
|
|
my $euc_jp_hostname = "\272\243\306\374\244\317.\306\374\313\334";
|
|
|
|
my $punycoded_hostname = 'xn--v9ju72g90p.xn--wgv71a';
|
2013-10-07 17:37:42 -04:00
|
|
|
my $escaped_hostname = "%ba%a3%c6%fc%a4%cf.%c6%fc%cb%dc";
|
2008-12-04 17:25:12 -05:00
|
|
|
|
|
|
|
###############################################################################
|
|
|
|
|
|
|
|
my $starter_file = <<EOF;
|
|
|
|
<a href="http://$euc_jp_hostname/foo.txt">The link</a>
|
2013-10-07 17:37:42 -04:00
|
|
|
<a href="http://$punycoded_hostname/foo2.txt">The second link</a>
|
|
|
|
<a href="http://$escaped_hostname/foo3.txt">The third link</a>
|
2008-12-04 17:25:12 -05:00
|
|
|
EOF
|
|
|
|
|
|
|
|
my $result_file = <<EOF;
|
|
|
|
Found me!
|
|
|
|
EOF
|
|
|
|
|
|
|
|
# code, msg, headers, content
|
|
|
|
my %urls = (
|
|
|
|
"http://$punycoded_hostname/index.html" => {
|
|
|
|
code => "200",
|
|
|
|
msg => "Yes, please",
|
|
|
|
headers => {
|
|
|
|
'Content-Type' => 'text/html; charset=EUC-JP',
|
|
|
|
},
|
|
|
|
content => $starter_file,
|
|
|
|
},
|
|
|
|
"http://$punycoded_hostname/foo.txt" => {
|
|
|
|
code => "200",
|
|
|
|
msg => "Uh-huh",
|
|
|
|
headers => {
|
|
|
|
'Content-Type' => 'text/plain',
|
|
|
|
},
|
|
|
|
content => $result_file,
|
|
|
|
},
|
2013-10-07 17:37:42 -04:00
|
|
|
"http://$punycoded_hostname/foo2.txt" => {
|
|
|
|
code => "200",
|
|
|
|
msg => "Uh-huh2",
|
|
|
|
headers => {
|
|
|
|
'Content-Type' => 'text/plain',
|
|
|
|
},
|
|
|
|
content => $result_file,
|
|
|
|
},
|
|
|
|
"http://$punycoded_hostname/foo3.txt" => {
|
|
|
|
code => "200",
|
|
|
|
msg => "Uh-huh3",
|
|
|
|
headers => {
|
|
|
|
'Content-Type' => 'text/plain',
|
|
|
|
},
|
|
|
|
content => $result_file,
|
|
|
|
},
|
2008-12-04 17:25:12 -05:00
|
|
|
"http://$punycoded_hostname/robots.txt" => {
|
|
|
|
code => "200",
|
|
|
|
msg => "Uh-huh",
|
|
|
|
headers => {
|
|
|
|
'Content-Type' => 'text/plain',
|
|
|
|
},
|
|
|
|
content => '',
|
|
|
|
},
|
|
|
|
);
|
|
|
|
|
2013-10-07 17:37:42 -04:00
|
|
|
my $cmdline = $WgetTest::WGETPATH . " --iri -r"
|
2009-07-27 00:50:19 -04:00
|
|
|
. " -e http_proxy=localhost:{{port}} --local-encoding=EUC-JP"
|
2008-12-04 17:25:12 -05:00
|
|
|
. " http://$euc_jp_hostname/";
|
|
|
|
|
|
|
|
my $expected_error_code = 0;
|
|
|
|
|
|
|
|
my %expected_downloaded_files = (
|
|
|
|
"$punycoded_hostname/index.html" => {
|
|
|
|
content => $starter_file,
|
|
|
|
},
|
|
|
|
"$punycoded_hostname/foo.txt" => {
|
|
|
|
content => $result_file,
|
|
|
|
},
|
2013-10-07 17:37:42 -04:00
|
|
|
"$punycoded_hostname/foo2.txt" => {
|
|
|
|
content => $result_file,
|
|
|
|
},
|
|
|
|
"$punycoded_hostname/foo3.txt" => {
|
|
|
|
content => $result_file,
|
|
|
|
},
|
2008-12-04 17:25:12 -05:00
|
|
|
"$punycoded_hostname/robots.txt" => {
|
|
|
|
content => '',
|
|
|
|
},
|
|
|
|
);
|
|
|
|
|
|
|
|
###############################################################################
|
|
|
|
|
|
|
|
my $the_test = HTTPTest->new (name => "Test-idn-robots",
|
2009-09-21 23:39:44 -04:00
|
|
|
input => \%urls,
|
|
|
|
cmdline => $cmdline,
|
|
|
|
errcode => $expected_error_code,
|
2008-12-04 17:25:12 -05:00
|
|
|
output => \%expected_downloaded_files);
|
|
|
|
exit $the_test->run();
|
|
|
|
|
|
|
|
# vim: et ts=4 sw=4
|