forked from lifenjoiner/wget-for-windows
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathTest-iri-percent.px
executable file
·120 lines (101 loc) · 3.08 KB
/
Test-iri-percent.px
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
#!/usr/bin/env perl
use strict;
use warnings;
use WgetFeature qw(iri);
use HTTPTest;
use Encode::Locale;
use Encode::Locale qw($ENCODING_LOCALE $ENCODING_CONSOLE_IN $ENCODING_CONSOLE_OUT);
use Encode;
# Sanity check that %-encoded octets already present in a URL are left
# untouched by wget.
# URLs should always be percent-encoded from their UTF-8 form.

# Byte spellings of the two accented letters used by this test: a single
# byte (the *_l15 / *_l1 suffixes suggest ISO-8859-15 / ISO-8859-1), the
# two-byte UTF-8 sequence, and that UTF-8 sequence percent-encoded.
# NOTE(review): $ccedilla_l15 is not referenced anywhere else in the visible
# source.
my $ccedilla_l15 = "\xE7";
my $ccedilla_u8 = "\xC3\xA7";
my $ccedilla_u8_pct = "%C3%A7";
my $eacute_l1 = "\xE9";
my $eacute_u8 = "\xC3\xA9";
my $eacute_u8_pct = "%C3%A9";
# Body served for /index.html. Its single link mixes an already
# percent-encoded UTF-8 c-cedilla with a raw single-byte e-acute.
# "{{port}}" is written literally here; presumably the test harness
# substitutes the real port -- confirm in HTTPTest.
my $pageindex = <<EOF;
<html>
<head>
<title>Main Page</title>
</head>
<body>
<p>
Link to page 1 <a
href="http://localhost:{{port}}/hello_${ccedilla_u8_pct}${eacute_l1}.html">La seule page en français</a>.
</p>
</body>
</html>
EOF
# Body served for the linked page. Its <meta> tag declares ISO-8859-1,
# whereas the Content-type header configured for it in %urls says UTF-8.
my $pagefrancais = <<EOF;
<html>
<head>
<title>La seule page en français</title>
<meta http-equiv="Content-Type" content="text/html; charset=ISO-8859-1"/>
</head>
<body>
<p>
</p>
</body>
</html>
EOF
# Pages handed to HTTPTest as `input`, keyed by request path.
# Each entry holds: code, msg, headers, content.
my %urls = (
# The index is announced as ISO-8859-15, which is the charset the raw
# e-acute byte in its href has to be interpreted in.
'/index.html' => {
code => "200",
msg => "Ok",
headers => {
"Content-type" => "text/html; charset=ISO-8859-15",
},
content => $pageindex,
},
# The only other path configured is the fully percent-encoded UTF-8
# spelling of the link: the c-cedilla exactly as written in the href and
# the e-acute in its UTF-8 percent-encoded form.
"/hello_${ccedilla_u8_pct}${eacute_u8_pct}.html" => {
code => "200",
msg => "Ok",
headers => {
"Content-type" => "text/html; charset=UTF-8",
},
content => $pagefrancais,
},
);
# wget invocation: IRI support on (--iri), robots.txt ignored
# (-e robots=off), control characters in file names not escaped
# (--restrict-file-names=nocontrol), no host-name directory (-nH),
# recursive retrieval (-r) starting from the server root.
my $cmdline = $WgetTest::WGETPATH . " --iri -e robots=off --restrict-file-names=nocontrol -nH -r http://localhost:{{port}}/";
# Passed to HTTPTest as `errcode`.
my $expected_error_code = 0;
# Encoding used to decide which file name to expect on disk. It starts out
# as Encode::Locale's view of the locale encoding and is overridden below on
# msys/cygwin.
my $native_encoding = $ENCODING_LOCALE;

# The expected file name has to match the name wget actually writes, which
# may have been transcoded to the OS encoding.
# NOTE(review): per the original author's note, Encode::Locale::reinit()
# would align the locale encoding with the system locale, but it could then
# differ from the console in/out encodings -- hence the diagnostics below.
print "LC_CTYPE: " . ($ENV{'LC_CTYPE'} || "") . "\n"; # ~> wget findlocale()
print "ENCODING_LOCALE: " . $ENCODING_LOCALE . "\n";
print "ENCODING_CONSOLE_IN: " . $ENCODING_CONSOLE_IN . "\n";
print "ENCODING_CONSOLE_OUT: " . $ENCODING_CONSOLE_OUT . "\n";

if ($^O eq "msys" || $^O eq "cygwin") {
    # `use Win32;` is executed at compile time, i.e. on every platform no
    # matter what this condition says, and would abort the script wherever
    # Win32.pm is not installed. `require` loads the module at run time,
    # only when this branch is actually taken. Win32::GetACP() is called
    # fully qualified, so nothing needs to be imported.
    require Win32;
    $native_encoding = "CP" . Win32::GetACP();
    print "native encoding: " . $native_encoding . "\n";
}
# Report whether a byte string survives a round trip through another
# encoding.
#
#   $from - name of the encoding $str is currently in
#   $str  - the byte string to check
#   $to   - name of the encoding to convert to and back from
#
# Returns true when converting $str from $from to $to and back again
# yields exactly the original bytes, false otherwise.
sub can_transcode_to_locale
{
    my ($from, $str, $to) = @_;

    # Outbound leg: $from bytes -> characters -> $to bytes.
    my $chars_out    = Encode::decode($from, $str);
    my $target_bytes = Encode::encode($to, $chars_out);

    # Return leg: $to bytes -> characters -> $from bytes.
    my $chars_back = Encode::decode($to, $target_bytes);
    my $round_trip = Encode::encode($from, $chars_back);

    return $round_trip eq $str;
}
# Stem of the file name expected for the French page: the raw UTF-8 bytes
# when they survive a round trip through the native encoding, otherwise the
# percent-encoded spelling.
my $utf8_stem = $ccedilla_u8 . $eacute_u8;
my $str_out   = can_transcode_to_locale("UTF-8", $utf8_stem, $native_encoding)
    ? $utf8_stem
    : $ccedilla_u8_pct . $eacute_u8_pct;

# Expected downloads, keyed by file name; handed to HTTPTest as `output`.
my %expected_downloaded_files = (
    'index.html'            => { content => $pageindex },
    "hello_${str_out}.html" => { content => $pagefrancais },
);

###############################################################################

# Assemble the test from the server pages, the wget command line, the
# expected exit status and the expected files.
my $the_test = HTTPTest->new(
    input   => \%urls,
    cmdline => $cmdline,
    errcode => $expected_error_code,
    output  => \%expected_downloaded_files,
);

# The script's exit status is whatever run() returns.
exit $the_test->run();

# vim: et ts=4 sw=4