wget/tests/Test-restrict-ascii.px

68 lines
1.8 KiB
Plaintext
Raw Normal View History

2022-05-14 03:18:11 +08:00
#!/usr/bin/env -S perl -I .
use strict;
use warnings;
use HTTPTest;
# This program tests that --restrict-file-names=ascii can be used to
# ensure that all high-valued bytes are escaped. The sample filename was
# chosen because in former versions of Wget, one could either choose not
# to escape any portion of the UTF-8 filename via
# --restrict-file-names=nocontrol (which would only be helpful if one
# was _on_ a UTF-8 system), or else Wget would escape _portions_ of
# characters, leaving irrelevant "latin1"-looking characters combined
# with percent-encoded "control" characters, instead of encoding all the
# bytes of an entire non-ASCII UTF-8 character.
###############################################################################
# "gnosis" in UTF-8 greek.
my $gnosis = '%CE%B3%CE%BD%CF%89%CF%83%CE%B9%CF%82';
my $mainpage = <<EOF;
<html>
<head>
<title>Some Page Title</title>
</head>
<body>
<p>
Some text...
</p>
</body>
</html>
EOF
# code, msg, headers, content
my %urls = (
"/$gnosis.html" => {
code => "200",
msg => "Dontcare",
headers => {
"Content-type" => "text/html",
},
content => $mainpage,
},
);
my $cmdline = $WgetTest::WGETPATH . " --restrict-file-names=ascii "
. "http://localhost:{{port}}/${gnosis}.html";
my $expected_error_code = 0;
my %expected_downloaded_files = (
"${gnosis}.html" => {
content => $mainpage,
},
);
###############################################################################
my $the_test = HTTPTest->new (input => \%urls,
cmdline => $cmdline,
errcode => $expected_error_code,
output => \%expected_downloaded_files);
exit $the_test->run();
# vim: et ts=4 sw=4