wget/tests/Test-restrict-ascii.px

#!/usr/bin/env -S perl -I .

use strict;
use warnings;

use HTTPTest;

# This program tests that --restrict-file-names=ascii can be used to
# ensure that all high-valued bytes are escaped. The sample filename was
# chosen because in former versions of Wget, one could either choose not
# to escape any portion of the UTF-8 filename via
# --restrict-file-names=nocontrol (which would only be helpful if one
# was _on_ a UTF-8 system), or else Wget would escape _portions_ of
# characters, leaving irrelevant "latin1"-looking characters combined
# with percent-encoded "control" characters, instead of encoding all the
# bytes of an entire non-ASCII UTF-8 character.

###############################################################################

# "gnosis" in UTF-8 greek.
my $gnosis = '%CE%B3%CE%BD%CF%89%CF%83%CE%B9%CF%82';

my $mainpage = <<EOF;
<html>
<head>
  <title>Some Page Title</title>
</head>
<body>
  <p>
    Some text...
  </p>
</body>
</html>
EOF

# code, msg, headers, content
my %urls = (
    "/$gnosis.html" => {
        code => "200",
        msg => "Dontcare",
        headers => {
            "Content-type" => "text/html",
        },
        content => $mainpage,
    },
);

my $cmdline = $WgetTest::WGETPATH . " --restrict-file-names=ascii "
    . "http://localhost:{{port}}/${gnosis}.html";

my $expected_error_code = 0;

my %expected_downloaded_files = (
    "${gnosis}.html" => {
        content => $mainpage,
    },
);

###############################################################################

my $the_test = HTTPTest->new (input => \%urls,
                              cmdline => $cmdline,
                              errcode => $expected_error_code,
                              output => \%expected_downloaded_files);
exit $the_test->run();

# vim: et ts=4 sw=4
Import Upstream version 1.20.3 2022-05-14 03:18:11 +08:00			`#!/usr/bin/env -S perl -I .`

			`use strict;`
			`use warnings;`

			`use HTTPTest;`

			`# This program tests that --restrict-file-names=ascii can be used to`
			`# ensure that all high-valued bytes are escaped. The sample filename was`
			`# chosen because in former versions of Wget, one could either choose not`
			`# to escape any portion of the UTF-8 filename via`
			`# --restrict-file-names=nocontrol (which would only be helpful if one`
			`# was _on_ a UTF-8 system), or else Wget would escape _portions_ of`
			`# characters, leaving irrelevant "latin1"-looking characters combined`
			`# with percent-encoded "control" characters, instead of encoding all the`
			`# bytes of an entire non-ASCII UTF-8 character.`

			`###############################################################################`

			`# "gnosis" in UTF-8 greek.`
			`my $gnosis = '%CE%B3%CE%BD%CF%89%CF%83%CE%B9%CF%82';`

			`my $mainpage = <<EOF;`
			`<html>`
			`<head>`
			`<title>Some Page Title</title>`
			`</head>`
			`<body>`
			`<p>`
			`Some text...`
			`</p>`
			`</body>`
			`</html>`
			`EOF`

			`# code, msg, headers, content`
			`my %urls = (`
			`"/$gnosis.html" => {`
			`code => "200",`
			`msg => "Dontcare",`
			`headers => {`
			`"Content-type" => "text/html",`
			`},`
			`content => $mainpage,`
			`},`
			`);`

			`my $cmdline = $WgetTest::WGETPATH . " --restrict-file-names=ascii "`
			`. "http://localhost:{{port}}/${gnosis}.html";`

			`my $expected_error_code = 0;`

			`my %expected_downloaded_files = (`
			`"${gnosis}.html" => {`
			`content => $mainpage,`
			`},`
			`);`

			`###############################################################################`

			`my $the_test = HTTPTest->new (input => \%urls,`
			`cmdline => $cmdline,`
			`errcode => $expected_error_code,`
			`output => \%expected_downloaded_files);`
			`exit $the_test->run();`

			`# vim: et ts=4 sw=4`