mirror of
https://gitlab.com/gnuwget/wget2.git
synced 2026-01-14 02:01:39 +00:00
408 lines
13 KiB
C
408 lines
13 KiB
C
/*
|
|
* Copyright (c) 2013 Tim Ruehsen
|
|
* Copyright (c) 2015-2022 Free Software Foundation, Inc.
|
|
*
|
|
* This file is part of Wget
|
|
*
|
|
* Wget is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* Wget is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with Wget If not, see <https://www.gnu.org/licenses/>.
|
|
*
|
|
*
|
|
* Testing Wget
|
|
*
|
|
* Changelog
|
|
* 08.07.2013 Tim Ruehsen created
|
|
* 02.07.2014 Tim Ruehsen added uppercase combinations of <a href...> (issue #21)
|
|
*
|
|
*/
|
|
|
|
#include <config.h>
|
|
|
|
#include <stdlib.h> // exit()
|
|
#include "libtest.h"
|
|
|
|
int main(void)
|
|
{
|
|
wget_test_url_t urls[]={
|
|
{ .name = "/index.html",
|
|
.code = "200 Dontcare",
|
|
.body =
|
|
"<html><head><title>Main Page</title></head><body><p>A link to a" \
|
|
" <A hreF=\"http://localhost:{{port}}/secondpage.html\">second page</a>." \
|
|
" <a href=\"picture_a.jpeg\">Picture a</a>." \
|
|
" <a href=\"picture_aa.jpeg\">Picture aa</a>." \
|
|
"</p></body></html>",
|
|
.headers = {
|
|
"Content-Type: text/html",
|
|
}
|
|
},
|
|
{ .name = "/secondpage.html",
|
|
.code = "200 Dontcare",
|
|
.body =
|
|
"<html><head><title>Second Page</title></head><body><p>A link to a" \
|
|
" <a href=\"picture_b.jpeg\">Picture b</a>." \
|
|
" <a href=\"picture_bb.JpeG\">Picture bb</a>." \
|
|
" <a href=\"picture_c.png\">Picture c</a>." \
|
|
"</p></body></html>",
|
|
.headers = {
|
|
"Content-Type: text/html",
|
|
}
|
|
},
|
|
{ .name = "/picture_a.jpeg",
|
|
.code = "200 Dontcare",
|
|
.body = "don't care",
|
|
.headers = { "Content-Type: image/jpeg" }
|
|
},
|
|
{ .name = "/picture_aa.jpeg",
|
|
.code = "200 Dontcare",
|
|
.body = "don't care",
|
|
.headers = { "Content-Type: image/jpeg" }
|
|
},
|
|
{ .name = "/picture_b.jpeg",
|
|
.code = "200 Dontcare",
|
|
.body = "don't care",
|
|
.headers = { "Content-Type: image/jpeg" }
|
|
},
|
|
{ .name = "/picture_bb.JpeG",
|
|
.code = "200 Dontcare",
|
|
.body = "don't care",
|
|
.headers = { "Content-Type: image/jpeg" }
|
|
},
|
|
{ .name = "/picture_c.png",
|
|
.code = "200 Dontcare",
|
|
.body = "don't care",
|
|
.headers = { "Content-Type: image/png" }
|
|
},
|
|
};
|
|
|
|
// functions won't come back if an error occurs
|
|
wget_test_start_server(
|
|
WGET_TEST_RESPONSE_URLS, &urls, countof(urls),
|
|
WGET_TEST_FEATURE_MHD,
|
|
0);
|
|
|
|
// --accept using just suffixes
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using just suffixes
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using just suffixes and ignore case
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" --ignore-case",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using just suffixes and ignore case
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" --ignore-case",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \"*.jpeg\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \"*.jpeg\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using wildcards and ignore case
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \"*.jpeg\" --ignore-case",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using wildcards and ignore case
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \"*.jpeg\" --ignore-case",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture_[ab]*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture_[ab]*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture_a*\" --accept \"*picture_c*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using wildcards
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture_a*\" --reject \"*picture_c*\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept-regex (posix)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)(\\/)?picture_[ab]+\\.jpeg$\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject-regex (posix)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject-regex \"^(.*)picture_[a]+\\.jpeg$\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept-regex and --reject-regex (posix)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)picture_(.*)$\" --reject-regex \"\\.(jpeg|JpeG)+\"",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
|
|
#if defined WITH_LIBPCRE2 || defined WITH_LIBPCRE
|
|
// --accept-regex (pcre)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)(\\/)?picture_[ab]+\\.jpeg$\" --regex-type pcre",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body },
|
|
{ urls[3].name + 1, urls[3].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject-regex (pcre)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject-regex \"^(.*)picture_[a]+\\.jpeg$\" --regex-type pcre",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body },
|
|
{ urls[1].name + 1, urls[1].body },
|
|
{ urls[4].name + 1, urls[4].body },
|
|
{ urls[5].name + 1, urls[5].body },
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --accept-regex and --reject-regex (pcre)
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)picture_(.*)$\" --reject-regex \"(?i)\\.jpeg\" --regex-type pcre",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[6].name + 1, urls[6].body },
|
|
{ NULL } },
|
|
0);
|
|
#endif
|
|
|
|
// tests with -N --no-if-modified-since
|
|
int n_urls = countof(urls);
|
|
for (int i = 0; i < n_urls; i++) {
|
|
urls[i].headers[1] = "Last-Modified: Sat, 09 Oct 2004 08:30:00 GMT";
|
|
}
|
|
// --accept using just suffixes
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" -N --no-if-modified-since",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body, 1097310600 },
|
|
{ urls[3].name + 1, urls[3].body, 1097310600 },
|
|
{ urls[4].name + 1, urls[4].body, 1097310600 },
|
|
{ NULL } },
|
|
0);
|
|
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" -N --no-if-modified-since",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXISTING_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, "anycontent.", 1097310600 },
|
|
{ urls[3].name + 1, "anycontent", 1097310600 },
|
|
{ urls[4].name + 1, urls[4].body, 1097310000 },
|
|
{ NULL } },
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[2].name + 1, urls[2].body, 1097310600 },
|
|
{ urls[3].name + 1, "anycontent", 1097310600 },
|
|
{ urls[4].name + 1, urls[4].body, 1097310600 },
|
|
{ NULL } },
|
|
0);
|
|
|
|
// --reject using just suffixes
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" -N --no-if-modified-since",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body, 1097310600 },
|
|
{ urls[1].name + 1, urls[1].body, 1097310600 },
|
|
{ urls[5].name + 1, urls[5].body, 1097310600 },
|
|
{ urls[6].name + 1, urls[6].body, 1097310600 },
|
|
{ NULL } },
|
|
0);
|
|
|
|
wget_test(
|
|
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" -N --no-if-modified-since",
|
|
WGET_TEST_REQUEST_URL, "index.html",
|
|
WGET_TEST_EXPECTED_ERROR_CODE, 0,
|
|
WGET_TEST_EXISTING_FILES, &(wget_test_file_t []) {
|
|
{ urls[5].name + 1, urls[5].body, 1097310000 },
|
|
{ urls[6].name + 1, "anycontent", 1097310600 },
|
|
{ NULL } },
|
|
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
|
|
{ urls[0].name + 1, urls[0].body, 1097310600 },
|
|
{ urls[1].name + 1, urls[1].body, 1097310600 },
|
|
{ urls[5].name + 1, urls[5].body, 1097310600 },
|
|
{ urls[6].name + 1, "anycontent", 1097310600 },
|
|
{ NULL } },
|
|
0);
|
|
|
|
exit(EXIT_SUCCESS);
|
|
}
|