Files
wget2/tests/test-accept.c
2022-02-25 17:46:43 +01:00

408 lines
13 KiB
C

/*
* Copyright (c) 2013 Tim Ruehsen
* Copyright (c) 2015-2022 Free Software Foundation, Inc.
*
* This file is part of Wget
*
* Wget is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Wget is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Wget If not, see <https://www.gnu.org/licenses/>.
*
*
* Testing Wget
*
* Changelog
* 08.07.2013 Tim Ruehsen created
* 02.07.2014 Tim Ruehsen added uppercase combinations of <a href...> (issue #21)
*
*/
#include <config.h>
#include <stdlib.h> // exit()
#include "libtest.h"
int main(void)
{
wget_test_url_t urls[]={
{ .name = "/index.html",
.code = "200 Dontcare",
.body =
"<html><head><title>Main Page</title></head><body><p>A link to a" \
" <A hreF=\"http://localhost:{{port}}/secondpage.html\">second page</a>." \
" <a href=\"picture_a.jpeg\">Picture a</a>." \
" <a href=\"picture_aa.jpeg\">Picture aa</a>." \
"</p></body></html>",
.headers = {
"Content-Type: text/html",
}
},
{ .name = "/secondpage.html",
.code = "200 Dontcare",
.body =
"<html><head><title>Second Page</title></head><body><p>A link to a" \
" <a href=\"picture_b.jpeg\">Picture b</a>." \
" <a href=\"picture_bb.JpeG\">Picture bb</a>." \
" <a href=\"picture_c.png\">Picture c</a>." \
"</p></body></html>",
.headers = {
"Content-Type: text/html",
}
},
{ .name = "/picture_a.jpeg",
.code = "200 Dontcare",
.body = "don't care",
.headers = { "Content-Type: image/jpeg" }
},
{ .name = "/picture_aa.jpeg",
.code = "200 Dontcare",
.body = "don't care",
.headers = { "Content-Type: image/jpeg" }
},
{ .name = "/picture_b.jpeg",
.code = "200 Dontcare",
.body = "don't care",
.headers = { "Content-Type: image/jpeg" }
},
{ .name = "/picture_bb.JpeG",
.code = "200 Dontcare",
.body = "don't care",
.headers = { "Content-Type: image/jpeg" }
},
{ .name = "/picture_c.png",
.code = "200 Dontcare",
.body = "don't care",
.headers = { "Content-Type: image/png" }
},
};
// functions won't come back if an error occurs
wget_test_start_server(
WGET_TEST_RESPONSE_URLS, &urls, countof(urls),
WGET_TEST_FEATURE_MHD,
0);
// --accept using just suffixes
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ NULL } },
0);
// --reject using just suffixes
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[5].name + 1, urls[5].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept using just suffixes and ignore case
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" --ignore-case",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ NULL } },
0);
// --reject using just suffixes and ignore case
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" --ignore-case",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \"*.jpeg\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ NULL } },
0);
// --reject using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \"*.jpeg\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[5].name + 1, urls[5].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept using wildcards and ignore case
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \"*.jpeg\" --ignore-case",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ NULL } },
0);
// --reject using wildcards and ignore case
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \"*.jpeg\" --ignore-case",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --reject using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ NULL } },
0);
// --accept using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture_[ab]*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ NULL } },
0);
// --reject using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture_[ab]*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \"*picture_a*\" --accept \"*picture_c*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --reject using wildcards
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \"*picture_a*\" --reject \"*picture_c*\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ NULL } },
0);
// --accept-regex (posix)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)(\\/)?picture_[ab]+\\.jpeg$\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ NULL } },
0);
// --reject-regex (posix)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject-regex \"^(.*)picture_[a]+\\.jpeg$\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept-regex and --reject-regex (posix)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)picture_(.*)$\" --reject-regex \"\\.(jpeg|JpeG)+\"",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
#if defined WITH_LIBPCRE2 || defined WITH_LIBPCRE
// --accept-regex (pcre)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)(\\/)?picture_[ab]+\\.jpeg$\" --regex-type pcre",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body },
{ urls[3].name + 1, urls[3].body },
{ urls[4].name + 1, urls[4].body },
{ NULL } },
0);
// --reject-regex (pcre)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject-regex \"^(.*)picture_[a]+\\.jpeg$\" --regex-type pcre",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body },
{ urls[1].name + 1, urls[1].body },
{ urls[4].name + 1, urls[4].body },
{ urls[5].name + 1, urls[5].body },
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
// --accept-regex and --reject-regex (pcre)
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept-regex \"^(.*)picture_(.*)$\" --reject-regex \"(?i)\\.jpeg\" --regex-type pcre",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[6].name + 1, urls[6].body },
{ NULL } },
0);
#endif
// tests with -N --no-if-modified-since
int n_urls = countof(urls);
for (int i = 0; i < n_urls; i++) {
urls[i].headers[1] = "Last-Modified: Sat, 09 Oct 2004 08:30:00 GMT";
}
// --accept using just suffixes
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" -N --no-if-modified-since",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body, 1097310600 },
{ urls[3].name + 1, urls[3].body, 1097310600 },
{ urls[4].name + 1, urls[4].body, 1097310600 },
{ NULL } },
0);
wget_test(
WGET_TEST_OPTIONS, "-r -nH --accept \".jpeg\" -N --no-if-modified-since",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXISTING_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, "anycontent.", 1097310600 },
{ urls[3].name + 1, "anycontent", 1097310600 },
{ urls[4].name + 1, urls[4].body, 1097310000 },
{ NULL } },
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[2].name + 1, urls[2].body, 1097310600 },
{ urls[3].name + 1, "anycontent", 1097310600 },
{ urls[4].name + 1, urls[4].body, 1097310600 },
{ NULL } },
0);
// --reject using just suffixes
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" -N --no-if-modified-since",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body, 1097310600 },
{ urls[1].name + 1, urls[1].body, 1097310600 },
{ urls[5].name + 1, urls[5].body, 1097310600 },
{ urls[6].name + 1, urls[6].body, 1097310600 },
{ NULL } },
0);
wget_test(
WGET_TEST_OPTIONS, "-r -nH --reject \".jpeg\" -N --no-if-modified-since",
WGET_TEST_REQUEST_URL, "index.html",
WGET_TEST_EXPECTED_ERROR_CODE, 0,
WGET_TEST_EXISTING_FILES, &(wget_test_file_t []) {
{ urls[5].name + 1, urls[5].body, 1097310000 },
{ urls[6].name + 1, "anycontent", 1097310600 },
{ NULL } },
WGET_TEST_EXPECTED_FILES, &(wget_test_file_t []) {
{ urls[0].name + 1, urls[0].body, 1097310600 },
{ urls[1].name + 1, urls[1].body, 1097310600 },
{ urls[5].name + 1, urls[5].body, 1097310600 },
{ urls[6].name + 1, "anycontent", 1097310600 },
{ NULL } },
0);
exit(EXIT_SUCCESS);
}