ClamAV is an open source (GPLv2) anti-virus toolkit.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 
clamav/unit_tests/check_htmlnorm.c

203 lines
6.4 KiB

/*
* Unit tests for HTML normalizer;
*
* Copyright (C) 2013-2022 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
* Copyright (C) 2008-2013 Sourcefire, Inc.
*
* Authors: Török Edvin
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License version 2 as
* published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
* MA 02110-1301, USA.
*/
#if HAVE_CONFIG_H
#include "clamav-config.h"
#endif
#include <stdio.h>
#include <check.h>
#include <fcntl.h>
#include <string.h>
// libclamav
#include "clamav.h"
#include "fmap.h"
#include "dconf.h"
#include "htmlnorm.h"
#include "others.h"
#include "fmap.h"
#include "checks.h"
static char *dir;
static void htmlnorm_setup(void)
{
cl_init(CL_INIT_DEFAULT);
dconf_setup();
dir = cli_gentemp(NULL);
ck_assert_msg(!!dir, "cli_gentemp failed");
}
static void htmlnorm_teardown(void)
{
dconf_teardown();
/* can't call fail() functions in teardown, it can cause SEGV */
cli_rmdirs(dir);
free(dir);
dir = NULL;
}
static struct test {
const char *input;
const char *nocommentref;
const char *notagsref;
const char *jsref;
} tests[] = {
/* NULL means don't test it */
{"input" PATHSEP "htmlnorm_scanfiles" PATHSEP "htmlnorm_buf.html",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "buf.nocomment.ref",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "buf.notags.ref",
NULL},
{"input" PATHSEP "htmlnorm_scanfiles" PATHSEP "htmlnorm_encode.html",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "encode.nocomment.ref",
NULL,
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "encode.js.ref"},
{"input" PATHSEP "htmlnorm_scanfiles" PATHSEP "htmlnorm_js_test.html",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "js.nocomment.ref",
NULL,
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "js.js.ref"},
{"input" PATHSEP "htmlnorm_scanfiles" PATHSEP "htmlnorm_test.html",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "test.nocomment.ref",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "test.notags.ref",
NULL},
{"input" PATHSEP "htmlnorm_scanfiles" PATHSEP "htmlnorm_urls.html",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "urls.nocomment.ref",
"input" PATHSEP "htmlnorm_reffiles" PATHSEP "urls.notags.ref",
NULL}};
static void check_dir(const char *dire, const struct test *test)
{
char filename[4096];
int fd, reffd;
if (test->nocommentref) {
snprintf(filename, sizeof(filename), "%s" PATHSEP "nocomment.html", dire);
fd = open(filename, O_RDONLY | O_BINARY);
ck_assert_msg(fd > 0, "unable to open: %s", filename);
reffd = open_testfile(test->nocommentref, O_RDONLY | O_BINARY);
diff_files(fd, reffd);
/* diff_files will close both fd's */
}
if (test->notagsref) {
snprintf(filename, sizeof(filename), "%s" PATHSEP "notags.html", dire);
fd = open(filename, O_RDONLY | O_BINARY);
ck_assert_msg(fd > 0, "unable to open: %s", filename);
reffd = open_testfile(test->notagsref, O_RDONLY | O_BINARY);
diff_files(fd, reffd);
/* diff_files will close both fd's */
}
if (test->jsref) {
snprintf(filename, sizeof(filename), "%s" PATHSEP "javascript", dire);
fd = open(filename, O_RDONLY | O_BINARY);
ck_assert_msg(fd > 0, "unable to open: %s", filename);
reffd = open_testfile(test->jsref, O_RDONLY | O_BINARY);
diff_files(fd, reffd);
/* diff_files will close both fd's */
}
}
START_TEST(test_htmlnorm_api)
{
int fd;
tag_arguments_t hrefs;
fmap_t *map;
memset(&hrefs, 0, sizeof(hrefs));
fd = open_testfile(tests[_i].input, O_RDONLY | O_BINARY);
ck_assert_msg(fd > 0, "open_testfile failed");
map = fmap(fd, 0, 0, tests[_i].input);
ck_assert_msg(!!map, "fmap failed");
ck_assert_msg(mkdir(dir, 0700) == 0, "mkdir failed: %s", dir);
ck_assert_msg(html_normalise_map(map, dir, NULL, dconf) == 1, "html_normalise_map failed");
check_dir(dir, &tests[_i]);
ck_assert_msg(cli_rmdirs(dir) == 0, "rmdirs failed: %s", dir);
ck_assert_msg(mkdir(dir, 0700) == 0, "mkdir failed: %s", dir);
ck_assert_msg(html_normalise_map(map, dir, NULL, NULL) == 1, "html_normalise_map failed");
ck_assert_msg(cli_rmdirs(dir) == 0, "rmdirs failed: %s", dir);
ck_assert_msg(mkdir(dir, 0700) == 0, "mkdir failed: %s", dir);
ck_assert_msg(html_normalise_map(map, dir, &hrefs, dconf) == 1, "html_normalise_map failed");
ck_assert_msg(cli_rmdirs(dir) == 0, "rmdirs failed: %s", dir);
html_tag_arg_free(&hrefs);
memset(&hrefs, 0, sizeof(hrefs));
hrefs.scanContents = 1;
ck_assert_msg(mkdir(dir, 0700) == 0, "mkdir failed: %s", dir);
ck_assert_msg(html_normalise_map(map, dir, &hrefs, dconf) == 1, "html_normalise_map failed");
ck_assert_msg(cli_rmdirs(dir) == 0, "rmdirs failed: %s", dir);
html_tag_arg_free(&hrefs);
funmap(map);
close(fd);
}
END_TEST
START_TEST(test_screnc_nullterminate)
{
int fd = open_testfile("input" PATHSEP "other_scanfiles" PATHSEP "screnc_test", O_RDONLY | O_BINARY);
fmap_t *map;
ck_assert_msg(mkdir(dir, 0700) == 0, "mkdir failed");
map = fmap(fd, 0, 0, "screnc_test");
ck_assert_msg(!!map, "fmap failed");
ck_assert_msg(html_screnc_decode(map, dir) == 1, "html_screnc_decode failed");
funmap(map);
ck_assert_msg(cli_rmdirs(dir) == 0, "rmdirs failed");
close(fd);
}
END_TEST
Suite *test_htmlnorm_suite(void)
{
Suite *s = suite_create("htmlnorm");
TCase *tc_htmlnorm_api;
tc_htmlnorm_api = tcase_create("htmlnorm api");
suite_add_tcase(s, tc_htmlnorm_api);
tcase_add_loop_test(tc_htmlnorm_api, test_htmlnorm_api, 0, sizeof(tests) / sizeof(tests[0]));
tcase_add_unchecked_fixture(tc_htmlnorm_api,
htmlnorm_setup, htmlnorm_teardown);
tcase_add_test(tc_htmlnorm_api, test_screnc_nullterminate);
return s;
}