ClamAV is an open source (GPLv2) anti-virus toolkit.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
 
 
 
 
 
 
clamav/clamav-devel/libclamav/matcher.c

583 lines
13 KiB

/*
* Copyright (C) 2002 - 2005 Tomasz Kojm <tkojm@clamav.net>
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*/
#if HAVE_CONFIG_H
#include "clamav-config.h"
#endif
#include <string.h>
#include <ctype.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <unistd.h>
#include "clamav.h"
#include "others.h"
#include "matcher-ac.h"
#include "matcher-bm.h"
#include "md5.h"
#include "filetypes.h"
#include "matcher.h"
#include "pe.h"
#include "elf.h"
#include "execs.h"
#include "special.h"
/* NOTE(review): MD5_BLOCKSIZE is not referenced by any code visible in this file. */
#define MD5_BLOCKSIZE 4096

/*
 * Larger of two values. Every argument use and the whole expansion are
 * parenthesized so that operands containing lower-precedence operators
 * (e.g. `x & y` or `c ? a : b`) expand correctly. Each argument may still be
 * evaluated twice, so do not pass expressions with side effects.
 */
#define MAX(a,b) (((a) > (b)) ? (a) : (b))
/*
 * File types that can have a dedicated signature set. cli_scanbuff() and
 * cli_scandesc() search this table for the file type being scanned and use
 * the index of the match to select engine->root[index]. A match at index 0
 * never selects a dedicated set; engine->root[0] holds the generic signatures.
 */
static int targettab[CL_TARGET_TABLE_SIZE] = { 0, CL_TYPE_MSEXE, CL_TYPE_MSOLE2, CL_TYPE_HTML, CL_TYPE_MAIL, CL_TYPE_GRAPHICS, CL_TYPE_ELF };
/* Debug flag defined outside this file; tested in cli_scandesc(). */
extern short cli_debug_flag;
#ifdef CL_THREAD_SAFE
# include <pthread.h>
/* Serializes updates of engine->refcount in cl_dup() and cl_free(). */
static pthread_mutex_t cli_ref_mutex = PTHREAD_MUTEX_INITIALIZER;
#endif
/*
 * Scan a memory buffer against one signature set.
 *
 * Allocates the partial-match bookkeeping arrays (ac_partsigs + 1 entries
 * each), runs the BM matcher (cli_bm_scanbuff) unless the set is AC-only,
 * and, if that did not report CL_VIRUS, runs the AC matcher
 * (cli_ac_scanbuff).
 *
 * On success returns 0 and stores the matcher result in *result.
 * Returns -1 (leaving *result untouched) when an allocation fails.
 */
static int cli_scanbuff_root(const char *buffer, unsigned int length, const char **virname, struct cli_matcher *root, unsigned short ftype, int *result)
{
    int ret, *partcnt;
    unsigned long int *partoff;

    if((partcnt = (int *) cli_calloc(root->ac_partsigs + 1, sizeof(int))) == NULL) {
        /* sizeof yields size_t; cast so the argument matches the conversion */
        cli_dbgmsg("cli_scanbuff(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (root->ac_partsigs + 1), (unsigned long) sizeof(int));
        return -1;
    }

    if((partoff = (unsigned long int *) cli_calloc(root->ac_partsigs + 1, sizeof(unsigned long int))) == NULL) {
        cli_dbgmsg("cli_scanbuff(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (root->ac_partsigs + 1), (unsigned long) sizeof(unsigned long int));
        free(partcnt);
        return -1;
    }

    if(root->ac_only || (ret = cli_bm_scanbuff(buffer, length, virname, root, 0, ftype, -1)) != CL_VIRUS)
        ret = cli_ac_scanbuff(buffer, length, virname, root, partcnt, 0, 0, partoff, ftype, -1, NULL);

    free(partcnt);
    free(partoff);

    *result = ret;
    return 0;
}

/*
 * Scan a memory buffer for signatures.
 *
 * buffer/length  data to scan
 * virname        passed through to the matchers
 * engine         signature engine; must not be NULL
 * ftype          file type of the data; when it matches a non-zero slot of
 *                targettab, the type-specific signature set is scanned
 *                before the generic one (engine->root[0])
 *
 * Returns CL_ENULLARG if engine is NULL, CL_EMEM if a bookkeeping array
 * cannot be allocated, CL_VIRUS as soon as either set reports a match, and
 * otherwise whatever the scan of the generic set returned.
 */
int cli_scanbuff(const char *buffer, unsigned int length, const char **virname, const struct cl_engine *engine, unsigned short ftype)
{
    int ret, i, tid = 0;
    struct cli_matcher *groot, *troot = NULL;

    if(!engine) {
        cli_errmsg("cli_scanbuff: engine == NULL\n");
        return CL_ENULLARG;
    }

    groot = engine->root[0]; /* generic signatures */

    if(ftype) {
        for(i = 0; i < CL_TARGET_TABLE_SIZE; i++) {
            if(targettab[i] == ftype) {
                tid = i;
                break;
            }
        }
        if(tid)
            troot = engine->root[tid];
    }

    if(troot) {
        if(cli_scanbuff_root(buffer, length, virname, troot, ftype, &ret))
            return CL_EMEM;
        /* a non-virus result from the type-specific set is discarded */
        if(ret == CL_VIRUS)
            return ret;
    }

    if(cli_scanbuff_root(buffer, length, virname, groot, ftype, &ret))
        return CL_EMEM;

    return ret;
}
/*
 * Look up a 16-byte MD5 digest in the engine's hash list.
 *
 * The first digest byte selects the bucket in engine->md5_hlist; the bucket's
 * chain is then walked comparing all 16 bytes. Returns the matching node, or
 * NULL when the bucket is empty or no node matches. The caller must make
 * sure engine->md5_hlist is not NULL.
 */
static struct cli_md5_node *cli_vermd5(const unsigned char *md5, const struct cl_engine *engine)
{
    struct cli_md5_node *node;

    for(node = engine->md5_hlist[md5[0] & 0xff]; node != NULL; node = node->next) {
        if(memcmp(node->md5, md5, 16) == 0)
            return node;
    }

    return NULL;
}
/*
 * Run an executable-header parser on fd from the start of the file and put
 * the file position back afterwards.
 *
 * Returns 0 when the parser succeeded (exeinfo is filled in and
 * exeinfo->section is owned by the caller), -1 when the current position
 * cannot be determined or the parser reports failure.
 */
static int cli_caloff_exeinfo(int fd, int (*einfo)(int, struct cli_exe_info *), struct cli_exe_info *exeinfo)
{
    off_t pos; /* off_t, not int: lseek() results do not fit in int for large files */
    int failed;

    if((pos = lseek(fd, 0, SEEK_CUR)) == -1) {
        cli_dbgmsg("Invalid descriptor\n");
        return -1;
    }

    lseek(fd, 0, SEEK_SET);
    failed = einfo(fd, exeinfo);
    lseek(fd, pos, SEEK_SET);

    return failed ? -1 : 0;
}

/*
 * Translate a signature offset string into an absolute file offset.
 *
 * Recognized forms of offstr:
 *   "<n>"     decimal number, returned as is
 *   "EP+<n>"  entry point plus n   (only for CL_TYPE_MSEXE / CL_TYPE_ELF)
 *   "EP-<n>"  entry point minus n  (only for CL_TYPE_MSEXE / CL_TYPE_ELF)
 *   "SL+<n>"  raw offset of the last section plus n (same file types)
 *   "S<x>+<n>" raw offset of section x plus n (same file types)
 *   "EOF-<n>" file size minus n
 *
 * fd is used to read the executable header or the file size; its file
 * position is restored after header parsing.
 *
 * Returns the computed offset, or -1 when the string is not recognized, the
 * header cannot be parsed, or the requested section does not exist.
 */
static long int cli_caloff(const char *offstr, int fd, unsigned short ftype)
{
    struct cli_exe_info exeinfo;
    int (*einfo)(int, struct cli_exe_info *) = NULL;
    long int offset = -1;
    int n;

    if(ftype == CL_TYPE_MSEXE)
        einfo = cli_peheader;
    else if(ftype == CL_TYPE_ELF)
        einfo = cli_elfheader;

    /* <ctype.h> functions are undefined for negative char values */
    if(isdigit((unsigned char) offstr[0]))
        return atoi(offstr);

    if(einfo && (!strncmp(offstr, "EP+", 3) || !strncmp(offstr, "EP-", 3))) {
        if(cli_caloff_exeinfo(fd, einfo, &exeinfo))
            return -1;

        /* only the entry point is needed here */
        free(exeinfo.section);

        if(offstr[2] == '+')
            return exeinfo.ep + atoi(offstr + 3);
        else
            return exeinfo.ep - atoi(offstr + 3);
    }

    if(einfo && offstr[0] == 'S') {
        if(cli_caloff_exeinfo(fd, einfo, &exeinfo))
            return -1;

        if(!strncmp(offstr, "SL", 2)) {
            if(sscanf(offstr, "SL+%ld", &offset) != 1) {
                free(exeinfo.section);
                return -1;
            }
            /* no sections: section[nsections - 1] would index before the array */
            if(exeinfo.nsections == 0) {
                free(exeinfo.section);
                return -1;
            }
            offset += exeinfo.section[exeinfo.nsections - 1].raw;
        } else {
            if(sscanf(offstr, "S%d+%ld", &n, &offset) != 2) {
                free(exeinfo.section);
                return -1;
            }
            /* %d accepts a sign, so reject negative indices as well */
            if(n < 0 || n >= exeinfo.nsections) {
                free(exeinfo.section);
                return -1;
            }
            offset += exeinfo.section[n].raw;
        }

        free(exeinfo.section);
        return offset;
    }

    if(!strncmp(offstr, "EOF-", 4)) {
        struct stat sb;

        if(fstat(fd, &sb) == -1)
            return -1;

        return sb.st_size - atoi(offstr + 4);
    }

    return -1;
}
/*
 * Check whether the file behind fd is listed as a known false positive.
 *
 * The whole-file MD5 digest is obtained from cli_md5digest() and looked up
 * in the engine's MD5 list. A hit counts only when the node is flagged as a
 * false-positive entry (fp) and its recorded size equals the file size.
 *
 * Returns 1 when the file is a listed false positive, 0 when it is not (or
 * when no MD5 list is loaded or the digest cannot be computed), and CL_EIO
 * when fstat() fails.
 *
 * NOTE(review): cli_scandesc() treats any non-zero result as "false
 * positive" and reports CL_CLEAN, which includes the CL_EIO case if CL_EIO
 * is non-zero - confirm that this is intended.
 */
int cli_checkfp(int fd, const struct cl_engine *engine)
{
    struct cli_md5_node *md5_node;
    unsigned char *digest;
    struct stat sb;
    int ret = 0;

    if(!engine->md5_hlist)
        return 0;

    if(!(digest = cli_md5digest(fd))) {
        cli_errmsg("cli_checkfp(): Can't generate MD5 checksum\n");
        return 0;
    }

    if((md5_node = cli_vermd5(digest, engine)) && md5_node->fp) {
        if(fstat(fd, &sb)) {
            /* fall through to the common exit so that digest is released */
            ret = CL_EIO;
        } else if((unsigned int) sb.st_size != md5_node->size) {
            cli_warnmsg("Detected false positive MD5 match. Please report.\n");
        } else {
            cli_dbgmsg("Eliminated false positive match (fp sig: %s)\n", md5_node->virname);
            ret = 1;
        }
    }

    free(digest);
    return ret;
}
/*
 * Verify that a signature match was found at the offset the signature
 * requires.
 *
 * target   not used by this function
 * ftype    file type, forwarded to cli_caloff()
 * offstr   offset specification of the signature; NULL means "any offset"
 * fileoff  offset at which the match was found
 * desc     descriptor of the scanned file; -1 disables the check
 * virname  signature name, used in debug messages only
 *
 * Returns 1 when the match is acceptable (including when no check is
 * possible), 0 when the offset specification cannot be resolved or does not
 * equal fileoff.
 */
int cli_validatesig(unsigned short target, unsigned short ftype, const char *offstr, unsigned long int fileoff, int desc, const char *virname)
{
    long int off;

    (void) target;

    if(!offstr || desc == -1)
        return 1;

    off = cli_caloff(offstr, desc, ftype);
    if(off == -1) {
        cli_dbgmsg("Bad offset in signature (%s)\n", virname);
        return 0;
    }

    if(fileoff != (unsigned long int) off) {
        /* conversions must match the argument types: unsigned long and long */
        cli_dbgmsg("Virus offset: %lu, expected: %ld (%s)\n", fileoff, off, virname);
        return 0;
    }

    return 1;
}
/*
 * Scan the data readable from a file descriptor for signatures.
 *
 * desc      descriptor to read from (read sequentially from its current
 *           position)
 * virname   passed to the matchers; set to the MD5 node's name on an MD5
 *           match (when not NULL)
 * scanned   if not NULL, incremented by bytes / CL_COUNT_PRECISION for each
 *           block read
 * engine    signature engine; must not be NULL
 * otfrec    when non-zero, results >= CL_TYPENO from scanning the generic
 *           set are tracked and the largest one is returned if nothing is
 *           detected
 * ftype     file type; selects an additional type-specific signature set
 *           through targettab
 * ftoffset  forwarded to cli_ac_scanbuff()
 *
 * Data is read in SCANBUFF-sized blocks into a buffer that has maxpatlen
 * extra bytes in front. After each full block its last maxpatlen bytes are
 * moved to the front of the buffer and the next scan starts there, so the
 * tail of one block is rescanned together with the following block.
 *
 * Returns CL_ENULLARG for a NULL engine, CL_EMEM on allocation failure,
 * CL_VIRUS on a signature match that cli_checkfp() does not reject (CL_CLEAN
 * if it does), CL_VIRUS on a whole-file MD5 match with matching size, CL_EIO
 * if fstat() fails during the MD5 check, and otherwise the tracked type
 * (otfrec != 0) or CL_CLEAN.
 *
 * NOTE(review): a read() error (negative return) ends the loop exactly like
 * end of file and is not reported.
 */
int cli_scandesc(int desc, const char **virname, long int *scanned, const struct cl_engine *engine, short otfrec, unsigned short ftype, unsigned long int *ftoffset)
{
    char *buffer, *buff, *endbl, *pt;
    int bytes, buffsize, length, ret;
    int *gpartcnt = NULL, *tpartcnt = NULL;
    int type = CL_CLEAN, i, tid = 0, found = 0;
    unsigned int maxpatlen;
    unsigned long int *gpartoff = NULL, *tpartoff = NULL, offset = 0;
    MD5_CTX ctx;
    unsigned char digest[16];
    struct cli_md5_node *md5_node;
    struct cli_matcher *groot, *troot = NULL;

    if(!engine) {
        cli_errmsg("cli_scandesc: engine == NULL\n");
        return CL_ENULLARG;
    }

    groot = engine->root[0]; /* generic signatures */

    if(ftype) {
        for(i = 0; i < CL_TARGET_TABLE_SIZE; i++) {
            if(targettab[i] == ftype) {
                tid = i;
                break;
            }
        }
        if(tid)
            troot = engine->root[tid];
    }

    if(troot)
        maxpatlen = MAX(troot->maxpatlen, groot->maxpatlen);
    else
        maxpatlen = groot->maxpatlen;

    /* prepare the buffer */
    buffsize = maxpatlen + SCANBUFF;
    if(!(buffer = (char *) cli_calloc(buffsize, sizeof(char)))) {
        cli_dbgmsg("cli_scandesc(): unable to cli_calloc(%d)\n", buffsize);
        return CL_EMEM;
    }

    /*
     * The bookkeeping pointers start out NULL, so the shared failure path
     * below can free all of them regardless of how far allocation got.
     */
    if((gpartcnt = (int *) cli_calloc(groot->ac_partsigs + 1, sizeof(int))) == NULL) {
        cli_dbgmsg("cli_scandesc(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (groot->ac_partsigs + 1), (unsigned long) sizeof(int));
        goto nomem;
    }

    if((gpartoff = (unsigned long int *) cli_calloc(groot->ac_partsigs + 1, sizeof(unsigned long int))) == NULL) {
        cli_dbgmsg("cli_scandesc(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (groot->ac_partsigs + 1), (unsigned long) sizeof(unsigned long int));
        goto nomem;
    }

    if(troot) {
        if((tpartcnt = (int *) cli_calloc(troot->ac_partsigs + 1, sizeof(int))) == NULL) {
            cli_dbgmsg("cli_scandesc(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (troot->ac_partsigs + 1), (unsigned long) sizeof(int));
            goto nomem;
        }

        if((tpartoff = (unsigned long int *) cli_calloc(troot->ac_partsigs + 1, sizeof(unsigned long int))) == NULL) {
            cli_dbgmsg("cli_scandesc(): unable to cli_calloc(%u, %lu)\n", (unsigned int) (troot->ac_partsigs + 1), (unsigned long) sizeof(unsigned long int));
            goto nomem;
        }
    }

    if(engine->md5_hlist)
        MD5_Init(&ctx);

    buff = buffer;
    buff += maxpatlen; /* pointer to read data block */
    endbl = buff + SCANBUFF - maxpatlen; /* pointer to the last block
                                          * length of maxpatlen
                                          */

    /* the very first scan starts at the read position; later ones at buffer */
    pt = buff;
    length = SCANBUFF;

    while((bytes = read(desc, buff, SCANBUFF)) > 0) {

        if(scanned)
            *scanned += bytes / CL_COUNT_PRECISION;

        /* short block: shrink the scan window by the bytes that are missing */
        if(bytes < SCANBUFF)
            length -= SCANBUFF - bytes;

        if(troot) {
            if(troot->ac_only || (ret = cli_bm_scanbuff(pt, length, virname, troot, offset, ftype, desc)) != CL_VIRUS)
                ret = cli_ac_scanbuff(pt, length, virname, troot, tpartcnt, otfrec, offset, tpartoff, ftype, desc, ftoffset);

            if(ret == CL_VIRUS) {
                found = 1;
                break;
            }
        }

        if(groot->ac_only || (ret = cli_bm_scanbuff(pt, length, virname, groot, offset, ftype, desc)) != CL_VIRUS)
            ret = cli_ac_scanbuff(pt, length, virname, groot, gpartcnt, otfrec, offset, gpartoff, ftype, desc, ftoffset);

        if(ret == CL_VIRUS) {
            found = 1;
            break;
        } else if(otfrec && ret >= CL_TYPENO) {
            if(ret >= type)
                type = ret;
        }

        if(bytes == SCANBUFF) {
            /* carry the tail of this block over to the front of the buffer */
            memmove(buffer, endbl, maxpatlen);

            if(pt == buffer) {
                offset += SCANBUFF;
            } else {
                /* first block: switch to scanning the whole buffer */
                offset += SCANBUFF - maxpatlen;
                pt = buffer;
                length = buffsize;
            }
        }

        if(engine->md5_hlist)
            MD5_Update(&ctx, buff, bytes);
    }

    free(buffer);
    free(gpartcnt);
    free(gpartoff);
    free(tpartcnt);
    free(tpartoff);

    if(found) {
        /* give the false-positive list a chance to veto the detection */
        lseek(desc, 0, SEEK_SET);
        if(cli_checkfp(desc, engine))
            return CL_CLEAN;
        else
            return CL_VIRUS;
    }

    if(engine->md5_hlist) {
        MD5_Final(digest, &ctx);

        if(cli_debug_flag) {
            char md5str[33], *hex = md5str;

            for(i = 0; i < 16; i++) {
                sprintf(hex, "%02x", digest[i]);
                hex += 2;
            }
            md5str[32] = 0;
            /* the hex string was previously built but never emitted */
            cli_dbgmsg("Calculated MD5 checksum: %s\n", md5str);
        }

        /* only non-fp nodes are detections; fp nodes are handled by cli_checkfp() */
        if((md5_node = cli_vermd5(digest, engine)) && !md5_node->fp) {
            struct stat sb;

            if(fstat(desc, &sb))
                return CL_EIO;

            if((unsigned int) sb.st_size != md5_node->size) {
                cli_warnmsg("Detected false positive MD5 match. Please report.\n");
            } else {
                if(virname)
                    *virname = md5_node->virname;

                return CL_VIRUS;
            }
        }
    }

    return otfrec ? type : CL_CLEAN;

nomem:
    free(buffer);
    free(gpartcnt);
    free(gpartoff);
    free(tpartcnt);
    free(tpartoff);
    return CL_EMEM;
}
/*
 * Finish engine setup: add the type signatures via cli_addtypesigs() and
 * call cli_ac_buildtrie() on every signature set present in engine->root.
 *
 * Returns the non-zero result of cli_addtypesigs() if it fails, 0 otherwise.
 */
int cl_build(struct cl_engine *engine)
{
    struct cli_matcher *matcher;
    int status, idx = 0;

    status = cli_addtypesigs(engine);
    if(status != 0)
        return status;

    while(idx < CL_TARGET_TABLE_SIZE) {
        matcher = engine->root[idx++];
        /* FIXME: check return values of cli_ac_buildtrie */
        if(matcher != NULL)
            cli_ac_buildtrie(matcher);
    }

    return 0;
}
/*
 * Take an additional reference to an engine.
 *
 * Increments engine->refcount (under cli_ref_mutex when built with
 * CL_THREAD_SAFE) and returns the same engine pointer. Returns NULL, after
 * logging an error, when engine is NULL.
 */
struct cl_engine *cl_dup(struct cl_engine *engine)
{
    if(engine != NULL) {
#ifdef CL_THREAD_SAFE
        pthread_mutex_lock(&cli_ref_mutex);
#endif

        engine->refcount += 1;

#ifdef CL_THREAD_SAFE
        pthread_mutex_unlock(&cli_ref_mutex);
#endif

        return engine;
    }

    cli_errmsg("cl_dup: engine == NULL\n");
    return NULL;
}
void cl_free(struct cl_engine *engine)
{
int i;
struct cli_md5_node *md5pt, *md5h;
struct cli_meta_node *metapt, *metah;
struct cli_matcher *root;
if(!engine) {
cli_errmsg("cl_free: engine == NULL\n");
return;
}
#ifdef CL_THREAD_SAFE
pthread_mutex_lock(&cli_ref_mutex);
#endif
engine->refcount--;
if(engine->refcount) {
#ifdef CL_THREAD_SAFE
pthread_mutex_unlock(&cli_ref_mutex);
#endif
return;
}
#ifdef CL_THREAD_SAFE
pthread_mutex_unlock(&cli_ref_mutex);
#endif
for(i = 0; i < CL_TARGET_TABLE_SIZE; i++) {
if((root = engine->root[i])) {
cli_ac_free(root);
if(!engine->root[i]->ac_only)
cli_bm_free(root);
}
}
if(engine->md5_hlist) {
for(i = 0; i < 256; i++) {
md5pt = engine->md5_hlist[i];
while(md5pt) {
md5h = md5pt;
md5pt = md5pt->next;
free(md5h->md5);
free(md5h->virname);
if(md5h->viralias)
free(md5h->viralias);
free(md5h);
}
}
free(engine->md5_hlist);
}
metapt = engine->zip_mlist;
while(metapt) {
metah = metapt;
metapt = metapt->next;
free(metah->virname);
if(metah->filename)
free(metah->filename);
free(metah);
}
metapt = engine->rar_mlist;
while(metapt) {
metah = metapt;
metapt = metapt->next;
free(metah->virname);
if(metah->filename)
free(metah->filename);
free(metah);
}
free(engine);
}