mirror of https://github.com/Cisco-Talos/clamav
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
97 lines
3.1 KiB
97 lines
3.1 KiB
/*
 *  Copyright (C) 2013-2022 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
 *  Copyright (C) 2011-2013 Sourcefire, Inc.
 *
 *  Authors: aCaB <acab@clamav.net>
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License version 2 as
 *  published by the Free Software Foundation.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 *  MA 02110-1301, USA.
 */
|
|
|
|
#if HAVE_CONFIG_H
#include "clamav-config.h"
#endif

#include <Windows.h>
#include <limits.h>
#include <stdlib.h>
#include <string.h>

#include "utf8_util.h"
|
|
|
|
/**
 * Return a UTF-8 version of a string that the caller always owns.
 *
 * Wraps cli_to_utf8_maybe_alloc(): when that function hands back the input
 * pointer itself (no conversion was necessary) the string is duplicated with
 * _strdup(), so the result never aliases the input.
 *
 * @param s  NUL-terminated input string; NULL yields NULL.
 * @return   The pointer produced by cli_to_utf8_maybe_alloc() or _strdup(),
 *           or NULL when the input is NULL or the conversion/duplication fails.
 */
char *cli_strdup_to_utf8(const char *s)
{
    char *r;

    /* The converter calls strlen() on its argument, so reject NULL up front */
    if (!s)
        return NULL;

    r = cli_to_utf8_maybe_alloc(s);
    if (!r)
        return NULL;

    /* Same pointer back means "input was already UTF-8": make a private copy */
    if (r == s)
        return _strdup(r);

    return r;
}
|
|
|
|
/*
 * Scratch-buffer cleanup helpers used by cli_to_utf8_maybe_alloc().
 *
 * Both macros expand in place and refer to the enclosing function's locals
 * by name: `wdup` / `utf8` are the working pointers and `tmpw` / `tmpu` the
 * fixed-size arrays they may point at. A pointer is handed to free() only
 * when it does not point at its companion array.
 */
#define MAYBE_FREE_W          \
    do {                      \
        if (wdup != tmpw)     \
            free(wdup);       \
    } while (0)
#define MAYBE_FREE_U          \
    do {                      \
        if (utf8 != tmpu)     \
            free(utf8);       \
    } while (0)
|
|
char *cli_to_utf8_maybe_alloc(const char *s)
|
|
{
|
|
int len = strlen(s) + 1;
|
|
wchar_t tmpw[1024], *wdup;
|
|
char tmpu[1024], *utf8;
|
|
|
|
if (len >= sizeof(tmpw) / sizeof(*tmpw)) {
|
|
wdup = (wchar_t *)malloc(len * sizeof(wchar_t));
|
|
if (!wdup) return NULL;
|
|
} else
|
|
wdup = tmpw;
|
|
|
|
/* Check if already UTF8 first... */
|
|
if (MultiByteToWideChar(CP_UTF8, MB_ERR_INVALID_CHARS, s, -1, wdup, len)) {
|
|
/* XP acts funny on MB_ERR_INVALID_CHARS, so we translate back and compare
|
|
On Vista+ the flag is honored and there is no such overhead */
|
|
int ulen;
|
|
if ((ulen = WideCharToMultiByte(CP_UTF8, 0, wdup, -1, NULL, 0, NULL, NULL))) {
|
|
if (ulen > sizeof(tmpu)) {
|
|
utf8 = (char *)malloc(ulen);
|
|
if (!utf8) {
|
|
MAYBE_FREE_W;
|
|
return NULL;
|
|
}
|
|
} else
|
|
utf8 = tmpu;
|
|
if (WideCharToMultiByte(CP_UTF8, 0, wdup, -1, utf8, ulen, NULL, NULL) && !strcmp(s, utf8)) {
|
|
MAYBE_FREE_W;
|
|
MAYBE_FREE_U;
|
|
return s;
|
|
}
|
|
MAYBE_FREE_U;
|
|
}
|
|
/* We should never land here */
|
|
}
|
|
|
|
/* ... then assume ANSI */
|
|
if (MultiByteToWideChar(CP_ACP, MB_ERR_INVALID_CHARS, s, -1, wdup, len)) {
|
|
if ((len = WideCharToMultiByte(CP_UTF8, 0, wdup, -1, NULL, 0, NULL, NULL))) {
|
|
if ((utf8 = (char *)malloc(len))) {
|
|
if (WideCharToMultiByte(CP_UTF8, 0, wdup, -1, utf8, len, NULL, NULL)) {
|
|
MAYBE_FREE_W;
|
|
return utf8;
|
|
}
|
|
free(utf8);
|
|
}
|
|
}
|
|
}
|
|
MAYBE_FREE_W;
|
|
return NULL;
|
|
}
|
|
|