2019-01-30 00:44:31 +03:30
|
|
|
/*
|
|
|
|
* Copyright 2000 Alexandre Julliard
|
|
|
|
* Copyright 2019 Zhiyi Zhang for CodeWeavers
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "vkd3d_memory.h"
|
|
|
|
#include "vkd3d_utf8.h"
|
|
|
|
|
|
|
|
#include <inttypes.h>
|
|
|
|
|
|
|
|
static size_t vkd3d_utf8_len(uint32_t c)
|
|
|
|
{
|
|
|
|
/* 0x00-0x7f: 1 byte */
|
|
|
|
if (c < 0x80)
|
|
|
|
return 1;
|
|
|
|
/* 0x80-0x7ff: 2 bytes */
|
|
|
|
if (c < 0x800)
|
|
|
|
return 2;
|
|
|
|
/* 0x800-0xffff: 3 bytes */
|
|
|
|
if (c < 0x10000)
|
|
|
|
return 3;
|
|
|
|
/* 0x10000-0x10ffff: 4 bytes */
|
|
|
|
return 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void vkd3d_utf8_append(char **dst, uint32_t c)
|
|
|
|
{
|
|
|
|
char *d = *dst;
|
|
|
|
|
|
|
|
/* 0x00-0x7f: 1 byte */
|
|
|
|
if (c < 0x80)
|
|
|
|
{
|
|
|
|
d[0] = c;
|
|
|
|
*dst += 1;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 0x80-0x7ff: 2 bytes */
|
|
|
|
if (c < 0x800)
|
|
|
|
{
|
|
|
|
d[1] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[0] = 0xc0 | c;
|
|
|
|
*dst += 2;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 0x800-0xffff: 3 bytes */
|
|
|
|
if (c < 0x10000) /* 0x800-0xffff: 3 bytes */
|
|
|
|
{
|
|
|
|
d[2] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[1] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[0] = 0xe0 | c;
|
|
|
|
*dst += 3;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 0x10000-0x10ffff: 4 bytes */
|
|
|
|
d[3] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[2] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[1] = 0x80 | (c & 0x3f);
|
|
|
|
c >>= 6;
|
|
|
|
d[0] = 0xf0 | c;
|
|
|
|
*dst += 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
static uint32_t vkd3d_utf16_read(const uint16_t **src)
|
|
|
|
{
|
|
|
|
const uint16_t *s = *src;
|
|
|
|
|
|
|
|
if (s[0] < 0xd800 || s[0] > 0xdfff) /* Not a surrogate pair. */
|
|
|
|
{
|
|
|
|
*src += 1;
|
|
|
|
return s[0];
|
|
|
|
}
|
|
|
|
|
|
|
|
if (s[0] > 0xdbff /* Invalid high surrogate. */
|
|
|
|
|| s[1] < 0xdc00 || s[1] > 0xdfff) /* Invalid low surrogate. */
|
|
|
|
{
|
|
|
|
*src += 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
*src += 2;
|
|
|
|
return 0x10000 + ((s[0] & 0x3ff) << 10) + (s[1] & 0x3ff);
|
|
|
|
}
|
|
|
|
|
|
|
|
static char *vkd3d_strdup_w16_utf8(const uint16_t *wstr)
|
|
|
|
{
|
|
|
|
const uint16_t *src = wstr;
|
|
|
|
size_t dst_size = 0;
|
2019-02-01 09:42:51 +01:00
|
|
|
char *dst, *utf8;
|
2019-01-30 00:44:31 +03:30
|
|
|
uint32_t c;
|
|
|
|
|
|
|
|
while (*src)
|
|
|
|
{
|
|
|
|
if (!(c = vkd3d_utf16_read(&src)))
|
|
|
|
continue;
|
|
|
|
dst_size += vkd3d_utf8_len(c);
|
|
|
|
}
|
|
|
|
++dst_size;
|
|
|
|
|
|
|
|
if (!(dst = vkd3d_malloc(dst_size)))
|
|
|
|
return NULL;
|
|
|
|
|
2019-02-01 09:42:51 +01:00
|
|
|
utf8 = dst;
|
2019-01-30 00:44:31 +03:30
|
|
|
src = wstr;
|
|
|
|
while (*src)
|
|
|
|
{
|
|
|
|
if (!(c = vkd3d_utf16_read(&src)))
|
|
|
|
continue;
|
2019-02-01 09:42:51 +01:00
|
|
|
vkd3d_utf8_append(&utf8, c);
|
2019-01-30 00:44:31 +03:30
|
|
|
}
|
2019-02-01 09:42:51 +01:00
|
|
|
*utf8 = 0;
|
2019-01-30 00:44:31 +03:30
|
|
|
|
|
|
|
return dst;
|
|
|
|
}
|
|
|
|
|
|
|
|
static char *vkd3d_strdup_w32_utf8(const uint32_t *wstr)
|
|
|
|
{
|
|
|
|
const uint32_t *src = wstr;
|
|
|
|
size_t dst_size = 0;
|
2019-02-01 09:42:51 +01:00
|
|
|
char *dst, *utf8;
|
2019-01-30 00:44:31 +03:30
|
|
|
|
|
|
|
while (*src)
|
|
|
|
dst_size += vkd3d_utf8_len(*src++);
|
|
|
|
++dst_size;
|
|
|
|
|
|
|
|
if (!(dst = vkd3d_malloc(dst_size)))
|
|
|
|
return NULL;
|
|
|
|
|
2019-02-01 09:42:51 +01:00
|
|
|
utf8 = dst;
|
2019-01-30 00:44:31 +03:30
|
|
|
src = wstr;
|
|
|
|
while (*src)
|
2019-02-01 09:42:51 +01:00
|
|
|
vkd3d_utf8_append(&utf8, *src++);
|
|
|
|
*utf8 = 0;
|
2019-01-30 00:44:31 +03:30
|
|
|
|
|
|
|
return dst;
|
|
|
|
}
|
|
|
|
|
|
|
|
char *vkd3d_strdup_w_utf8(const WCHAR *wstr, size_t wchar_size)
|
|
|
|
{
|
|
|
|
if (wchar_size == 2)
|
|
|
|
return vkd3d_strdup_w16_utf8((const uint16_t *)wstr);
|
|
|
|
return vkd3d_strdup_w32_utf8((const uint32_t *)wstr);
|
|
|
|
}
|