⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 utf-16.c

📁 Apache 2.0.63 is the current stable version of the 2.0 series, and is recommended over any previous 2.0 release.
💻 C
字号:
/*-
 * Copyright (c) 1999,2000
 *	Konstantin Chuguev.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by Konstantin Chuguev
 *	and its contributors.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	iconv (Charset Conversion Library) v1.0
 */

#define ICONV_INTERNAL
#include <iconv.h>

/* NULL-terminated list of the names this encoding is known by. */
static const char * const names[] = {
	"utf-16",
	"iso-10646-utf-16",
	"utf16",
	NULL
};

/*
 * Return this module's table of encoding names.
 *
 * The same static table is returned for every call; `ces' is accepted
 * only to match the descriptor's callback signature and is not examined.
 */
static const char * const *
utf16_names(struct iconv_ces *ces)
{
	const char * const *aliases = names;

	(void)ces;	/* the table does not depend on the instance */
	return aliases;
}

/*
 * Encode a single UCS code point as UTF-16, most significant byte first.
 *
 * ces->data is treated as an int flag: while it is zero, the bytes
 * 0xFE 0xFF are written ahead of the character and the flag is set to 1.
 *
 * Returns  1 when the character was written (or when `in' is
 *            UCS_CHAR_NONE, which is accepted without producing output
 *            and without touching the flag),
 *          0 when the output buffer is too small (nothing is written),
 *         -1 when `in' is above 0x10FFFF and cannot be represented.
 * On a successful write *outbuf and *outbytesleft are advanced past the
 * bytes produced.
 */
static apr_ssize_t
convert_from_ucs(struct iconv_ces *ces, ucs_t in,
	    unsigned char **outbuf, apr_size_t *outbytesleft)
{
	int *bom_done = (int *)ces->data;
	unsigned char *dst;
	int need;

	if (in == UCS_CHAR_NONE)
		return 1;
	if (in > 0x10FFFF)
		return -1;

	/* Two bytes per 16-bit unit: one unit up to 0xFFFF, two above it. */
	need = (in > 0xFFFF) ? 4 : 2;
	if (*bom_done == 0)
		need += 2;	/* room for the leading 0xFE 0xFF */
	if (*outbytesleft < need)
		return 0;

	dst = *outbuf;
	if (*bom_done == 0) {
		dst[0] = 0xFE;
		dst[1] = 0xFF;
		dst += 2;
		*bom_done = 1;
	}

	if (in > 0xFFFF) {
		/* Split the 20-bit offset into a high/low surrogate pair. */
		const ucs_t offset = in - 0x10000;
		const ucs_t high = 0xD800 | (offset >> 10);
		const ucs_t low = 0xDC00 | (offset & 0x3FF);

		dst[0] = (high >> 8) & 0xFF;
		dst[1] = high & 0xFF;
		dst[2] = (low >> 8) & 0xFF;
		dst[3] = low & 0xFF;
	} else {
		dst[0] = (in >> 8) & 0xFF;
		dst[1] = in & 0xFF;
	}

	*outbuf += need;
	*outbytesleft -= need;
	return 1;
}

/*
 * Combine two consecutive bytes into one 16-bit value, taking buf[0]
 * as the most significant byte.  The caller must guarantee that both
 * buf[0] and buf[1] are readable.
 */
static APR_INLINE ucs_t
msb(const unsigned char *buf)
{
	const unsigned int high = buf[0];
	const unsigned int low = buf[1];

	return (high << 8) | low;
}

/*
 * Decode one character from a UTF-16 byte stream.
 *
 * ces->data is treated as an int holding the byte-order state:
 *   0 - no byte-order mark seen so far; units are read MSB first,
 *   1 - a unit equal to UCS_CHAR_ZERO_WIDTH_NBSP (read MSB first) was
 *       seen; units are read MSB first,
 *   2 - a unit equal to UCS_CHAR_INVALID (read MSB first) was seen;
 *       units are read LSB first.
 * The mark test is applied to the first unit of every call, not only at
 * the start of the stream; a mark is skipped and the following unit is
 * decoded instead.
 *
 * Returns the decoded code point and advances *inbuf / *inbytesleft past
 * it.  Returns UCS_CHAR_NONE when the buffer ends before a complete
 * character is available; in that case *inbuf and *inbytesleft are left
 * exactly as they were on entry (the byte-order state may already have
 * been updated from a leading mark, which is harmless because the mark
 * is re-read on the next call).  Returns -1 (converted to ucs_t) when a
 * high surrogate is not followed by a low surrogate; the high surrogate,
 * and any mark before it, has been consumed in that case.
 *
 * NOTE(review): -1 is probably not the same value as UCS_CHAR_INVALID;
 * confirm what callers expect for a broken surrogate pair.
 */
static ucs_t
convert_to_ucs(struct iconv_ces *ces,
	const unsigned char **inbuf, apr_size_t *inbytesleft)
{
	ucs_t res, res2;
	int *state = (int *)ces->data;
	/* Entry position, so an incomplete character can be "un-read". */
	const unsigned char *start = *inbuf;
	apr_size_t start_left = *inbytesleft;
	int mark;

	if (*inbytesleft < 2)
		return UCS_CHAR_NONE;	/* Not enough bytes in the input buffer */
	res = msb(*inbuf);
	switch (res) {
	case UCS_CHAR_ZERO_WIDTH_NBSP:	/* mark in MSB order */
		*state = 1;
		mark = 1;
		break;
	case UCS_CHAR_INVALID:		/* byte-swapped mark: LSB order */
		*state = 2;
		mark = 1;
		break;
	default:
		mark = 0;
		break;
	}
	if (mark) {
		/* Need the mark plus at least one more unit. */
		if (*inbytesleft < 4)
			return UCS_CHAR_NONE;	/* Not enough bytes in the input buffer */
		*inbytesleft -= 2;
		res = msb((*inbuf) += 2);
	}
	if (*state == 2) {		/* LSB order: re-read the unit swapped */
		res = (*(*inbuf) ++);
		res |= (*(*inbuf) ++) << 8;
	} else
		*inbuf += 2;
	*inbytesleft -= 2;
	if ((res & 0xFC00) != 0xD800)	/* Non-surrogate character */
		return res;
	if (*inbytesleft < 2) {
		/*
		 * The low surrogate has not arrived yet.  Rewind to the entry
		 * position so the high surrogate is not lost: otherwise the
		 * next call would decode the low surrogate on its own.
		 */
		*inbuf = start;
		*inbytesleft = start_left;
		return UCS_CHAR_NONE;	/* Not enough bytes in the input buffer */
	}
	if (*state == 2) {
		res2 = (*inbuf)[0];
		res2 |= (*inbuf)[1] << 8;
	} else
		res2 = msb(*inbuf);
	if ((res2 & 0xFC00) != 0xDC00)	/* Broken surrogate pair */
		return -1;
	(*inbuf) += 2;
	(*inbytesleft) -= 2;
	/* Recombine the two 10-bit halves and add back the 0x10000 offset. */
	return (((res & 0x3FF) << 10) | (res2 & 0x3FF)) + 0x10000;
}

/*
 * Descriptor for this encoding scheme.  The initializer is positional;
 * the member names live in the project's iconv header and are not
 * visible in this file.  The apr_iconv_ces_* entries are helpers
 * declared elsewhere (presumably generic open/close/reset and size
 * callbacks -- confirm against the header); the remaining function
 * slots are filled with this file's own routines.
 */
static const struct iconv_ces_desc iconv_ces_desc = {
	apr_iconv_ces_open_func,
	apr_iconv_ces_close_func,
	apr_iconv_ces_reset_func,
	utf16_names,		/* returns the table of encoding names */
	apr_iconv_ces_nbits8,
	apr_iconv_ces_zero,
	convert_from_ucs,	/* UCS code point -> UTF-16 bytes */
	convert_to_ucs,		/* UTF-16 bytes -> UCS code point */
	NULL
};

/*
 * Module descriptor with external linkage (the only non-static symbol
 * in this file).  The initializer is positional; member names are
 * declared in the project's iconv header.  The last member points at
 * the encoding-scheme descriptor defined above.
 * NOTE(review): ICMOD_UC_CES presumably identifies the module type as a
 * character encoding scheme -- confirm against the header.
 */
struct iconv_module_desc iconv_module = {
	ICMOD_UC_CES,
	apr_iconv_mod_noevent,
	NULL,
	&iconv_ces_desc
};

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -