utf8_and_iso8859_1.c

来自「postgresql8.3.4源码,开源数据库」· C语言 代码 · 共 120 行

C
120
字号
/*------------------------------------------------------------------------- * *	  ISO8859_1 <--> UTF8 * * Portions Copyright (c) 1996-2008, PostgreSQL Global Development Group * Portions Copyright (c) 1994, Regents of the University of California * * IDENTIFICATION *	  $PostgreSQL: pgsql/src/backend/utils/mb/conversion_procs/utf8_and_iso8859_1/utf8_and_iso8859_1.c,v 1.20 2008/01/01 19:45:54 momjian Exp $ * *------------------------------------------------------------------------- */#include "postgres.h"#include "fmgr.h"#include "mb/pg_wchar.h"PG_MODULE_MAGIC;PG_FUNCTION_INFO_V1(iso8859_1_to_utf8);PG_FUNCTION_INFO_V1(utf8_to_iso8859_1);extern Datum iso8859_1_to_utf8(PG_FUNCTION_ARGS);extern Datum utf8_to_iso8859_1(PG_FUNCTION_ARGS);/* ---------- * conv_proc( *		INTEGER,	-- source encoding id *		INTEGER,	-- destination encoding id *		CSTRING,	-- source string (null terminated C string) *		CSTRING,	-- destination string (null terminated C string) *		INTEGER		-- source string length * ) returns VOID; * ---------- */Datumiso8859_1_to_utf8(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	unsigned short c;	Assert(PG_GETARG_INT32(0) == PG_LATIN1);	Assert(PG_GETARG_INT32(1) == PG_UTF8);	Assert(len >= 0);	while (len > 0)	{		c = *src;		if (c == 0)			report_invalid_encoding(PG_LATIN1, (const char *) src, len);		if (!IS_HIGHBIT_SET(c))			*dest++ = c;		else		{			*dest++ = (c >> 6) | 0xc0;			*dest++ = (c & 0x003f) | HIGHBIT;		}		src++;		len--;	}	*dest = '\0';	PG_RETURN_VOID();}Datumutf8_to_iso8859_1(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	unsigned short c,				c1;	Assert(PG_GETARG_INT32(0) == PG_UTF8);	Assert(PG_GETARG_INT32(1) == PG_LATIN1);	Assert(len >= 0);	while (len > 0)	{		c = *src;		if (c == 0)			report_invalid_encoding(PG_UTF8, (const char *) src, len);		/* fast path for ASCII-subset characters */		if (!IS_HIGHBIT_SET(c))		{			*dest++ = c;			src++;			len--;		}		else		{			int			l = pg_utf_mblen(src);			if (l > len || !pg_utf8_islegal(src, l))				report_invalid_encoding(PG_UTF8, (const char *) src, len);			if (l != 2)				report_untranslatable_char(PG_UTF8, PG_LATIN1,										   (const char *) src, len);			c1 = src[1] & 0x3f;			c = ((c & 0x1f) << 6) | c1;			if (c >= 0x80 && c <= 0xff)			{				*dest++ = (unsigned char) c;				src += 2;				len -= 2;			}			else				report_untranslatable_char(PG_UTF8, PG_LATIN1,										   (const char *) src, len);		}	}	*dest = '\0';	PG_RETURN_VOID();}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?