⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 euc_tw_and_big5.c

📁 PostgreSQL 8.1.4的源码 适用于Linux下的开源数据库系统
💻 C
字号:
/*------------------------------------------------------------------------- * *	  EUC_TW, BIG5 and MULE_INTERNAL * * Portions Copyright (c) 1996-2005, PostgreSQL Global Development Group * Portions Copyright (c) 1994, Regents of the University of California * * IDENTIFICATION *	  $PostgreSQL: pgsql/src/backend/utils/mb/conversion_procs/euc_tw_and_big5/euc_tw_and_big5.c,v 1.10.2.1 2006/05/21 20:05:48 tgl Exp $ * *------------------------------------------------------------------------- */#include "postgres.h"#include "fmgr.h"#include "mb/pg_wchar.h"#define ENCODING_GROWTH_RATE 4PG_FUNCTION_INFO_V1(euc_tw_to_big5);PG_FUNCTION_INFO_V1(big5_to_euc_tw);PG_FUNCTION_INFO_V1(euc_tw_to_mic);PG_FUNCTION_INFO_V1(mic_to_euc_tw);PG_FUNCTION_INFO_V1(big5_to_mic);PG_FUNCTION_INFO_V1(mic_to_big5);extern Datum euc_tw_to_big5(PG_FUNCTION_ARGS);extern Datum big5_to_euc_tw(PG_FUNCTION_ARGS);extern Datum euc_tw_to_mic(PG_FUNCTION_ARGS);extern Datum mic_to_euc_tw(PG_FUNCTION_ARGS);extern Datum big5_to_mic(PG_FUNCTION_ARGS);extern Datum mic_to_big5(PG_FUNCTION_ARGS);/* ---------- * conv_proc( *		INTEGER,	-- source encoding id *		INTEGER,	-- destination encoding id *		CSTRING,	-- source string (null terminated C string) *		CSTRING,	-- destination string (null terminated C string) *		INTEGER		-- source string length * ) returns VOID; * ---------- */static void big52mic(const unsigned char *big5, unsigned char *p, int len);static void mic2big5(const unsigned char *mic, unsigned char *p, int len);static void euc_tw2mic(const unsigned char *euc, unsigned char *p, int len);static void mic2euc_tw(const unsigned char *mic, unsigned char *p, int len);Datumeuc_tw_to_big5(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	unsigned char *buf;	Assert(PG_GETARG_INT32(0) == PG_EUC_TW);	Assert(PG_GETARG_INT32(1) == PG_BIG5);	Assert(len >= 0);	buf = palloc(len * ENCODING_GROWTH_RATE);	euc_tw2mic(src, buf, len);	mic2big5(buf, dest, strlen((char *) buf));	pfree(buf);	PG_RETURN_VOID();}Datumbig5_to_euc_tw(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	unsigned char *buf;	Assert(PG_GETARG_INT32(0) == PG_BIG5);	Assert(PG_GETARG_INT32(1) == PG_EUC_TW);	Assert(len >= 0);	buf = palloc(len * ENCODING_GROWTH_RATE);	big52mic(src, buf, len);	mic2euc_tw(buf, dest, strlen((char *) buf));	pfree(buf);	PG_RETURN_VOID();}Datumeuc_tw_to_mic(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	Assert(PG_GETARG_INT32(0) == PG_EUC_TW);	Assert(PG_GETARG_INT32(1) == PG_MULE_INTERNAL);	Assert(len >= 0);	euc_tw2mic(src, dest, len);	PG_RETURN_VOID();}Datummic_to_euc_tw(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	Assert(PG_GETARG_INT32(0) == PG_MULE_INTERNAL);	Assert(PG_GETARG_INT32(1) == PG_EUC_TW);	Assert(len >= 0);	mic2euc_tw(src, dest, len);	PG_RETURN_VOID();}Datumbig5_to_mic(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	Assert(PG_GETARG_INT32(0) == PG_BIG5);	Assert(PG_GETARG_INT32(1) == PG_MULE_INTERNAL);	Assert(len >= 0);	big52mic(src, dest, len);	PG_RETURN_VOID();}Datummic_to_big5(PG_FUNCTION_ARGS){	unsigned char *src = (unsigned char *) PG_GETARG_CSTRING(2);	unsigned char *dest = (unsigned char *) PG_GETARG_CSTRING(3);	int			len = PG_GETARG_INT32(4);	Assert(PG_GETARG_INT32(0) == PG_MULE_INTERNAL);	Assert(PG_GETARG_INT32(1) == PG_BIG5);	Assert(len >= 0);	mic2big5(src, dest, len);	PG_RETURN_VOID();}/* * EUC_TW ---> MIC */static voideuc_tw2mic(const unsigned char *euc, unsigned char *p, int len){	int			c1;	int			l;	while (len > 0)	{		c1 = *euc;		if (IS_HIGHBIT_SET(c1))		{			l = pg_encoding_verifymb(PG_EUC_TW, (const char *) euc, len);			if (l < 0)				report_invalid_encoding(PG_EUC_TW,										(const char *) euc, len);			if (c1 == SS2)			{				c1 = euc[1];		/* plane No. */				if (c1 == 0xa1)					*p++ = LC_CNS11643_1;				else if (c1 == 0xa2)					*p++ = LC_CNS11643_2;				else				{					*p++ = 0x9d;	/* LCPRV2 */					*p++ = c1 - 0xa3 + LC_CNS11643_3;				}				*p++ = euc[2];				*p++ = euc[3];			}			else			{						/* CNS11643-1 */				*p++ = LC_CNS11643_1;				*p++ = c1;				*p++ = euc[1];			}			euc += l;			len -= l;		}		else		{						/* should be ASCII */			if (c1 == 0)				report_invalid_encoding(PG_EUC_TW,										(const char *) euc, len);			*p++ = c1;			euc++;			len--;		}	}	*p = '\0';}/* * MIC ---> EUC_TW */static voidmic2euc_tw(const unsigned char *mic, unsigned char *p, int len){	int			c1;	int			l;	while (len > 0)	{		c1 = *mic;		if (!IS_HIGHBIT_SET(c1))		{			/* ASCII */			if (c1 == 0)				report_invalid_encoding(PG_MULE_INTERNAL,										(const char *) mic, len);			*p++ = c1;			mic++;			len--;			continue;		}		l = pg_encoding_verifymb(PG_MULE_INTERNAL, (const char *) mic, len);		if (l < 0)			report_invalid_encoding(PG_MULE_INTERNAL,									(const char *) mic, len);		if (c1 == LC_CNS11643_1)		{			*p++ = mic[1];			*p++ = mic[2];		}		else if (c1 == LC_CNS11643_2)		{			*p++ = SS2;			*p++ = 0xa2;			*p++ = mic[1];			*p++ = mic[2];		}		else if (c1 == 0x9d &&				 mic[1] >= LC_CNS11643_3 && mic[1] <= LC_CNS11643_7)		{						/* LCPRV2? */			*p++ = SS2;			*p++ = mic[1] - LC_CNS11643_3 + 0xa3;			*p++ = mic[2];			*p++ = mic[3];		}		else			report_untranslatable_char(PG_MULE_INTERNAL, PG_EUC_TW,									   (const char *) mic, len);		mic += l;		len -= l;	}	*p = '\0';}/* * Big5 ---> MIC */static voidbig52mic(const unsigned char *big5, unsigned char *p, int len){	unsigned short c1;	unsigned short big5buf,				cnsBuf;	unsigned char lc;	int			l;	while (len > 0)	{		c1 = *big5;		if (!IS_HIGHBIT_SET(c1))		{			/* ASCII */			if (c1 == 0)				report_invalid_encoding(PG_BIG5,										(const char *) big5, len);			*p++ = c1;			big5++;			len--;			continue;		}		l = pg_encoding_verifymb(PG_BIG5, (const char *) big5, len);		if (l < 0)			report_invalid_encoding(PG_BIG5,									(const char *) big5, len);		big5buf = (c1 << 8) | big5[1];		cnsBuf = BIG5toCNS(big5buf, &lc);		if (lc != 0)		{			if (lc == LC_CNS11643_3 || lc == LC_CNS11643_4)			{				*p++ = 0x9d;	/* LCPRV2 */			}			*p++ = lc;		/* Plane No. */			*p++ = (cnsBuf >> 8) & 0x00ff;			*p++ = cnsBuf & 0x00ff;		}		else			report_untranslatable_char(PG_BIG5, PG_MULE_INTERNAL,									   (const char *) big5, len);		big5 += l;		len -= l;	}	*p = '\0';}/* * MIC ---> Big5 */static voidmic2big5(const unsigned char *mic, unsigned char *p, int len){	unsigned short c1;	unsigned short big5buf,				cnsBuf;	int			l;	while (len > 0)	{		c1 = *mic;		if (!IS_HIGHBIT_SET(c1))		{			/* ASCII */			if (c1 == 0)				report_invalid_encoding(PG_MULE_INTERNAL,										(const char *) mic, len);			*p++ = c1;			mic++;			len--;			continue;		}		l = pg_encoding_verifymb(PG_MULE_INTERNAL, (const char *) mic, len);		if (l < 0)			report_invalid_encoding(PG_MULE_INTERNAL,									(const char *) mic, len);		/* 0x9d means LCPRV2 */		if (c1 == LC_CNS11643_1 || c1 == LC_CNS11643_2 || c1 == 0x9d)		{			if (c1 == 0x9d)			{				c1 = mic[1];	/* get plane no. */				cnsBuf = (mic[2] << 8) | mic[3];			}			else			{				cnsBuf = (mic[1] << 8) | mic[2];			}			big5buf = CNStoBIG5(cnsBuf, c1);			if (big5buf == 0)				report_untranslatable_char(PG_MULE_INTERNAL, PG_BIG5,										   (const char *) mic, len);			*p++ = (big5buf >> 8) & 0x00ff;			*p++ = big5buf & 0x00ff;		}		else			report_untranslatable_char(PG_MULE_INTERNAL, PG_BIG5,									   (const char *) mic, len);		mic += l;		len -= l;	}	*p = '\0';}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -