joliet.c

来自「一款功能很强的光盘镜象制作工具」· C语言代码 · 共 1,397 行 · 第 1/3 页
1,397 行
/* @(#)joliet.c	1.34 02/11/22 joerg */#ifndef lintstatic	char sccsid[] =	"@(#)joliet.c	1.34 02/11/22 joerg";#endif/* * File joliet.c - handle Win95/WinNT long file/unicode extensions for iso9660.   Copyright 1997 Eric Youngdale.   APPLE_HYB James Pearson j.pearson@ge.ucl.ac.uk 22/2/2000   Copyright (c) 1999,2000,2001 J. Schilling   This program is free software; you can redistribute it and/or modify   it under the terms of the GNU General Public License as published by   the Free Software Foundation; either version 2, or (at your option)   any later version.   This program is distributed in the hope that it will be useful,   but WITHOUT ANY WARRANTY; without even the implied warranty of   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the   GNU General Public License for more details.   You should have received a copy of the GNU General Public License   along with this program; if not, write to the Free Software   Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.  *//* * Joliet extensions for ISO9660.  These are spottily documented by * Microsoft.  In their infinite stupidity, they completely ignored * the possibility of using an SUSP record with the long filename * in it, and instead wrote out a duplicate directory tree with the * long filenames in it. * * I am not sure why they did this.  One reason is that they get the path * tables with the long filenames in them. * * There are two basic principles to Joliet, and the non-Unicode variant * known as Romeo.  Long filenames seem to be the main one, and the second * is that the character set and a few other things is substantially relaxed. * * The SVD is identical to the PVD, except: * *	Id is 2, not 1 (indicates SVD). *	escape_sequences contains UCS-2 indicator (levels 1, 2 or 3). *	The root directory record points to a different extent (with different *		size). *	There are different path tables for the two sets of directory trees. * * The Unicode level is coded in the SVD as follows: * *	Standard	Level	ASCII escape code *	UCS-2		Level-1	%/@ *	UCS-2		Level-2	%/C *	UCS-2		Level-3	%/E * * The following fields are recorded in Unicode: *	system_id *	volume_id *	volume_set_id *	publisher_id *	preparer_id *	application_id *	copyright_file_id *	abstract_file_id *	bibliographic_file_id * * Unicode strings are always encoded in big-endian format. * * In a directory record, everything is the same as with iso9660, except * that the name is recorded in unicode.  The name length is specified in * total bytes, not in number of unicode characters. * * The character set used for the names is different with UCS - the * restrictions are that the following are not allowed: * *	Characters (00)(00) through (00)(1f) (control chars) *	(00)(2a) '*' *	(00)(2f) '/' *	(00)(3a) ':' *	(00)(3b) ';' *	(00)(3f) '?' *	(00)(5c) '\' */#include <mconfig.h>#include "mkisofs.h"#include "gbk2uni.h"#include <timedefs.h>#include <utypes.h>#include <intcvt.h>#include <unls.h>	/* For UNICODE translation */#include <schily.h>static Uint	jpath_table_index;static struct directory **jpathlist;static int      next_jpath_index = 1;static int      sort_goof;static	char	ucs_codes[] = {		'\0',		/* UCS-level 0 is illegal	*/		'@',		/* UCS-level 1			*/		'C',		/* UCS-level 2			*/		'E',		/* UCS-level 3			*/};	#ifdef	UDF       void	convert_to_unicode	__PR((unsigned char *buffer,		int size, char *source, struct nls_table *inls, int flag));       int	joliet_strlen		__PR((const char *string, int flag));#elsestatic void	convert_to_unicode	__PR((unsigned char *buffer,		int size, char *source, struct nls_table *inls, int flag));static int	joliet_strlen		__PR((const char *string, int flag));#endifstatic void	get_joliet_vol_desc	__PR((struct iso_primary_descriptor *jvol_desc));static void	assign_joliet_directory_addresses __PR((struct directory *node));static void	build_jpathlist		__PR((struct directory *node));static int	joliet_compare_paths	__PR((void const *r, void const *l));static int	generate_joliet_path_tables __PR((void));static void	generate_one_joliet_directory __PR((struct directory *dpnt,						FILE *outfile));static int	joliet_sort_n_finish	__PR((struct directory *this_dir));static int	joliet_compare_dirs	__PR((const void *rr, const void *ll));static int	joliet_sort_directory	__PR((struct directory_entry **sort_dir));	int	joliet_sort_tree	__PR((struct directory *node));static void	generate_joliet_directories __PR((struct directory *node,						FILE *outfile));static int	jpathtab_write		__PR((FILE *outfile));static int	jdirtree_size		__PR((int starting_extent));static int	jroot_gen		__PR((void));static int	jdirtree_write		__PR((FILE *outfile));static int	jvd_write		__PR((FILE *outfile));static int	jpathtab_size		__PR((int starting_extent));/* *	conv_charset: convert to/from charsets via Unicode. * *	Any unknown character is set to '_' * */#ifdef	PROTOTYPESunsigned char conv_charset(unsigned char c,	struct nls_table *inls,	struct nls_table *onls)#elseunsigned char conv_charset(c, inls, onls)	unsigned char c;	struct nls_table *inls;	struct nls_table *onls;#endif{	unsigned char uh,		      ul,		      uc,		      *up;	/* if we have a null mapping, just return the input character */	if (inls == onls)		return c;	/* get high and low UNICODE bytes */	uh = inls->charset2uni[c].uni2;	ul = inls->charset2uni[c].uni1;	/* get the backconverted page from the output charset */	up = onls->page_uni2charset[uh];	/* if the page exists, get the backconverted character */	if (up == NULL)		uc = '\0';	else		uc = up[ul];	/* return the backconverted, if it's not NULL */	return (uc ? uc : '_');}/* * Function:		convert_to_unicode * * Purpose:		Perform a unicode conversion on a text string *			using the supplied input character set. * * Notes: */#ifdef	UDFvoid#elsestatic void#endifconvert_to_unicode(buffer, size, source, inls, flag)	int             flag;	unsigned char	*buffer;	int		size;	char		*source;	struct nls_table *inls;{	unsigned char	*tmpbuf;	int		i;	int		j;	int             p;	u_int16_t       code, 	                unicode;	unsigned char	uh,			ul,			uc,			*up;	/*	 * If we get a NULL pointer for the source, it means we have an	 * inplace copy, and we need to make a temporary working copy first.	 */	if (source == NULL) {		tmpbuf = (Uchar *) e_malloc(size);		memcpy(tmpbuf, buffer, size);	} else {		tmpbuf = (Uchar *) source;	}	/*	 * Now start copying characters.  If the size was specified to be 0,	 * then assume the input was 0 terminated.	 */	j = 0;	for (i = 0; (i + 1) < size; i += 2, j++) {	/* Size may be odd!!!*/		/*		 * JS integrated from: Achim_Kaiser@t-online.de		 * SGE modified according to Linux kernel source		 * Let all valid unicode characters pass		 * through (according to charset). Others are set to '_' .		 */		uc = tmpbuf[j];			/* temporary copy */		if (uc != '\0') {		/* must be converted */			uh = inls->charset2uni[uc].uni2;	/* convert forward:							   hibyte...	     */			ul = inls->charset2uni[uc].uni1;	/* ...lobyte	     */			up = inls->page_uni2charset[uh];	/* convert backward:							   page...	     */			if (up == NULL)				uc = '\0';	/* ...wrong unicode page     */			else				uc = up[ul];	/* backconverted character   */			if (uc != tmpbuf[j])				uc = '\0';	/* should be identical */			if (uc <= 0x1f || uc == 0x7f)				uc = '\0';	/* control char */			switch (uc) {		/* test special characters */			case '*':			case '/':			case ':':			case ';':			case '?':			case '\\':			case '\0':		/* illegal char mark */				/*				 * Even Joliet has some standards as to what is				 * allowed in a pathname. Pretty tame in				 * comparison to what DOS restricts you to.				 */				uc = '_';			}		}		buffer[i] = inls->charset2uni[uc].uni2;	/* final UNICODE							   conversion */		buffer[i + 1] = inls->charset2uni[uc].uni1;		/**===================================**//* big5 to unicode patch, flag=gbk4win *//* use flag param to call external int *//**===================================**/ if  (flag >= 1) { 	 if  ( tmpbuf[j] >= 0x81 ) { /* **** 00 A4 00 A4 00 A4 00 E5 **** */ /* ****          中          文 **** */ /* ***j=A4 A4 A4 E5 --> code=0xa4a4 ->find unicode **** */  /* ****  E 2D 65 87 <--- result **** */  code = tmpbuf[j];  code = code << 8;  code += tmpbuf[j+1];    unicode = gbk2uni[(((code&0xFF00)>>8)-0x81)*192 + ((code&0x00FF)-0x40)];    if (unicode) {    buffer[i] = unicode >> 8;    buffer[i+1] = unicode ;    j++;     }   }}	}	if (size & 1) {	/* beautification */		buffer[size - 1] = 0;	}	if (source == NULL) {		free(tmpbuf);	}}/* * Function:	joliet_strlen * * Purpose:	Return length in bytes of string after conversion to unicode. * * Notes:	This is provided mainly as a convenience so that when more * 		intelligent Unicode conversion for either Multibyte or 8-bit *		codes is available that we can easily adapt. */#ifdef	UDFint#elsestatic int#endifjoliet_strlen(string, flag)	int             flag;	const char	*string;{	int		rtn;        unsigned char   *tmpbuf;
        int             i;
        int             j;

        int             p;
        u_int16_t       code,                         unicode;
        int             tmpsize ;		rtn = strlen(string) << 1;/**===================================**//* big5 to unicode patch, flag=gbk4win *//* use flag param to call external int *//**===================================**/  tmpsize = rtn;  if (flag >= 1) {      tmpbuf = (u_char *)string;
  j=0;
  for(i=0; i < tmpsize ; i += 2, j++)
    {
/******/ /* big5 to unicode patch*/

 if( tmpbuf[j] >= 0x81 ){

 /* **** 00 A4 00 A4 00 A4 00 E5 **** */
 /* ****          中          文 **** */
 /* **** j=A4 A4 A4 E5 -->       **** */ /*   code=0xa4a4 ->find unicode **** */ 
 /* **** 4E 2D 65 87 <--- result **** */

  code = tmpbuf[j];
  code = code << 8;
  code += tmpbuf[j+1];
    unicode = gbk2uni[(((code&0xFF00)>>8)-0x81)*192 + ((code&0x00FF)-0x40)];
    if(unicode) {
       j++;
       tmpsize -= 2;
      }
    }  }}  rtn = tmpsize; 	/*	 * We do clamp the maximum length of a Joliet string to be the	 * maximum path size.  This helps to ensure that we don't completely	 * bolix things up with very long paths.    The Joliet specs say that	 * the maximum length is 128 bytes, or 64 unicode characters.	 */	if (rtn > 2*jlen) {		rtn = 2*jlen;	}	return rtn;}/* * Function:		get_joliet_vol_desc * * Purpose:		generate a Joliet compatible volume desc. * * Notes:		Assume that we have the non-joliet vol desc *			already present in the buffer.  Just modifiy the *			appropriate fields. */static voidget_joliet_vol_desc(jvol_desc)	struct iso_primary_descriptor	*jvol_desc;{	jvol_desc->type[0] = ISO_VD_SUPPLEMENTARY;	/*	 * For now, always do Unicode level 3.	 * I don't really know what 1 and 2 are - perhaps a more limited	 * Unicode set.	 * FIXME(eric) - how does Romeo fit in here?	 */	sprintf(jvol_desc->escape_sequences, "%%/%c", ucs_codes[ucs_level]);	/* Until we have Unicode path tables, leave these unset. */	set_733((char *) jvol_desc->path_table_size, jpath_table_size);	set_731(jvol_desc->type_l_path_table, jpath_table[0]);	set_731(jvol_desc->opt_type_l_path_table, jpath_table[1]);	set_732(jvol_desc->type_m_path_table, jpath_table[2]);	set_732(jvol_desc->opt_type_m_path_table, jpath_table[3]);	/* Set this one up. */	memcpy(jvol_desc->root_directory_record, &jroot_record,		offsetof(struct iso_directory_record, name[0]) + 1);	/*	 * Finally, we have a bunch of strings to convert to Unicode.	 * FIXME(eric) - I don't know how to do this in general,	 * so we will just be really lazy and do a char -> short conversion.	 *  We probably will want to filter any characters >= 0x80.	 */	convert_to_unicode((Uchar *) jvol_desc->system_id,			sizeof(jvol_desc->system_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->volume_id,			sizeof(jvol_desc->volume_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->volume_set_id,			sizeof(jvol_desc->volume_set_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->publisher_id,			sizeof(jvol_desc->publisher_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->preparer_id,			sizeof(jvol_desc->preparer_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->application_id,			sizeof(jvol_desc->application_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->copyright_file_id,			sizeof(jvol_desc->copyright_file_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->abstract_file_id,			sizeof(jvol_desc->abstract_file_id), NULL, in_nls, gbk4win_filenames);	convert_to_unicode((Uchar *) jvol_desc->bibliographic_file_id,			sizeof(jvol_desc->bibliographic_file_id), NULL, in_nls, gbk4win_filenames);}static voidassign_joliet_directory_addresses(node)	struct directory	*node;{	int		dir_size;	struct directory *dpnt;	dpnt = node;	while (dpnt) {		if ((dpnt->dir_flags & INHIBIT_JOLIET_ENTRY) == 0) {			/*			 * If we already have an extent for this			 * (i.e. it came from a multisession disc), then			 * don't reassign a new extent.			 */			dpnt->jpath_index = next_jpath_index++;			if (dpnt->jextent == 0) {				dpnt->jextent = last_extent;
joliet.c - 源码说明

本页面展示了「一款功能很强的光盘镜象制作工具」中的 joliet.c 源码文件，采用 C语言编程语言编写，共 1,397 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与光盘相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?