git.saurik.com Git - apple/icu.git/blame_incremental - icuSources/tools/icuswap/icuswap.cpp

0 / 774 ( 0%)

Commit	Line	Data
	1	/*
	2	*******************************************************************************
	3	*
	4	* Copyright (C) 2003-2004, International Business Machines
	5	* Corporation and others. All Rights Reserved.
	6	*
	7	*******************************************************************************
	8	* file name: icuswap.cpp
	9	* encoding: US-ASCII
	10	* tab size: 8 (not used)
	11	* indentation:4
	12	*
	13	* created on: 2003aug08
	14	* created by: Markus W. Scherer
	15	*
	16	* This tool takes an ICU data file and "swaps" it, that is, changes its
	17	* platform properties between big-/little-endianness and ASCII/EBCDIC charset
	18	* families.
	19	* The modified data file is written to a new file.
	20	* Useful as an install-time tool for shipping only one flavor of ICU data
	21	* and preparing data files for the target platform.
	22	* Will not work with data DLLs (shared libraries).
	23	*/
	24
	25	#include "unicode/utypes.h"
	26	#include "unicode/putil.h"
	27	#include "unicode/udata.h"
	28	#include "cmemory.h"
	29	#include "cstring.h"
	30	#include "uinvchar.h"
	31	#include "uarrsort.h"
	32	#include "ucmndata.h"
	33	#include "udataswp.h"
	34	#include "toolutil.h"
	35	#include "uoptions.h"
	36
	37	/* swapping implementations in common */
	38
	39	#include "uresdata.h"
	40	#include "ucnv_io.h"
	41	#include "uprops.h"
	42	#include "ucase.h"
	43	#include "ucol_swp.h"
	44	#include "ucnv_bld.h"
	45	#include "unormimp.h"
	46	#include "sprpimpl.h"
	47	#include "propname.h"
	48	#include "rbbidata.h"
	49
	50	#include <stdio.h>
	51	#include <stdlib.h>
	52	#include <string.h>
	53
	54	/* swapping implementations in i18n */
	55
	56	/* definitions */
	57
	58	#define LENGTHOF(array) (int32_t)(sizeof(array)/sizeof((array)[0]))
	59
	60	static UOption options[]={
	61	UOPTION_HELP_H,
	62	UOPTION_HELP_QUESTION_MARK,
	63	UOPTION_DEF("type", 't', UOPT_REQUIRES_ARG)
	64	};
	65
	66	enum {
	67	OPT_HELP_H,
	68	OPT_HELP_QUESTION_MARK,
	69	OPT_OUT_TYPE
	70	};
	71
	72	static int32_t
	73	fileSize(FILE *f) {
	74	int32_t size;
	75
	76	fseek(f, 0, SEEK_END);
	77	size=(int32_t)ftell(f);
	78	fseek(f, 0, SEEK_SET);
	79	return size;
	80	}
	81
	82	/**
	83	* Identifies and then transforms the ICU data piece in-place, or determines
	84	* its length. See UDataSwapFn.
	85	* This function handles .dat data packages as well as single data pieces
	86	* and internally dispatches to per-type swap functions.
	87	* Sets a U_UNSUPPORTED_ERROR if the data format is not recognized.
	88	*
	89	* @see UDataSwapFn
	90	* @see udata_openSwapper
	91	* @see udata_openSwapperForInputData
	92	* @draft ICU 2.8
	93	*/
	94	static int32_t
	95	udata_swap(const UDataSwapper *ds,
	96	const void inData, int32_t length, void outData,
	97	UErrorCode *pErrorCode);
	98
	99	/**
	100	* Swap an ICU .dat package, including swapping of enclosed items.
	101	*/
	102	U_CFUNC int32_t U_CALLCONV
	103	udata_swapPackage(const UDataSwapper *ds,
	104	const void inData, int32_t length, void outData,
	105	UErrorCode *pErrorCode);
	106
	107	/*
	108	* udata_swapPackage() needs to rename ToC name entries from the old package
	109	* name to the new one.
	110	* We store the filenames here, and udata_swapPackage() will extract the
	111	* package names.
	112	*/
	113	static const char inFilename, outFilename;
	114
	115	U_CDECL_BEGIN
	116	static void U_CALLCONV
	117	printError(void context, const char fmt, va_list args) {
	118	vfprintf((FILE *)context, fmt, args);
	119	}
	120	U_CDECL_END
	121
	122	static int
	123	printUsage(const char *pname, UBool ishelp) {
	124	fprintf(stderr,
	125	"%csage: %s [ -h, -?, --help ] -tl\|-tb\|-te\|--type=b\|... infilename outfilename\n",
	126	ishelp ? 'U' : 'u', pname);
	127	if(ishelp) {
	128	fprintf(stderr,
	129	"\nOptions: -h, -?, --help print this message and exit\n"
	130	" Read the input file, swap its platform properties according\n"
	131	" to the -t or --type option, and write the result to the output file.\n"
	132	" -tl change to little-endian/ASCII charset family\n"
	133	" -tb change to big-endian/ASCII charset family\n"
	134	" -te change to big-endian/EBCDIC charset family\n");
	135	}
	136
	137	return !ishelp;
	138	}
	139
	140	extern int
	141	main(int argc, char *argv[]) {
	142	FILE in, out;
	143	const char *pname;
	144	char *data;
	145	int32_t length;
	146	UBool ishelp;
	147	int rc;
	148
	149	UDataSwapper *ds;
	150	UErrorCode errorCode;
	151	uint8_t outCharset;
	152	UBool outIsBigEndian;
	153
	154	U_MAIN_INIT_ARGS(argc, argv);
	155
	156	/* get the program basename */
	157	pname=strrchr(argv[0], U_FILE_SEP_CHAR);
	158	if(pname==NULL) {
	159	pname=strrchr(argv[0], '/');
	160	}
	161	if(pname!=NULL) {
	162	++pname;
	163	} else {
	164	pname=argv[0];
	165	}
	166
	167	argc=u_parseArgs(argc, argv, LENGTHOF(options), options);
	168	ishelp=options[OPT_HELP_H].doesOccur \|\| options[OPT_HELP_QUESTION_MARK].doesOccur;
	169	if(ishelp \|\| argc!=3) {
	170	return printUsage(pname, ishelp);
	171	}
	172
	173	/* parse the output type option */
	174	data=(char *)options[OPT_OUT_TYPE].value;
	175	if(data[0]==0 \|\| data[1]!=0) {
	176	/* the type must be exactly one letter */
	177	return printUsage(pname, FALSE);
	178	}
	179	switch(data[0]) {
	180	case 'l':
	181	outIsBigEndian=FALSE;
	182	outCharset=U_ASCII_FAMILY;
	183	break;
	184	case 'b':
	185	outIsBigEndian=TRUE;
	186	outCharset=U_ASCII_FAMILY;
	187	break;
	188	case 'e':
	189	outIsBigEndian=TRUE;
	190	outCharset=U_EBCDIC_FAMILY;
	191	break;
	192	default:
	193	return printUsage(pname, FALSE);
	194	}
	195
	196	in=out=NULL;
	197	data=NULL;
	198
	199	/* udata_swapPackage() needs the filenames */
	200	inFilename=argv[1];
	201	outFilename=argv[2];
	202
	203	/* open the input file, get its length, allocate memory for it, read the file */
	204	in=fopen(argv[1], "rb");
	205	if(in==NULL) {
	206	fprintf(stderr, "%s: unable to open input file \"%s\"\n", pname, argv[1]);
	207	rc=2;
	208	goto done;
	209	}
	210
	211	length=fileSize(in);
	212	if(length<=0) {
	213	fprintf(stderr, "%s: empty input file \"%s\"\n", pname, argv[1]);
	214	rc=2;
	215	goto done;
	216	}
	217
	218	/*
	219	* +15: udata_swapPackage() may need to add a few padding bytes to the
	220	* last item if charset swapping is done,
	221	* because the last item may be resorted into the middle and then needs
	222	* additional padding bytes
	223	*/
	224	data=(char *)malloc(length+15);
	225	if(data==NULL) {
	226	fprintf(stderr, "%s: error allocating memory for \"%s\"\n", pname, argv[1]);
	227	rc=2;
	228	goto done;
	229	}
	230
	231	/* set the last 15 bytes to the usual padding byte, see udata_swapPackage() */
	232	uprv_memset(data+length-15, 0xaa, 15);
	233
	234	if(length!=(int32_t)fread(data, 1, length, in)) {
	235	fprintf(stderr, "%s: error reading \"%s\"\n", pname, argv[1]);
	236	rc=3;
	237	goto done;
	238	}
	239
	240	fclose(in);
	241	in=NULL;
	242
	243	/* swap the data in-place */
	244	errorCode=U_ZERO_ERROR;
	245	ds=udata_openSwapperForInputData(data, length, outIsBigEndian, outCharset, &errorCode);
	246	if(U_FAILURE(errorCode)) {
	247	fprintf(stderr, "%s: udata_openSwapperForInputData(\"%s\") failed - %s\n",
	248	pname, argv[1], u_errorName(errorCode));
	249	rc=4;
	250	goto done;
	251	}
	252
	253	ds->printError=printError;
	254	ds->printErrorContext=stderr;
	255
	256	length=udata_swap(ds, data, length, data, &errorCode);
	257	udata_closeSwapper(ds);
	258	if(U_FAILURE(errorCode)) {
	259	fprintf(stderr, "%s: udata_swap(\"%s\") failed - %s\n",
	260	pname, argv[1], u_errorName(errorCode));
	261	rc=4;
	262	goto done;
	263	}
	264
	265	out=fopen(argv[2], "wb");
	266	if(out==NULL) {
	267	fprintf(stderr, "%s: unable to open output file \"%s\"\n", pname, argv[2]);
	268	rc=5;
	269	goto done;
	270	}
	271
	272	if(length!=(int32_t)fwrite(data, 1, length, out)) {
	273	fprintf(stderr, "%s: error writing \"%s\"\n", pname, argv[2]);
	274	rc=6;
	275	goto done;
	276	}
	277
	278	fclose(out);
	279	out=NULL;
	280
	281	/* all done */
	282	rc=0;
	283
	284	done:
	285	if(in!=NULL) {
	286	fclose(in);
	287	}
	288	if(out!=NULL) {
	289	fclose(out);
	290	}
	291	if(data!=NULL) {
	292	free(data);
	293	}
	294	return rc;
	295	}
	296
	297	/* swap the data ------------------------------------------------------------ */
	298
	299	static const struct {
	300	uint8_t dataFormat[4];
	301	UDataSwapFn *swapFn;
	302	} swapFns[]={
	303	{ { 0x52, 0x65, 0x73, 0x42 }, ures_swap }, /* dataFormat="ResB" */
	304	#if !UCONFIG_NO_LEGACY_CONVERSION
	305	{ { 0x63, 0x6e, 0x76, 0x74 }, ucnv_swap }, /* dataFormat="cnvt" */
	306	{ { 0x43, 0x76, 0x41, 0x6c }, ucnv_swapAliases }, /* dataFormat="CvAl" */
	307	#endif
	308	{ { 0x43, 0x6d, 0x6e, 0x44 }, udata_swapPackage }, /* dataFormat="CmnD" */
	309	#if !UCONFIG_NO_IDNA
	310	{ { 0x53, 0x50, 0x52, 0x50 }, usprep_swap }, /* dataFormat="SPRP" */
	311	#endif
	312	/* insert data formats here, descending by expected frequency of occurrence */
	313	{ { 0x55, 0x50, 0x72, 0x6f }, uprops_swap }, /* dataFormat="UPro" */
	314
	315	{ { UCASE_FMT_0, UCASE_FMT_1, UCASE_FMT_2, UCASE_FMT_3 },
	316	ucase_swap }, /* dataFormat="cAsE" */
	317
	318	#if !UCONFIG_NO_NORMALIZATION
	319	{ { 0x4e, 0x6f, 0x72, 0x6d }, unorm_swap }, /* dataFormat="Norm" */
	320	#endif
	321	#if !UCONFIG_NO_COLLATION
	322	{ { 0x55, 0x43, 0x6f, 0x6c }, ucol_swap }, /* dataFormat="UCol" */
	323	{ { 0x49, 0x6e, 0x76, 0x43 }, ucol_swapInverseUCA },/* dataFormat="InvC" */
	324	#endif
	325	#if !UCONFIG_NO_BREAK_ITERATION
	326	{ { 0x42, 0x72, 0x6b, 0x20 }, ubrk_swap }, /* dataFormat="Brk " */
	327	#endif
	328	{ { 0x70, 0x6e, 0x61, 0x6d }, upname_swap }, /* dataFormat="pnam" */
	329	{ { 0x75, 0x6e, 0x61, 0x6d }, uchar_swapNames } /* dataFormat="unam" */
	330	};
	331
	332	static int32_t
	333	udata_swap(const UDataSwapper *ds,
	334	const void inData, int32_t length, void outData,
	335	UErrorCode *pErrorCode) {
	336	char dataFormatChars[4];
	337	const UDataInfo *pInfo;
	338	int32_t headerSize, i, swappedLength;
	339
	340	if(pErrorCode==NULL \|\| U_FAILURE(*pErrorCode)) {
	341	return 0;
	342	}
	343
	344	/*
	345	* Preflight the header first; checks for illegal arguments, too.
	346	* Do not swap the header right away because the format-specific swapper
	347	* will swap it, get the headerSize again, and also use the header
	348	* information. Otherwise we would have to pass some of the information
	349	* and not be able to use the UDataSwapFn signature.
	350	*/
	351	headerSize=udata_swapDataHeader(ds, inData, -1, NULL, pErrorCode);
	352
	353	/*
	354	* If we wanted udata_swap() to also handle non-loadable data like a UTrie,
	355	* then we could check here for further known magic values and structures.
	356	*/
	357	if(U_FAILURE(*pErrorCode)) {
	358	return 0; /* the data format was not recognized */
	359	}
	360
	361	pInfo=(const UDataInfo )((const char )inData+4);
	362
	363	{
	364	/* convert the data format from ASCII to Unicode to the system charset */
	365	UChar u[4]={
	366	pInfo->dataFormat[0], pInfo->dataFormat[1],
	367	pInfo->dataFormat[2], pInfo->dataFormat[3]
	368	};
	369
	370	if(uprv_isInvariantUString(u, 4)) {
	371	u_UCharsToChars(u, dataFormatChars, 4);
	372	} else {
	373	dataFormatChars[0]=dataFormatChars[1]=dataFormatChars[2]=dataFormatChars[3]='?';
	374	}
	375	}
	376
	377	/* dispatch to the swap function for the dataFormat */
	378	for(i=0; i<LENGTHOF(swapFns); ++i) {
	379	if(0==memcmp(swapFns[i].dataFormat, pInfo->dataFormat, 4)) {
	380	swappedLength=swapFns[i].swapFn(ds, inData, length, outData, pErrorCode);
	381
	382	if(U_FAILURE(*pErrorCode)) {
	383	udata_printError(ds, "udata_swap(): failure swapping data format %02x.%02x.%02x.%02x (\"%c%c%c%c\") - %s\n",
	384	pInfo->dataFormat[0], pInfo->dataFormat[1],
	385	pInfo->dataFormat[2], pInfo->dataFormat[3],
	386	dataFormatChars[0], dataFormatChars[1],
	387	dataFormatChars[2], dataFormatChars[3],
	388	u_errorName(*pErrorCode));
	389	} else if(swappedLength<(length-15)) {
	390	/* swapped less than expected */
	391	udata_printError(ds, "udata_swap() warning: swapped only %d out of %d bytes - data format %02x.%02x.%02x.%02x (\"%c%c%c%c\")\n",
	392	swappedLength, length,
	393	pInfo->dataFormat[0], pInfo->dataFormat[1],
	394	pInfo->dataFormat[2], pInfo->dataFormat[3],
	395	dataFormatChars[0], dataFormatChars[1],
	396	dataFormatChars[2], dataFormatChars[3],
	397	u_errorName(*pErrorCode));
	398	}
	399
	400	return swappedLength;
	401	}
	402	}
	403
	404	/* the dataFormat was not recognized */
	405	udata_printError(ds, "udata_swap(): unknown data format %02x.%02x.%02x.%02x (\"%c%c%c%c\")\n",
	406	pInfo->dataFormat[0], pInfo->dataFormat[1],
	407	pInfo->dataFormat[2], pInfo->dataFormat[3],
	408	dataFormatChars[0], dataFormatChars[1],
	409	dataFormatChars[2], dataFormatChars[3]);
	410
	411	*pErrorCode=U_UNSUPPORTED_ERROR;
	412	return 0;
	413	}
	414
	415	/* swap .dat package files -------------------------------------------------- */
	416
	417	static int32_t
	418	extractPackageName(const UDataSwapper ds, const char filename,
	419	char pkg[], int32_t capacity,
	420	UErrorCode *pErrorCode) {
	421	const char *basename;
	422	int32_t len;
	423
	424	if(U_FAILURE(*pErrorCode)) {
	425	return 0;
	426	}
	427
	428	basename=findBasename(filename);
	429	len=(int32_t)uprv_strlen(basename)-4; /* -4: subtract the length of ".dat" */
	430
	431	if(len<=0 \|\| 0!=uprv_strcmp(basename+len, ".dat")) {
	432	udata_printError(ds, "udata_swapPackage(): \"%s\" is not recognized as a package filename (must end with .dat)\n",
	433	basename);
	434	*pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
	435	return 0;
	436	}
	437
	438	if(len>=capacity) {
	439	udata_printError(ds, "udata_swapPackage(): the package name \"%s\" is too long (>=%ld)\n",
	440	(long)capacity);
	441	*pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
	442	return 0;
	443	}
	444
	445	uprv_memcpy(pkg, basename, len);
	446	pkg[len]=0;
	447	return len;
	448	}
	449
	450	struct ToCEntry {
	451	uint32_t nameOffset, inOffset, outOffset, length;
	452	};
	453
	454	U_CDECL_BEGIN
	455	static int32_t U_CALLCONV
	456	compareToCEntries(const void context, const void left, const void *right) {
	457	const char chars=(const char )context;
	458	return (int32_t)uprv_strcmp(chars+((const ToCEntry *)left)->nameOffset,
	459	chars+((const ToCEntry *)right)->nameOffset);
	460	}
	461	U_CDECL_END
	462
	463	U_CFUNC int32_t U_CALLCONV
	464	udata_swapPackage(const UDataSwapper *ds,
	465	const void inData, int32_t length, void outData,
	466	UErrorCode *pErrorCode) {
	467	const UDataInfo *pInfo;
	468	int32_t headerSize;
	469
	470	const uint8_t *inBytes;
	471	uint8_t *outBytes;
	472
	473	uint32_t itemCount, offset, i;
	474	int32_t itemLength;
	475
	476	const UDataOffsetTOCEntry *inEntries;
	477	UDataOffsetTOCEntry *outEntries;
	478
	479	ToCEntry *table;
	480
	481	char inPkgName[32], outPkgName[32];
	482	int32_t inPkgNameLength, outPkgNameLength;
	483
	484	/* udata_swapDataHeader checks the arguments */
	485	headerSize=udata_swapDataHeader(ds, inData, length, outData, pErrorCode);
	486	if(pErrorCode==NULL \|\| U_FAILURE(*pErrorCode)) {
	487	return 0;
	488	}
	489
	490	/* check data format and format version */
	491	pInfo=(const UDataInfo )((const char )inData+4);
	492	if(!(
	493	pInfo->dataFormat[0]==0x43 && /* dataFormat="CmnD" */
	494	pInfo->dataFormat[1]==0x6d &&
	495	pInfo->dataFormat[2]==0x6e &&
	496	pInfo->dataFormat[3]==0x44 &&
	497	pInfo->formatVersion[0]==1
	498	)) {
	499	udata_printError(ds, "udata_swapPackage(): data format %02x.%02x.%02x.%02x (format version %02x) is not recognized as an ICU .dat package\n",
	500	pInfo->dataFormat[0], pInfo->dataFormat[1],
	501	pInfo->dataFormat[2], pInfo->dataFormat[3],
	502	pInfo->formatVersion[0]);
	503	*pErrorCode=U_UNSUPPORTED_ERROR;
	504	return 0;
	505	}
	506
	507	/*
	508	* We need to change the ToC name entries so that they have the correct
	509	* package name prefix.
	510	* Extract the package names from the in/out filenames.
	511	*/
	512	inPkgNameLength=extractPackageName(
	513	ds, inFilename,
	514	inPkgName, (int32_t)sizeof(inPkgName),
	515	pErrorCode);
	516	outPkgNameLength=extractPackageName(
	517	ds, outFilename,
	518	outPkgName, (int32_t)sizeof(outPkgName),
	519	pErrorCode);
	520	if(U_FAILURE(*pErrorCode)) {
	521	return 0;
	522	}
	523
	524	/*
	525	* It is possible to work with inPkgNameLength!=outPkgNameLength,
	526	* but then the length of the data file would change more significantly,
	527	* which we are not currently prepared for.
	528	*/
	529	if(inPkgNameLength!=outPkgNameLength) {
	530	udata_printError(ds, "udata_swapPackage(): the package names \"%s\" and \"%s\" must have the same length\n",
	531	inPkgName, outPkgName);
	532	*pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
	533	return 0;
	534	}
	535
	536	inBytes=(const uint8_t *)inData+headerSize;
	537	inEntries=(const UDataOffsetTOCEntry *)(inBytes+4);
	538
	539	if(length<0) {
	540	/* preflighting */
	541	itemCount=ds->readUInt32((const uint32_t )inBytes);
	542	if(itemCount==0) {
	543	/* no items: count only the item count and return */
	544	return headerSize+4;
	545	}
	546
	547	/* read the last item's offset and preflight it */
	548	offset=ds->readUInt32(inEntries[itemCount-1].dataOffset);
	549	itemLength=udata_swap(ds, inBytes+offset, -1, NULL, pErrorCode);
	550
	551	if(U_SUCCESS(*pErrorCode)) {
	552	return headerSize+offset+(uint32_t)itemLength;
	553	} else {
	554	return 0;
	555	}
	556	} else {
	557	/* check that the itemCount fits, then the ToC table, then at least the header of the last item */
	558	length-=headerSize;
	559	if(length<4) {
	560	/* itemCount does not fit */
	561	offset=0xffffffff;
	562	itemCount=0; /* make compilers happy */
	563	} else {
	564	itemCount=ds->readUInt32((const uint32_t )inBytes);
	565	if(itemCount==0) {
	566	offset=4;
	567	} else if((uint32_t)length<(4+8*itemCount)) {
	568	/* ToC table does not fit */
	569	offset=0xffffffff;
	570	} else {
	571	/* offset of the last item plus at least 20 bytes for its header */
	572	offset=20+ds->readUInt32(inEntries[itemCount-1].dataOffset);
	573	}
	574	}
	575	if((uint32_t)length<offset) {
	576	udata_printError(ds, "udata_swapPackage(): too few bytes (%d after header) for unames.icu\n",
	577	length);
	578	*pErrorCode=U_INDEX_OUTOFBOUNDS_ERROR;
	579	return 0;
	580	}
	581
	582	outBytes=(uint8_t *)outData+headerSize;
	583
	584	/* swap the item count */
	585	ds->swapArray32(ds, inBytes, 4, outBytes, pErrorCode);
	586
	587	if(itemCount==0) {
	588	/* no items: just return now */
	589	return headerSize+4;
	590	}
	591
	592	/* swap the item name strings */
	593	offset=4+8*itemCount;
	594	itemLength=(int32_t)(ds->readUInt32(inEntries[0].dataOffset)-offset);
	595	udata_swapInvStringBlock(ds, inBytes+offset, itemLength, outBytes+offset, pErrorCode);
	596	if(U_FAILURE(*pErrorCode)) {
	597	udata_printError(ds, "udata_swapPackage() failed to swap the data item name strings\n");
	598	return 0;
	599	}
	600	/* keep offset and itemLength in case we allocate and copy the strings below */
	601
	602	/* swap the package names into the output charset */
	603	if(ds->outCharset!=U_CHARSET_FAMILY) {
	604	UDataSwapper *ds2;
	605	ds2=udata_openSwapper(TRUE, U_CHARSET_FAMILY, TRUE, ds->outCharset, pErrorCode);
	606	ds2->swapInvChars(ds2, inPkgName, inPkgNameLength, inPkgName, pErrorCode);
	607	ds2->swapInvChars(ds2, outPkgName, outPkgNameLength, outPkgName, pErrorCode);
	608	udata_closeSwapper(ds2);
	609	if(U_FAILURE(*pErrorCode)) {
	610	udata_printError(ds, "udata_swapPackage() failed to swap the input/output package names\n");
	611	}
	612	}
	613
	614	/* change the prefix of each ToC entry name from the old to the new package name */
	615	{
	616	char *entryName;
	617
	618	for(i=0; i<itemCount; ++i) {
	619	entryName=(char *)inBytes+ds->readUInt32(inEntries[i].nameOffset);
	620
	621	if(0==uprv_memcmp(entryName, inPkgName, inPkgNameLength)) {
	622	uprv_memcpy(entryName, outPkgName, inPkgNameLength);
	623	} else {
	624	udata_printError(ds, "udata_swapPackage() failed: ToC item %ld does not have the input package name as a prefix\n",
	625	(long)i);
	626	*pErrorCode=U_INVALID_FORMAT_ERROR;
	627	return 0;
	628	}
	629	}
	630	}
	631
	632	/*
	633	* Allocate the ToC table and, if necessary, a temporary buffer for
	634	* pseudo-in-place swapping.
	635	*
	636	* We cannot swap in-place because:
	637	*
	638	* 1. If the swapping of an item fails mid-way, then in-place swapping
	639	* has destroyed its data.
	640	* Out-of-place swapping allows us to then copy its original data.
	641	*
	642	* 2. If swapping changes the charset family, then we must resort
	643	* not only the ToC table but also the data items themselves.
	644	* This requires a permutation and is best done with separate in/out
	645	* buffers.
	646	*
	647	* We swapped the strings above to avoid the malloc below if string swapping fails.
	648	*/
	649	if(inData==outData) {
	650	/* +15: prepare for extra padding of a newly-last item */
	651	table=(ToCEntry )uprv_malloc(itemCountsizeof(ToCEntry)+length+15);
	652	if(table!=NULL) {
	653	outBytes=(uint8_t *)(table+itemCount);
	654
	655	/* copy the item count and the swapped strings */
	656	uprv_memcpy(outBytes, inBytes, 4);
	657	uprv_memcpy(outBytes+offset, inBytes+offset, itemLength);
	658	}
	659	} else {
	660	table=(ToCEntry )uprv_malloc(itemCountsizeof(ToCEntry));
	661	}
	662	if(table==NULL) {
	663	udata_printError(ds, "udata_swapPackage(): out of memory allocating %d bytes\n",
	664	inData==outData ?
	665	itemCount*sizeof(ToCEntry)+length+15 :
	666	itemCount*sizeof(ToCEntry));
	667	*pErrorCode=U_MEMORY_ALLOCATION_ERROR;
	668	return 0;
	669	}
	670	outEntries=(UDataOffsetTOCEntry *)(outBytes+4);
	671
	672	/* read the ToC table */
	673	for(i=0; i<itemCount; ++i) {
	674	table[i].nameOffset=ds->readUInt32(inEntries[i].nameOffset);
	675	table[i].inOffset=ds->readUInt32(inEntries[i].dataOffset);
	676	if(i>0) {
	677	table[i-1].length=table[i].inOffset-table[i-1].inOffset;
	678	}
	679	}
	680	table[itemCount-1].length=(uint32_t)length-table[itemCount-1].inOffset;
	681
	682	if(ds->inCharset==ds->outCharset) {
	683	/* no charset swapping, no resorting: keep item offsets the same */
	684	for(i=0; i<itemCount; ++i) {
	685	table[i].outOffset=table[i].inOffset;
	686	}
	687	} else {
	688	/* charset swapping: resort items by their swapped names */
	689
	690	/*
	691	* Before the actual sorting, we need to make sure that each item
	692	* has a length that is a multiple of 16 bytes so that all items
	693	* are 16-aligned.
	694	* Only the old last item may be missing up to 15 padding bytes.
	695	* Add padding bytes for it.
	696	* Since the icuswap main() function has already allocated enough
	697	* input buffer space and set the last 15 bytes there to 0xaa,
	698	* we only need to increase the total data length and the length
	699	* of the last item here.
	700	*/
	701	if((length&0xf)!=0) {
	702	int32_t delta=16-(length&0xf);
	703	length+=delta;
	704	table[itemCount-1].length+=(uint32_t)delta;
	705	}
	706
	707	uprv_sortArray(table, (int32_t)itemCount, (int32_t)sizeof(ToCEntry),
	708	compareToCEntries, outBytes, FALSE, pErrorCode);
	709
	710	/*
	711	* Note: Before sorting, the inOffset values were in order.
	712	* Now the outOffset values are in order.
	713	*/
	714
	715	/* assign outOffset values */
	716	offset=table[0].inOffset;
	717	for(i=0; i<itemCount; ++i) {
	718	table[i].outOffset=offset;
	719	offset+=table[i].length;
	720	}
	721	}
	722
	723	/* write the output ToC table */
	724	for(i=0; i<itemCount; ++i) {
	725	ds->writeUInt32(&outEntries[i].nameOffset, table[i].nameOffset);
	726	ds->writeUInt32(&outEntries[i].dataOffset, table[i].outOffset);
	727	}
	728
	729	/* swap each data item */
	730	for(i=0; i<itemCount; ++i) {
	731	/* first copy the item bytes to make sure that unreachable bytes are copied */
	732	uprv_memcpy(outBytes+table[i].outOffset, inBytes+table[i].inOffset, table[i].length);
	733
	734	/* swap the item */
	735	udata_swap(ds, inBytes+table[i].inOffset, (int32_t)table[i].length,
	736	outBytes+table[i].outOffset, pErrorCode);
	737
	738	if(U_FAILURE(*pErrorCode)) {
	739	if(ds->outCharset==U_CHARSET_FAMILY) {
	740	udata_printError(ds, "warning: udata_swapPackage() failed to swap item \"%s\"\n"
	741	" at inOffset 0x%x length 0x%x - %s\n"
	742	" the data item will be copied, not swapped\n\n",
	743	(char *)outBytes+table[i].nameOffset,
	744	table[i].inOffset, table[i].length, u_errorName(*pErrorCode));
	745	} else {
	746	udata_printError(ds, "warning: udata_swapPackage() failed to swap an item\n"
	747	" at inOffset 0x%x length 0x%x - %s\n"
	748	" the data item will be copied, not swapped\n\n",
	749	table[i].inOffset, table[i].length, u_errorName(*pErrorCode));
	750	}
	751	/* reset the error code, copy the data item, and continue */
	752	*pErrorCode=U_ZERO_ERROR;
	753	uprv_memcpy(outBytes+table[i].outOffset, inBytes+table[i].inOffset, table[i].length);
	754	}
	755	}
	756
	757	if(inData==outData) {
	758	/* copy the data from the temporary buffer to the in-place buffer */
	759	uprv_memcpy((uint8_t *)outData+headerSize, outBytes, length);
	760	}
	761	uprv_free(table);
	762
	763	return headerSize+length;
	764	}
	765	}
	766
	767	/*
	768	* Hey, Emacs, please set the following:
	769	*
	770	* Local Variables:
	771	* indent-tabs-mode: nil
	772	* End:
	773	*
	774	*/