firebird-mirror/src/intl/utils/maptest.cpp

/*
 * The contents of this file are subject to the Interbase Public
 * License Version 1.0 (the "License"); you may not use this file
 * except in compliance with the License. You may obtain a copy
 * of the License at http://www.Inprise.com/IPL.html
 *
 * Software distributed under the License is distributed on an
 * "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express
 * or implied. See the License for the specific language governing
 * rights and limitations under the License.
 *
 * The Original Code was created by Inprise Corporation
 * and its predecessors. Portions created by Inprise Corporation are
 * Copyright (C) Inprise Corporation.
 *
 * All Rights Reserved.
 * Contributor(s): ______________________________________.
 */

#include "firebird.h"
#include "../jrd/common.h"


/*
fixed
#include "cs_w1254.h"
#include "cs_cyrl.h"
#include "cs_865.h"
#include "cs_863.h"
#include "cs_861.h"
#include "cs_860.h"
#include "cs_857.h"
#include "cs_w1251.h"
#include "cs_437.h"
#include "cs_850.h"
#include "cs_852.h"
#include "cs_w1250.h"
#include "cs_w1252.h"
#include "cs_w1253.h"

fixed with errors
#include "cs_next.h" -- NeXT has two characters mapping to the same
			Unicode (FE & FF).  So round trip is not possible.
			They map to FFFD, which is the replacement character
			so this is not an error

No errors
#include "../intl/cs_iso8859_1.h"
*/

/* 
-- Multibyte character sets --
#include "../intl/cs_big5.h"
#include "../intl/cs_gb2312.h"
#include "../intl/cs_jis_0208_1990.h"
#include "../intl/cs_ksc5601.h"
#include "../intl/csjis2_p.h"
*/


#define UNICODE_INDEX(u)	(((u) % 256) + from_unicode_map [((u) / 256)])
#define UNICODE_LOOKUP(u)	from_unicode_mapping_array [ UNICODE_INDEX(u) ]

int main()
{
	int i;

	if (sizeof(to_unicode_map) != 256 * sizeof(to_unicode_map[0]))
		printf("The to_unicode_map is too small! %d entries!\n",
				  sizeof(to_unicode_map) / sizeof(to_unicode_map[0]));

	if (sizeof(from_unicode_map) != 256 * sizeof(from_unicode_map[0]))
		printf("The from_unicode_map is too small! %d entries!\n",
				  sizeof(from_unicode_map) / sizeof(from_unicode_map[0]));

	for (i = 0; i <= 255; i++) {
		const unsigned short uch = to_unicode_map[i];
		if (uch == CANT_MAP_CHARACTER)
			continue;
		const unsigned char ch2 = UNICODE_LOOKUP(uch);
		if (ch2 != i) {
			printf
				("Mapping error: Character %02x -> Unicode %04x (index %3d) -> Char %02x\n",
				 i, uch, UNICODE_INDEX(uch), ch2);

			/* Find the Character in the from_unicode_mapping_array */
			int j;
			for (j = 0; j < sizeof(from_unicode_mapping_array); j++)
				if (from_unicode_mapping_array[j] == i) {
					/* Mapping table is wrong - recommend a fix for it */
					printf
						("Recommend from_unicode_map[0x%02x] be set to %d\n",
						 uch / 256, j - (uch % 256));
					break;
				}

			if (j == sizeof(from_unicode_mapping_array)) {
				/* Oops - found a character that does exists in the character set
				   but not in unicode - an obvious error! */

				printf
					("Error: Character %d does not exist in the from_unicode_mapping_array\n",
					 i);

			}
		}
	}

	for (i = 0; i <= 255; i++) {
		if (from_unicode_map[i] + 0xFF >= sizeof(from_unicode_mapping_array)) {
			printf("From_unicode array bounds error at position %02x00\n",
					  i);
			continue;
		}

		for (int j = 0; j <= 255; j++) {
			const unsigned short uch = i * 256 + j;
			const unsigned char ch2 = UNICODE_LOOKUP(uch);
			if (ch2 == CANT_MAP_CHARACTER)
				continue;
			const unsigned short uch2 = to_unicode_map[ch2];
			if (uch != uch2) {
				printf
					("Mapping error: Unicode %04x -> ch %02x -> Unicode %04x\n",
					 uch, ch2, uch2);

				int k;
				for (k = 0; k <= 255; k++)
					if (to_unicode_map[k] == uch) {
						/* Can map this character from charset to unicode */
						/* Assume fix was printed out above */
					}
				if (k > 255) {
					/* This unicode doesn't exist in charset */
					/* Mapping table is wrong - recommend a fix for it */
					printf
						("Recommend from_unicode_map[0x%02x] be set to %d\n",
						 uch / 256, 0);
				}
			}
		}
	}

	printf("Test completed\n");
	return 0;
}
Create utils directory 2003-01-23 04:22:23 +01:00			`/*`
			`* The contents of this file are subject to the Interbase Public`
			`* License Version 1.0 (the "License"); you may not use this file`
			`* except in compliance with the License. You may obtain a copy`
			`* of the License at http://www.Inprise.com/IPL.html`
			`*`
			`* Software distributed under the License is distributed on an`
			`* "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express`
			`* or implied. See the License for the specific language governing`
			`* rights and limitations under the License.`
			`*`
			`* The Original Code was created by Inprise Corporation`
			`* and its predecessors. Portions created by Inprise Corporation are`
			`* Copyright (C) Inprise Corporation.`
			`*`
			`* All Rights Reserved.`
			`* Contributor(s): ______________________________________.`
			`*/`

			`#include "firebird.h"`
			`#include "../jrd/common.h"`


			`/*`
			`fixed`
			`#include "cs_w1254.h"`
			`#include "cs_cyrl.h"`
			`#include "cs_865.h"`
			`#include "cs_863.h"`
			`#include "cs_861.h"`
			`#include "cs_860.h"`
			`#include "cs_857.h"`
			`#include "cs_w1251.h"`
			`#include "cs_437.h"`
			`#include "cs_850.h"`
			`#include "cs_852.h"`
			`#include "cs_w1250.h"`
			`#include "cs_w1252.h"`
			`#include "cs_w1253.h"`

			`fixed with errors`
			`#include "cs_next.h" -- NeXT has two characters mapping to the same`
			`Unicode (FE & FF). So round trip is not possible.`
			`They map to FFFD, which is the replacement character`
			`so this is not an error`

			`No errors`
New character sets (update intl sources) 2003-01-25 04:05:24 +01:00			`#include "../intl/cs_iso8859_1.h"`
Create utils directory 2003-01-23 04:22:23 +01:00			`*/`

			`/*`
			`-- Multibyte character sets --`
			`#include "../intl/cs_big5.h"`
			`#include "../intl/cs_gb2312.h"`
			`#include "../intl/cs_jis_0208_1990.h"`
			`#include "../intl/cs_ksc5601.h"`
			`#include "../intl/csjis2_p.h"`
			`*/`


			`#define UNICODE_INDEX(u) (((u) % 256) + from_unicode_map [((u) / 256)])`
			`#define UNICODE_LOOKUP(u) from_unicode_mapping_array [ UNICODE_INDEX(u) ]`

Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`int main()`
Create utils directory 2003-01-23 04:22:23 +01:00			`{`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`int i;`
Create utils directory 2003-01-23 04:22:23 +01:00
			`if (sizeof(to_unicode_map) != 256 * sizeof(to_unicode_map[0]))`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf("The to_unicode_map is too small! %d entries!\n",`
Create utils directory 2003-01-23 04:22:23 +01:00			`sizeof(to_unicode_map) / sizeof(to_unicode_map[0]));`

			`if (sizeof(from_unicode_map) != 256 * sizeof(from_unicode_map[0]))`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf("The from_unicode_map is too small! %d entries!\n",`
Create utils directory 2003-01-23 04:22:23 +01:00			`sizeof(from_unicode_map) / sizeof(from_unicode_map[0]));`

			`for (i = 0; i <= 255; i++) {`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`const unsigned short uch = to_unicode_map[i];`
Create utils directory 2003-01-23 04:22:23 +01:00			`if (uch == CANT_MAP_CHARACTER)`
			`continue;`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`const unsigned char ch2 = UNICODE_LOOKUP(uch);`
Create utils directory 2003-01-23 04:22:23 +01:00			`if (ch2 != i) {`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf`
Create utils directory 2003-01-23 04:22:23 +01:00			`("Mapping error: Character %02x -> Unicode %04x (index %3d) -> Char %02x\n",`
			`i, uch, UNICODE_INDEX(uch), ch2);`

			`/* Find the Character in the from_unicode_mapping_array */`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`int j;`
Create utils directory 2003-01-23 04:22:23 +01:00			`for (j = 0; j < sizeof(from_unicode_mapping_array); j++)`
			`if (from_unicode_mapping_array[j] == i) {`
			`/* Mapping table is wrong - recommend a fix for it */`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf`
Create utils directory 2003-01-23 04:22:23 +01:00			`("Recommend from_unicode_map[0x%02x] be set to %d\n",`
			`uch / 256, j - (uch % 256));`
			`break;`
			`}`

			`if (j == sizeof(from_unicode_mapping_array)) {`
			`/* Oops - found a character that does exists in the character set`
			`but not in unicode - an obvious error! */`

Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf`
Create utils directory 2003-01-23 04:22:23 +01:00			`("Error: Character %d does not exist in the from_unicode_mapping_array\n",`
			`i);`

			`}`
			`}`
			`}`

			`for (i = 0; i <= 255; i++) {`
			`if (from_unicode_map[i] + 0xFF >= sizeof(from_unicode_mapping_array)) {`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf("From_unicode array bounds error at position %02x00\n",`
Create utils directory 2003-01-23 04:22:23 +01:00			`i);`
			`continue;`
			`}`

Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`for (int j = 0; j <= 255; j++) {`
			`const unsigned short uch = i * 256 + j;`
			`const unsigned char ch2 = UNICODE_LOOKUP(uch);`
Create utils directory 2003-01-23 04:22:23 +01:00			`if (ch2 == CANT_MAP_CHARACTER)`
			`continue;`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`const unsigned short uch2 = to_unicode_map[ch2];`
Create utils directory 2003-01-23 04:22:23 +01:00			`if (uch != uch2) {`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf`
Create utils directory 2003-01-23 04:22:23 +01:00			`("Mapping error: Unicode %04x -> ch %02x -> Unicode %04x\n",`
			`uch, ch2, uch2);`

Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`int k;`
Create utils directory 2003-01-23 04:22:23 +01:00			`for (k = 0; k <= 255; k++)`
			`if (to_unicode_map[k] == uch) {`
			`/* Can map this character from charset to unicode */`
			`/* Assume fix was printed out above */`
			`}`
			`if (k > 255) {`
			`/* This unicode doesn't exist in charset */`
			`/* Mapping table is wrong - recommend a fix for it */`
Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf`
Create utils directory 2003-01-23 04:22:23 +01:00			`("Recommend from_unicode_map[0x%02x] be set to %d\n",`
			`uch / 256, 0);`
			`}`
			`}`
			`}`
			`}`

Removing ib_stdio.h 2004-04-29 00:36:29 +02:00			`printf("Test completed\n");`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00			`return 0;`
Create utils directory 2003-01-23 04:22:23 +01:00			`}`
Cleanup Some minor corrections Second step to rename 2004-03-11 06:04:26 +01:00