summary refs log tree commit diff stats
path: root/tools/codepages.c
diff options
context:
space:
mode:
Diffstat (limited to 'tools/codepages.c')
-rw-r--r-- tools/codepages.c 231
1 files changed, 231 insertions, 0 deletions
diff --git a/tools/codepages.c b/tools/codepages.c
new file mode 100644
index 0000000000..94768860f4
--- /dev/null
+++ b/tools/codepages.c
@@ -0,0 +1,231 @@
+/***************************************************************************
+ *             __________               __   ___.
+ *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
+ *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
+ *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
+ *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
+ *                     \/            \/     \/    \/            \/
+ *
+ *
+ * Copyright (C) 2005 by Frank Dischner
+ *
+ * All files in this archive are subject to the GNU General Public License.
+ * See the file COPYING in the source tree root for full license agreement.
+ *
+ * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
+ * KIND, either express or implied.
+ *
+ ****************************************************************************/
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include "codepages.h"
+
+/* Number of 16-bit entries in iso_table and the number of entries main()
+ * writes out from each of the cp932/cp936/cp949/cp950 tables. */
+#define MAX_TABLE_SIZE 32768
+
+/* Scratch table; in this file it is only cleared by main() and never read.
+ * NOTE(review): looks unused - confirm before removing. */
+static unsigned short iso_table[MAX_TABLE_SIZE];
+
+/*
+ * ISO-8859-7 (Greek) to Unicode for bytes 0xA1..0xB7 only (23 entries).
+ * Indexed by (byte - 0xA1).  iso_decode() passes bytes below 0xA1 through
+ * unchanged and adds a fixed offset to bytes above 0xB7, so neither range
+ * needs table entries.
+ */
+static const unsigned short iso8859_7_to_uni[] = {
+ 0x2018, 0x2019, 0x00A3, 0x20AC, 0x20AF, 0x00A6, 0x00A7, /* A1-A7 */
+ 0x00A8, 0x00A9, 0x037A, 0x00AB, 0x00AC, 0x00AD, 0x00AE, 0x2015, /* A8-AF */
+ 0x00B0, 0x00B1, 0x00B2, 0x00B3, 0x0384, 0x0385, 0x0386, 0x00B7 /* B0-B7 */
+};
+
+/*
+ * CP1251 (Cyrillic) to Unicode for bytes 0x80..0xBF (64 entries).
+ * Indexed by (byte - 0x80).  iso_decode() passes bytes below 0x80 through
+ * unchanged and adds a fixed offset to bytes above 0xBF.
+ * Note that byte 0x98 is stored as 0x0098, i.e. it maps to itself.
+ */
+static const unsigned short cp1251_to_uni[] = {
+ 0x0402, 0x0403, 0x201A, 0x0453, 0x201E, 0x2026, 0x2020, 0x2021, /* 80-87 */
+ 0x20AC, 0x2030, 0x0409, 0x2039, 0x040A, 0x040C, 0x040B, 0x040F, /* 88-8F */
+ 0x0452, 0x2018, 0x2019, 0x201C, 0x201D, 0x2022, 0x2013, 0x2014, /* 90-97 */
+ 0x0098, 0x2122, 0x0459, 0x203A, 0x045A, 0x045C, 0x045B, 0x045F, /* 98-9F */
+ 0x00A0, 0x040E, 0x045E, 0x0408, 0x00A4, 0x0490, 0x00A6, 0x00A7, /* A0-A7 */
+ 0x0401, 0x00A9, 0x0404, 0x00AB, 0x00AC, 0x00AD, 0x00AE, 0x0407, /* A8-AF */
+ 0x00B0, 0x00B1, 0x0406, 0x0456, 0x0491, 0x00B5, 0x00B6, 0x00B7, /* B0-B7 */
+ 0x0451, 0x2116, 0x0454, 0x00BB, 0x0458, 0x0405, 0x0455, 0x0457 /* B8-BF */
+};
+
+/*
+ * ISO-8859-2 (Latin Extended) to Unicode for bytes 0xA1..0xFF (95 entries).
+ * Indexed by (byte - 0xA1).  iso_decode() passes bytes below 0xA1 through
+ * unchanged, so they need no table entries.
+ */
+static const unsigned short iso8859_2_to_uni[] = {
+ 0x0104, 0x02D8, 0x0141, 0x00A4, 0x013D, 0x015A, 0x00A7, /* A1-A7 */
+ 0x00A8, 0x0160, 0x015E, 0x0164, 0x0179, 0x00AD, 0x017D, 0x017B, /* A8-AF */
+ 0x00B0, 0x0105, 0x02DB, 0x0142, 0x00B4, 0x013E, 0x015B, 0x02C7, /* B0-B7 */
+ 0x00B8, 0x0161, 0x015F, 0x0165, 0x017A, 0x02DD, 0x017E, 0x017C, /* B8-BF */
+ 0x0154, 0x00C1, 0x00C2, 0x0102, 0x00C4, 0x0139, 0x0106, 0x00C7, /* C0-C7 */
+ 0x010C, 0x00C9, 0x0118, 0x00CB, 0x011A, 0x00CD, 0x00CE, 0x010E, /* C8-CF */
+ 0x0110, 0x0143, 0x0147, 0x00D3, 0x00D4, 0x0150, 0x00D6, 0x00D7, /* D0-D7 */
+ 0x0158, 0x016E, 0x00DA, 0x0170, 0x00DC, 0x00DD, 0x0162, 0x00DF, /* D8-DF */
+ 0x0155, 0x00E1, 0x00E2, 0x0103, 0x00E4, 0x013A, 0x0107, 0x00E7, /* E0-E7 */
+ 0x010D, 0x00E9, 0x0119, 0x00EB, 0x011B, 0x00ED, 0x00EE, 0x010F, /* E8-EF */
+ 0x0111, 0x0144, 0x0148, 0x00F3, 0x00F4, 0x0151, 0x00F6, 0x00F7, /* F0-F7 */
+ 0x0159, 0x016F, 0x00FA, 0x0171, 0x00FC, 0x00FD, 0x0163, 0x02D9 /* F8-FF */
+};
+
+/*
+ * Map one byte of the 8-bit codepage selected by cp to a Unicode code point.
+ * Depending on the codepage a byte is passed through unchanged, shifted by a
+ * constant offset, replaced by a special-cased value, or looked up in one of
+ * the conversion tables.  Returns 0 when cp is not one of 0x01..0x07.
+ */
+static unsigned short iso_decode_byte(unsigned char c, int cp)
+{
+    switch (cp) {
+    case 0x01: /* Greek (ISO-8859-7) */
+        if (c < 0xA1)
+            return c;
+        if (c > 0xB7)
+            return c + 0x02D0;          /* 0xB8 -> 0x0388, ... */
+        return iso8859_7_to_uni[c - 0xA1];
+
+    case 0x02: /* Hebrew (ISO-8859-8) */
+        /* The three special cases must win over the range tests below. */
+        switch (c) {
+        case 0xAA:
+            return 0x00D7;
+        case 0xBA:
+            return 0x00F7;
+        case 0xDF:
+            return 0x2017;
+        default:
+            break;
+        }
+        if (c < 0xC0)
+            return c;
+        return c + 0x04F0;              /* 0xE0 -> 0x05D0, ... */
+
+    case 0x03: /* Russian (CP1251) */
+        if (c < 0x80)
+            return c;
+        if (c > 0xBF)
+            return c + 0x0350;          /* 0xC0 -> 0x0410, ... */
+        return cp1251_to_uni[c - 0x80];
+
+    case 0x04: /* Thai (ISO-8859-11) */
+        if (c < 0xA1)
+            return c;
+        return c + 0x0D60;              /* 0xA1 -> 0x0E01, ... */
+
+    case 0x05: /* Arabic (ISO-8859-6) */
+        if (c < 0xAC || c == 0xAD)
+            return c;
+        return c + 0x0560;              /* 0xAC -> 0x060C, ... */
+
+    case 0x06: /* Turkish (ISO-8859-9) */
+        /* Identical to the input byte except for six letters. */
+        switch (c) {
+        case 0xD0:
+            return 0x011E;
+        case 0xDD:
+            return 0x0130;
+        case 0xDE:
+            return 0x015E;
+        case 0xF0:
+            return 0x011F;
+        case 0xFD:
+            return 0x0131;
+        case 0xFE:
+            return 0x015F;
+        default:
+            return c;
+        }
+
+    case 0x07: /* Latin Extended (ISO-8859-2) */
+        if (c < 0xA1)
+            return c;
+        return iso8859_2_to_uni[c - 0xA1];
+
+    default:
+        return 0;
+    }
+}
+
+/*
+ * Convert bytes in the codepage selected by cp to Unicode.
+ *
+ * latin1: input bytes; at least count bytes must be readable
+ * cp:     codepage id, 0x01..0x07 (see the case labels in iso_decode_byte)
+ * count:  number of input bytes
+ *
+ * Only one value can be returned, so the result is the code point of the
+ * LAST of the count bytes; earlier bytes cannot influence it and are not
+ * read.  Returns 0 if count is not positive or cp is unknown, in which case
+ * latin1 is not dereferenced at all.
+ */
+unsigned short iso_decode(unsigned char *latin1, int cp, int count)
+{
+    /* A negative count used to run the loop off the end of the buffer. */
+    if (count <= 0)
+        return 0;
+    if (cp < 0x01 || cp > 0x07)
+        return 0;
+
+    return iso_decode_byte(latin1[count - 1], cp);
+}
+
+/*
+ * Write s to f as two bytes, least significant byte first.
+ * Returns non-zero on success and 0 if either byte could not be written;
+ * the high byte is not attempted once the low byte has failed.
+ */
+int writeshort(FILE *f, unsigned short s)
+{
+    if (putc(s & 0xFF, f) == EOF)
+        return 0;
+    return putc((s >> 8) & 0xFF, f) != EOF;
+}
+
+/* Open path for binary writing; prints a diagnostic and returns NULL on
+ * failure. */
+static FILE *open_output(const char *path)
+{
+    FILE *f = fopen(path, "wb");
+
+    if (!f)
+        perror(path);
+    return f;
+}
+
+/*
+ * Close an output stream and report whether everything reached the file.
+ * A failed putc() leaves the stream's error indicator set, so checking it
+ * here covers every write made since the stream was opened; fclose() can
+ * additionally fail when flushing buffered data.
+ * Returns 0 on success, -1 on failure (after printing a diagnostic).
+ */
+static int close_output(FILE *f, const char *path)
+{
+    int failed = ferror(f);
+
+    if (fclose(f) != 0)
+        failed = 1;
+    if (failed)
+        fprintf(stderr, "codepages: error writing %s\n", path);
+    return failed ? -1 : 0;
+}
+
+/*
+ * Generate the binary codepage files in the current directory:
+ *   iso.cp  - for each codepage id 1..7, the 128 code points that
+ *             iso_decode() yields for bytes 0x80..0xFF
+ *   932.cp, 936.cp, 949.cp, 950.cp - the first MAX_TABLE_SIZE entries of
+ *             the corresponding cpNNN_table
+ * Every value is written with writeshort().
+ * Returns 0 on success, 1 if any file could not be opened or fully written.
+ */
+int main(void)
+{
+    int i, j;
+    unsigned char k;
+    const char *path;
+    FILE *of;
+
+    /* Retained from the original; iso_table is not read in this file. */
+    for (i = 0; i < MAX_TABLE_SIZE; i++)
+        iso_table[i] = 0;
+
+    path = "iso.cp";
+    of = open_output(path);
+    if (!of)
+        return 1;
+    for (i = 1; i < 8; i++) {
+        for (j = 0; j < 128; j++) {
+            k = (unsigned char)(j + 128);
+            writeshort(of, iso_decode(&k, i, 1));
+        }
+    }
+    if (close_output(of, path) != 0)
+        return 1;
+
+    path = "932.cp";
+    of = open_output(path);
+    if (!of)
+        return 1;
+    for (i = 0; i < MAX_TABLE_SIZE; i++)
+        writeshort(of, cp932_table[i]);
+    if (close_output(of, path) != 0)
+        return 1;
+
+    path = "936.cp";
+    of = open_output(path);
+    if (!of)
+        return 1;
+    for (i = 0; i < MAX_TABLE_SIZE; i++)
+        writeshort(of, cp936_table[i]);
+    if (close_output(of, path) != 0)
+        return 1;
+
+    path = "949.cp";
+    of = open_output(path);
+    if (!of)
+        return 1;
+    for (i = 0; i < MAX_TABLE_SIZE; i++)
+        writeshort(of, cp949_table[i]);
+    if (close_output(of, path) != 0)
+        return 1;
+
+    path = "950.cp";
+    of = open_output(path);
+    if (!of)
+        return 1;
+    for (i = 0; i < MAX_TABLE_SIZE; i++)
+        writeshort(of, cp950_table[i]);
+    if (close_output(of, path) != 0)
+        return 1;
+
+    return 0;
+}