2005-12-06 13:27:15 +00:00
|
|
|
/***************************************************************************
|
|
|
|
* __________ __ ___.
|
|
|
|
* Open \______ \ ____ ____ | | _\_ |__ _______ ___
|
|
|
|
* Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
|
|
|
|
* Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
|
|
|
|
* Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
|
|
|
|
* \/ \/ \/ \/ \/
|
|
|
|
*
|
|
|
|
*
|
|
|
|
* Copyright (C) 2005 by Frank Dischner
|
|
|
|
*
|
|
|
|
* All files in this archive are subject to the GNU General Public License.
|
|
|
|
* See the file COPYING in the source tree root for full license agreement.
|
|
|
|
*
|
|
|
|
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
|
|
|
|
* KIND, either express or implied.
|
|
|
|
*
|
|
|
|
****************************************************************************/
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
2005-12-06 15:04:48 +00:00
|
|
|
#include "codepage_tables.h"
|
2005-12-06 13:27:15 +00:00
|
|
|
|
|
|
|
#define MAX_TABLE_SIZE 32768
|
|
|
|
|
2007-10-02 07:25:24 +00:00
|
|
|
static const int mini_index[6] = {
|
|
|
|
0, 1, 3, 6, 7, 8
|
2007-04-01 13:09:22 +00:00
|
|
|
};
|
|
|
|
|
2005-12-06 13:27:15 +00:00
|
|
|
static unsigned short iso_table[MAX_TABLE_SIZE];
|
|
|
|
|
|
|
|
unsigned short iso_decode(unsigned char *latin1, int cp, int count)
|
|
|
|
{
|
|
|
|
unsigned short ucs = 0;
|
|
|
|
|
|
|
|
/* cp tells us which codepage to convert from */
|
|
|
|
switch (cp) {
|
|
|
|
case 0x01: /* Greek (ISO-8859-7) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 < 0xA1)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else if (*latin1 > 0xB7)
|
|
|
|
ucs = *latin1++ + 0x02D0;
|
|
|
|
else
|
|
|
|
ucs = iso8859_7_to_uni[*latin1++ - 0xA1];
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 0x02: /* Hebrew (ISO-8859-8) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 == 0xAA) {
|
|
|
|
ucs = 0xD7;
|
|
|
|
latin1++;
|
|
|
|
} else if (*latin1 == 0xBA) {
|
|
|
|
ucs = 0xF7;
|
|
|
|
latin1++;
|
|
|
|
} else if (*latin1 == 0xDF) {
|
|
|
|
ucs = 0x2017;
|
|
|
|
latin1++;
|
|
|
|
} else if (*latin1 < 0xC0)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else
|
|
|
|
ucs = *latin1++ + 0x04F0;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2006-04-05 14:23:57 +00:00
|
|
|
case 0x03: /* Cyrillic (CP1251) */
|
2005-12-06 13:27:15 +00:00
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 < 0x80)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else if (*latin1 > 0xBF)
|
|
|
|
ucs = *latin1++ + 0x0350;
|
|
|
|
else
|
|
|
|
ucs = cp1251_to_uni[*latin1++ - 0x80];
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 0x04: /* Thai (ISO-8859-11) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 < 0xA1)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else
|
|
|
|
ucs = *latin1++ + 0x0D60;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2006-01-10 17:12:33 +00:00
|
|
|
case 0x05: /* Arabic (CP1256) */
|
2005-12-06 13:27:15 +00:00
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
2006-01-10 17:12:33 +00:00
|
|
|
if (*latin1 < 0x80)
|
2005-12-06 13:27:15 +00:00
|
|
|
ucs = *latin1++;
|
2006-01-10 17:12:33 +00:00
|
|
|
else
|
|
|
|
ucs = cp1256_to_uni[*latin1++ - 0x80];
|
2005-12-06 13:27:15 +00:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 0x06: /* Turkish (ISO-8859-9) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
switch (*latin1) {
|
|
|
|
case 0xD0:
|
|
|
|
ucs = 0x011E;
|
|
|
|
break;
|
|
|
|
case 0xDD:
|
|
|
|
ucs = 0x0130;
|
|
|
|
break;
|
|
|
|
case 0xDE:
|
|
|
|
ucs = 0x015E;
|
|
|
|
break;
|
|
|
|
case 0xF0:
|
|
|
|
ucs = 0x011F;
|
|
|
|
break;
|
|
|
|
case 0xFD:
|
|
|
|
ucs = 0x0131;
|
|
|
|
break;
|
|
|
|
case 0xFE:
|
|
|
|
ucs = 0x015F;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
ucs = *latin1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
latin1++;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 0x07: /* Latin Extended (ISO-8859-2) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 < 0xA1)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else
|
|
|
|
ucs = iso8859_2_to_uni[*latin1++ - 0xA1];
|
|
|
|
}
|
|
|
|
break;
|
2007-10-01 17:16:31 +00:00
|
|
|
|
|
|
|
case 0x08: /* Central European (CP1250) */
|
|
|
|
while (count--) {
|
|
|
|
/* first convert to unicode */
|
|
|
|
if (*latin1 < 0x80)
|
|
|
|
ucs = *latin1++;
|
|
|
|
else
|
|
|
|
ucs = cp1250_to_uni[*latin1++ - 0x80];
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2005-12-06 13:27:15 +00:00
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return ucs;
|
|
|
|
}
|
|
|
|
|
|
|
|
int writeshort(FILE *f, unsigned short s)
|
|
|
|
{
|
|
|
|
putc(s, f);
|
|
|
|
return putc(s>>8, f) != EOF;
|
|
|
|
}
|
|
|
|
|
2007-04-01 13:09:22 +00:00
|
|
|
void print_usage(void)
|
2005-12-06 13:27:15 +00:00
|
|
|
{
|
2007-04-01 13:09:22 +00:00
|
|
|
printf("Usage: codepages [-m]\n"
|
|
|
|
"\t-m Create isomini.cp only\n");
|
|
|
|
printf("build date: " __DATE__ "\n\n");
|
|
|
|
}
|
2005-12-06 13:27:15 +00:00
|
|
|
|
2007-04-01 13:09:22 +00:00
|
|
|
int main(int argc, char **argv)
|
|
|
|
{
|
|
|
|
int mini = 0;
|
2005-12-06 13:27:15 +00:00
|
|
|
int i, j;
|
|
|
|
unsigned char k;
|
|
|
|
unsigned short uni;
|
|
|
|
FILE *of;
|
|
|
|
|
2007-04-01 13:09:22 +00:00
|
|
|
for (i = 1;i < argc;i++)
|
|
|
|
{
|
|
|
|
if (argv[i][0] == '-')
|
|
|
|
{
|
|
|
|
switch (argv[i][1])
|
|
|
|
{
|
|
|
|
case 'm': /* create isomini.cp only */
|
|
|
|
mini = 1;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 'h': /* help */
|
|
|
|
case '?':
|
|
|
|
print_usage();
|
|
|
|
exit(1);
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
print_usage();
|
|
|
|
exit(1);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2005-12-06 13:27:15 +00:00
|
|
|
for (i=0; i < MAX_TABLE_SIZE; i++)
|
|
|
|
iso_table[i] = 0;
|
|
|
|
|
2007-04-01 13:09:22 +00:00
|
|
|
if (mini) {
|
|
|
|
of = fopen("isomini.cp", "wb");
|
|
|
|
if (!of) return 1;
|
2005-12-06 13:27:15 +00:00
|
|
|
|
2007-10-02 07:25:24 +00:00
|
|
|
for (i=1; i<6; i++) {
|
2005-12-06 13:27:15 +00:00
|
|
|
|
2007-04-01 13:09:22 +00:00
|
|
|
for (j=0; j<128; j++) {
|
|
|
|
k = (unsigned char)j + 128;
|
|
|
|
uni = iso_decode(&k, mini_index[i], 1);
|
|
|
|
writeshort(of, uni);
|
|
|
|
}
|
2005-12-06 13:27:15 +00:00
|
|
|
}
|
2007-04-01 13:09:22 +00:00
|
|
|
fclose(of);
|
2005-12-06 13:27:15 +00:00
|
|
|
}
|
2007-04-01 13:09:22 +00:00
|
|
|
else {
|
|
|
|
of = fopen("iso.cp", "wb");
|
|
|
|
if (!of) return 1;
|
2005-12-06 13:27:15 +00:00
|
|
|
|
2007-10-01 17:16:31 +00:00
|
|
|
for (i=1; i<9; i++) {
|
2007-04-01 13:09:22 +00:00
|
|
|
|
|
|
|
for (j=0; j<128; j++) {
|
|
|
|
k = (unsigned char)j + 128;
|
|
|
|
uni = iso_decode(&k, i, 1);
|
|
|
|
writeshort(of, uni);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
fclose(of);
|
|
|
|
|
|
|
|
of = fopen("932.cp", "wb");
|
|
|
|
if (!of) return 1;
|
|
|
|
for (i=0; i < MAX_TABLE_SIZE; i++)
|
|
|
|
writeshort(of, cp932_table[i]);
|
|
|
|
fclose(of);
|
|
|
|
|
|
|
|
of = fopen("936.cp", "wb");
|
|
|
|
if (!of) return 1;
|
|
|
|
for (i=0; i < MAX_TABLE_SIZE; i++)
|
|
|
|
writeshort(of, cp936_table[i]);
|
|
|
|
fclose(of);
|
|
|
|
|
|
|
|
of = fopen("949.cp", "wb");
|
|
|
|
if (!of) return 1;
|
|
|
|
for (i=0; i < MAX_TABLE_SIZE; i++)
|
|
|
|
writeshort(of, cp949_table[i]);
|
|
|
|
fclose(of);
|
|
|
|
|
|
|
|
of = fopen("950.cp", "wb");
|
|
|
|
if (!of) return 1;
|
|
|
|
for (i=0; i < MAX_TABLE_SIZE; i++)
|
|
|
|
writeshort(of, cp950_table[i]);
|
|
|
|
fclose(of);
|
|
|
|
}
|
2005-12-06 13:27:15 +00:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|