Mercurial > freewnn
view Wnn/jserver/atojis.c @ 18:e7e2aba67cb3
disabled build for cWnn and kWnn by default
author | Yoshiki Yazawa <yaz@cc.rim.or.jp> |
---|---|
date | Mon, 14 Apr 2008 17:33:53 +0900 |
parents | bbc77ca4def5 |
children |
line wrap: on
line source
/* * $Id: atojis.c,v 1.3 2001/06/14 18:15:59 ura Exp $ */ /* * FreeWnn is a network-extensible Kana-to-Kanji conversion system. * This file is part of FreeWnn. * * Copyright Kyoto University Research Institute for Mathematical Sciences * 1987, 1988, 1989, 1990, 1991, 1992 * Copyright OMRON Corporation. 1987, 1988, 1989, 1990, 1991, 1992, 1999 * Copyright ASTEC, Inc. 1987, 1988, 1989, 1990, 1991, 1992 * Copyright FreeWnn Project 1999, 2000 * * Maintainer: FreeWnn Project <freewnn@tomo.gr.jp> * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ #include "commonhd.h" #include "de_header.h" #include "kaiseki.h" static int keta_4; static w_char _tatojis[] = { #ifdef CHINESE 0xa1a1, 0xa3a1, 0xa3a2, 0xa3a3, 0xa1e7, 0xa3a5, 0xa3a6, 0xa3a7, 0xa3a8, 0xa3a9, 0xa3aa, 0xa3ab, 0xa3ac, 0xa3ad, 0xa3ae, 0xa3af, 0xa3b0, 0xa3b1, 0xa3b2, 0xa3b3, 0xa3b4, 0xa3b5, 0xa3b6, 0xa3b7, 0xa3b8, 0xa3b9, 0xa3ba, 0xa3bb, 0xa3bc, 0xa3bd, 0xa3be, 0xa3bf, 0xa3c0, 0xa3c1, 0xa3c2, 0xa3c3, 0xa3c4, 0xa3c5, 0xa3c6, 0xa3c7, 0xa3c8, 0xa3c9, 0xa3ca, 0xa3cb, 0xa3cc, 0xa3cd, 0xa3ce, 0xa3cf, 0xa3d0, 0xa3d1, 0xa3d2, 0xa3d3, 0xa3d4, 0xa3d5, 0xa3d6, 0xa3d7, 0xa3d8, 0xa3d9, 0xa3da, 0xa3db, 0xa3dc, 0xa3dd, 0xa3de, 0xa3df, 0xa3e0, 0xa3e1, 0xa3e2, 0xa3e3, 0xa3e4, 0xa3e5, 0xa3e6, 0xa3e7, 0xa3e8, 0xa3e9, 0xa3ea, 0xa3eb, 0xa3ec, 0xa3ed, 0xa3ee, 0xa3ef, 0xa3f0, 0xa3f1, 0xa3f2, 0xa3f3, 0xa3f4, 0xa3f5, 0xa3f6, 0xa3f7, 0xa3f8, 0xa3f9, 0xa3fa, 0xa3fb, 0xa3fc, 0xa3fd, 0xa3fe, 0x007f #else # ifdef KOREAN 0xa1a1, 0xa3a1, 0xa3a2, 0xa3a3, 0xa3a4, 0xa3a5, 0xa3a6, 0xa3a7, 0xa3a8, 0xa3a9, 0xa3aa, 0xa3ab, 0xa3ac, 0xa3ad, 0xa3ae, 0xa3af, 0xa3b0, 0xa3b1, 0xa3b2, 0xa3b3, 0xa3b4, 0xa3b5, 0xa3b6, 0xa3b7, 0xa3b8, 0xa3b9, 0xa3ba, 0xa3bb, 0xa3bc, 0xa3bd, 0xa3be, 0xa3bf, 0xa3c0, 0xa3c1, 0xa3c2, 0xa3c3, 0xa3c4, 0xa3c5, 0xa3c6, 0xa3c7, 0xa3c8, 0xa3c9, 0xa3ca, 0xa3cb, 0xa3cc, 0xa3cd, 0xa3ce, 0xa3cf, 0xa3d0, 0xa3d1, 0xa3d2, 0xa3d3, 0xa3d4, 0xa3d5, 0xa3d6, 0xa3d7, 0xa3d8, 0xa3d9, 0xa3da, 0xa3db, 0xa1ac, 0xa3dd, 0xa3de, 0xa3df, 0xa3e0, 0xa3e1, 0xa3e2, 0xa3e3, 0xa3e4, 0xa3e5, 0xa3e6, 0xa3e7, 0xa3e8, 0xa3e9, 0xa3ea, 0xa3eb, 0xa3ec, 0xa3ed, 0xa3ee, 0xa3ef, 0xa3f0, 0xa3f1, 0xa3f2, 0xa3f3, 0xa3f4, 0xa3f5, 0xa3f6, 0xa3f7, 0xa3f8, 0xa3f9, 0xa3fa, 0xa3fb, 0xa3fc, 0xa3fd, 0xa3fe, 0x007f, # else /* JAPANESE */ 0xa1a1, 0xa1aa, 0xa1c9, 0xa1f4, 0xa1f0, 0xa1f3, 0xa1f5, 0xa1c7, 0xa1ca, 0xa1cb, 0xa1f6, 0xa1dc, 0xa1a4, 0xa1dd, 0xa1a5, 0xa1bf, 0xa3b0, 0xa3b1, 0xa3b2, 0xa3b3, 0xa3b4, 0xa3b5, 0xa3b6, 0xa3b7, 0xa3b8, 0xa3b9, 0xa1a7, 0xa1a8, 0xa1e3, 0xa1e1, 0xa1e4, 0xa1a9, 0xa1f7, 0xa3c1, 0xa3c2, 0xa3c3, 0xa3c4, 0xa3c5, 0xa3c6, 0xa3c7, 0xa3c8, 0xa3c9, 0xa3ca, 0xa3cb, 0xa3cc, 0xa3cd, 0xa3ce, 0xa3cf, 0xa3d0, 0xa3d1, 0xa3d2, 0xa3d3, 0xa3d4, 0xa3d5, 0xa3d6, 0xa3d7, 0xa3d8, 0xa3d9, 0xa3da, 0xa1ce, 0xa1c0, 0xa1cf, 0xa1b0, 0xa1b2, 0xa1ae, 0xa3e1, 0xa3e2, 0xa3e3, 0xa3e4, 0xa3e5, 0xa3e6, 0xa3e7, 0xa3e8, 0xa3e9, 0xa3ea, 0xa3eb, 0xa3ec, 0xa3ed, 0xa3ee, 0xa3ef, 0xa3f0, 0xa3f1, 0xa3f2, 0xa3f3, 0xa3f4, 0xa3f5, 0xa3f6, 0xa3f7, 0xa3f8, 0xa3f9, 0xa3fa, 0xa1d0, 0xa1c3, 0xa1d1, 0xa1b1, 0x007f # endif /* KOREAN */ #endif /* CHINESE */ }; static int atojis (c) register w_char c; { if (c >= ' ' && c <= (unsigned char) '\376') c = _tatojis[c - ' ']; return (c); } static w_char _tatokan[] = { #ifdef CHINESE 0xa1f0, 0xd2bb, 0xb6fe, 0xc8fd, 0xcbc4, /* ¡ðÒ»¶þÈýËÄ */ 0xcee5, 0xc1f9, 0xc6df, 0xb0cb, 0xbec5 /* ÎåÁùÆ߰˾Š*/ #else # ifdef KOREAN 0xd6c3, 0xece9, 0xeca3, 0xdfb2, 0xdecc, /* ÖÃìéì£ß²ÞÌ */ 0xe7e9, 0xd7bf, 0xf6d2, 0xf8a2, 0xcefa, /* çé׿öÒø¢Îú */ # else /* JAPANESE */ 0xa1bb, 0xb0ec, 0xc6f3, 0xbbb0, 0xbbcd, /* ¡»°ìÆó»°»Í */ 0xb8de, 0xcfbb, 0xbcb7, 0xc8ac, 0xb6e5 /* ¸ÞÏ»¼·È¬¶å */ # endif /* KOREAN */ #endif /* CHINESE */ }; static w_char _tatokan_o[] = { #ifdef CHINESE 0xc1e3, 0xd2bc, 0xb7a1, 0xc8fe, 0xcbc1, /* ÁãÒ¼·¡ÈþËÁ */ 0xcee9, 0xc2bd, 0xc6e2, 0xb0c6, 0xbec1 /* Îé½Æâ°Æ¾Á */ #else # ifdef KOREAN 0xd6c3, 0xecec, 0xecc3, 0xdfb3, 0xdecc, /* ÖÃìììÃß³ÞÌ */ 0xe7ea, 0xd7bf, 0xf6d2, 0xf8a2, 0xcefa, /* çê׿öÒø¢Îú */ #else /* JAPANESE */ 0xceed, 0xb0ed, 0xc6f5, 0xbbb2, 0xbbcd, /* Îí°íÆõ»²»Í */ 0xb8e0, 0xcfbb, 0xbcb7, 0xc8ac, 0xb6e5 /* ¸àÏ»¼·È¬¶å */ # endif /* KOREAN */ #endif /* CHINESE */ }; static w_char atokan (c) register w_char c; { if (c >= '0' && c <= '9') c = _tatokan[c - '0']; else if (c >= S_NUM && c <= S_NUM + 9) c = _tatokan[c - S_NUM]; return (c); } static w_char atokan_o (c) register w_char c; { if (c >= '0' && c <= '9') c = _tatokan_o[c - '0']; else if (c >= S_NUM && c <= S_NUM + 9) c = _tatokan_o[c - S_NUM]; return (c); } static w_char _tatoket[] = { #ifdef CHINESE 0xcaae, 0xb0d9, 0xc7a7, /* Ê®°Ùǧ */ 0xcdf2, 0xd2da, 0xd5d7, 0xbea9, /* ÍòÒÚÕ×¾© */ 0xdbf2, 0xeff6, 0xf0a6, 0xb9b5, /* Ûòïö(Êã)𦹵 */ 0xbda7, 0xd5fd, 0xd4d8, 0xbcab /* ½§ÕýÔؼ« */ /* ºãºÓɳ *//* °¢É®?? *//* ÄÇÓÉËû *//* ²»¿É˼Òé *//* ÎÞÁ¿´óÊý */ #else # ifdef KOREAN 0xe4a8, 0xdbdd, 0xf4b6, /* ä¨ÛÝô¶ */ 0xd8b2, 0xe5e2, 0xf0bc, 0xccc8, /* زåâð¼ÌÈ */ 0xfaa7, 0xdff1, 0xe5cd, 0xcfb5, /* ú§ßñåÍϵ */ 0xcad5, 0xefe1, 0xeeb0, 0xd0bf, /* ÊÕïáî°Ð¿ */ /* ùöùÁÞÞ ä¹ã¬Ñ¶ Ñáë¦öâ ÜôʦÞÖì¡ ÙíÕáÓÞ⦠*/ # else /* JAPANESE */ 0xbdbd, 0xc9b4, 0xc0e9, /* ½½É´Àé */ 0xcbfc, 0xb2af, 0xc3fb, 0xb5fe, /* Ëü²¯Ãûµþ */ 0xd4b6, 0xd9b3, 0xbef7, 0xb9c2, /* Ô¶Ù³(¤·d126)¾÷¹Â */ 0xb4c2, 0xc0b5, 0xbadc, 0xb6cb /* ´ÂÀµºÜ¶Ë */ /* ¹±²Ïº» *//* °¤ÁεÀ *//* Æáͳ¾ *//* ÉÔ²Ä»×µÄ *//* ̵ÎÌÂç¿ô */ # endif /* KOREAN */ #endif /* CHINESE */ }; static w_char _tatoket_o[] = { #ifdef CHINESE 0xcab0, 0xb0db, 0xc7aa, /* Ê°°ÛǪ */ 0xcdf2 /* Íò */ #else # ifdef KOREAN 0xe3a6, 0xd8e8, 0xf4c6, /* ã¦ØèôÆ */ 0xd8bf /* Ø¿ */ # else /* JAPANESE */ 0xbda6, 0xeff9, 0xeff4, /* ½¦ïùïô */ 0xe8df /* èß */ # endif /* KOREAN */ #endif /* CHINESE */ }; static void getketa (k, kouho, col) int k; w_char kouho[]; int *col; { if (k % 4) { if (keta_4 != 0) { keta_4 = 0; getketa (k / 4 * 4, kouho, col); } kouho[(*col)++] = _tatoket[k % 4 - 1]; } else if ((k / 4 > 0) && (k / 4 < 13)) { kouho[(*col)++] = _tatoket[k / 4 + 2]; } else if (k / 4 == 13) { #ifdef CHINESE kouho[(*col)++] = 0xc9b3; /* ºãºÓɳ */ kouho[(*col)++] = 0xbad3; kouho[(*col)++] = 0xbae3; #else # ifdef KOREAN kouho[(*col)++] = 0xdede; /* ùöùÁÞÞ */ kouho[(*col)++] = 0xf9c1; kouho[(*col)++] = 0xf9f6; # else /* JAPANESE */ kouho[(*col)++] = 0xbabb; kouho[(*col)++] = 0xb2cf; kouho[(*col)++] = 0xb9b1; /* ¹±²Ïº» */ # endif /* KOREAN */ #endif /* CHINESE */ } else if (k / 4 == 14) { #ifdef CHINESE kouho[(*col)++] = 0xecf3; /* °¢É®ìó */ kouho[(*col)++] = 0xc9ae; kouho[(*col)++] = 0xb0a2; #else # ifdef KOREAN kouho[(*col)++] = 0xd1b6; /* ä¹ã¬Ñ¶ */ kouho[(*col)++] = 0xe3ac; kouho[(*col)++] = 0xe4b9; # else /* JAPANESE */ kouho[(*col)++] = 0xb5c0; kouho[(*col)++] = 0xc1ce; kouho[(*col)++] = 0xb0a4; /* °¤ÁεÀ */ # endif /* KOREAN */ #endif /* CHINESE */ } else if (k / 4 == 15) { #ifdef CHINESE kouho[(*col)++] = 0xcbfb; /* ÄÇÓÉËû */ kouho[(*col)++] = 0xd3c9; kouho[(*col)++] = 0xc4c7; #else # ifdef KOREAN kouho[(*col)++] = 0xf6e2; /* Ñáë¦öâ */ kouho[(*col)++] = 0xeba6; kouho[(*col)++] = 0xd1e1; # else /* JAPANESE */ kouho[(*col)++] = 0xc2be; kouho[(*col)++] = 0xcdb3; kouho[(*col)++] = 0xc6e1; /* Æáͳ¾ */ # endif /* KOREAN */ #endif /* CHINESE */ } else if (k / 4 == 16) { #ifdef CHINESE kouho[(*col)++] = 0xd2e5; kouho[(*col)++] = 0xcbbc; kouho[(*col)++] = 0xbfc9; kouho[(*col)++] = 0xb2bb; /* ²»¿É˼Òå */ #else # ifdef KOREAN kouho[(*col)++] = 0xeca1; /* ÜôʦÞÖì¡ */ kouho[(*col)++] = 0xded6; kouho[(*col)++] = 0xcaa6; kouho[(*col)++] = 0xdcf4; # else /* JAPANESE */ kouho[(*col)++] = 0xb5c4; kouho[(*col)++] = 0xbbd7; kouho[(*col)++] = 0xb2c4; kouho[(*col)++] = 0xc9d4; /* ÉÔ²Ä»×µÄ */ # endif /* KOREAN */ #endif /* CHINESE */ } else if (k / 4 == 17) { #ifdef CHINESE kouho[(*col)++] = 0xcafd; /* ÎÞÁ¿´óÊý */ kouho[(*col)++] = 0xb4f3; kouho[(*col)++] = 0xc1bf; kouho[(*col)++] = 0xcede; #else # ifdef KOREAN kouho[(*col)++] = 0xe2a6; /* ÙíÕáÓÞ⦠*/ kouho[(*col)++] = 0xd3de; kouho[(*col)++] = 0xd5e1; kouho[(*col)++] = 0xd9ed; # else /* JAPANESE */ kouho[(*col)++] = 0xbff4; kouho[(*col)++] = 0xc2e7; kouho[(*col)++] = 0xcecc; kouho[(*col)++] = 0xccb5; /* ̵ÎÌÂç¿ô */ # endif /* KOREAN */ #endif /* CHINESE */ } else { #ifdef CHINESE kouho[(*col)++] = 0xa3bf; /* £¿ */ #else # ifdef KOREAN kouho[(*col)++] = 0xa3bf; /* £¿ */ # else /* JAPANESE */ kouho[(*col)++] = 0xa1a9; /* ¡© */ # endif /* KOREAN */ #endif /* CHINESE */ } keta_4 = 0; } static void getketa_o (k, kouho, col) int k; w_char kouho[]; int *col; { if (k % 4) { if (keta_4 != 0) { keta_4 = 0; if (k / 4 == 1) kouho[(*col)++] = _tatoket_o[3]; /* èß */ else getketa (k / 4 * 4, kouho, col); } kouho[(*col)++] = _tatoket_o[k % 4 - 1]; } else if (k / 4 == 1) { kouho[(*col)++] = _tatoket_o[3]; /* èß */ } else { getketa (k, kouho, col); } keta_4 = 0; } w_char * get_giji_knj (j, i, t, kouho) int j; int i; int t; w_char *kouho; { register int k; w_char revkouho[1000]; int col = 0, keta = 0; switch (t) { case WNN_NUM_ZEN: /* Á´³Ñ¿ô»ú *//* £±£²£³ */ #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) { if (k == i && #else for (k = j; k >= i; k--) { if (k == j && #endif /* CONVERT_from_TOP */ (isspace (bun[k]) || isjspace (bun[k]))) *kouho++ = bun[k]; else *kouho++ = atojis (bun[k]); } break; case WNN_ALP_ZEN: /* Á´³Ñ */ case WNN_KIG_JIS: case WNN_KIG_ASC: #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) #else for (k = j; k >= i; k--) #endif /* CONVERT_from_TOP */ *kouho++ = atojis (bun[k]); break; case WNN_KATAKANA: /* ¥«¥¿¥«¥Ê */ #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) { #else for (k = j; k >= i; k--) { #endif /* CONVERT_from_TOP */ if ((bun[k] & 0xff00) == 0xa400) *kouho++ = bun[k] | 0x100; else *kouho++ = bun[k]; } break; case WNN_NUM_KAN: /* ´Á¿ô»ú *//* °ìÆó»° */ #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) #else for (k = j; k >= i; k--) #endif /* CONVERT_from_TOP */ *kouho++ = atokan (bun[k]); break; case WNN_NUM_HANCAN: /* Ⱦ³Ñ¿ô»ú *//* 1,234 */ #ifdef CONVERT_from_TOP for (k = j; k >= i; k--) { if (k == i && #else for (k = i; k <= j; k++) { if (k == j && #endif /* CONVERT_from_TOP */ (isspace (bun[k]) || isjspace (bun[k]))) { revkouho[col++] = bun[k]; break; } if ((keta != 0) && (keta % 3 == 0)) revkouho[col++] = ','; /* , */ if (bun[k] >= S_NUM && bun[k] <= S_NUM + 9) revkouho[col++] = '0' + bun[k] - S_NUM; else revkouho[col++] = bun[k]; keta++; } while (--col >= 0) { *kouho++ = revkouho[col]; } break; case WNN_NUM_ZENCAN: /* Á´³Ñ¿ô»ú *//* £±¡¤£²£³£´ */ #ifdef CONVERT_from_TOP for (k = j; k >= i; k--) { if (k == i && #else for (k = i; k <= j; k++) { if (k == j && #endif /* CONVERT_from_TOP */ (isspace (bun[k]) || isjspace (bun[k]))) { revkouho[col++] = bun[k]; break; } if ((keta != 0) && (keta % 3 == 0)) revkouho[col++] = UJIS_comma; /* ¡¤ */ revkouho[col++] = atojis (bun[k]); keta++; } while (--col >= 0) { *kouho++ = revkouho[col]; } break; case WNN_NUM_KANSUUJI: /* ´Á¿ô»ú *//* É´Æó½½»° */ keta_4 = 0; #ifdef CONVERT_from_TOP for (k = j; k >= i; k--) { if (k == i && #else for (k = i; k <= j; k++) { if (k == j && #endif /* CONVERT_from_TOP */ (isspace (bun[k]) || isjspace (bun[k]))) { revkouho[col++] = bun[k]; break; } if (bun[k] != '0') { if (keta != 0) getketa (keta, revkouho, &col); if (bun[k] != '1' || #ifdef CHINESE keta % 4 != 1) #else /* JAPANESE */ keta % 4 == 0 || keta % 4 == 3) /* °ìÀéÉ´½½°ì */ #endif /* CHINESE */ revkouho[col++] = atokan (bun[k]); } else if ((keta != 0) && (keta % 4 == 0)) { keta_4 = 1; } keta++; } if (col == 0) *kouho++ = _tatokan[0]; while (--col >= 0) { *kouho++ = revkouho[col]; } break; case WNN_NUM_KANOLD: /* ´Á¿ô»ú *//* °íÉ´Æõ½¦»² */ keta_4 = 0; #ifdef CONVERT_from_TOP for (k = j; k >= i; k--) { if (k == i && #else for (k = i; k <= j; k++) { if (k == j && #endif /* CONVERT_from_TOP */ (isspace (bun[k]) || isjspace (bun[k]))) { revkouho[col++] = bun[k]; break; } if (bun[k] != '0') { if (keta != 0) getketa_o (keta, revkouho, &col); if (bun[k] != '1' || #ifdef CHINESE keta % 4 != 1) #else /* JAPANESE */ keta % 4 == 0 || keta % 4 == 3) /* °ìÀéÉ´½½°ì */ #endif /* CHINESE */ revkouho[col++] = atokan_o (bun[k]); } else if ((keta != 0) && (keta % 4 == 0)) { keta_4 = 1; } keta++; } if (col == 0) *kouho++ = _tatokan_o[0]; while (--col >= 0) { *kouho++ = revkouho[col]; } break; case WNN_NUM_HAN: /* 123 */ #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) { #else for (k = j; k >= i; k--) { #endif /* CONVERT_from_TOP */ if (bun[k] >= S_NUM && bun[k] <= S_NUM + 9) *kouho++ = '0' + bun[k] - S_NUM; else *kouho++ = bun[k]; } break; default: /* ¤Ò¤é¤¬¤Ê */ #ifdef CONVERT_from_TOP for (k = i; k <= j; k++) { #else for (k = j; k >= i; k--) { #endif /* CONVERT_from_TOP */ *kouho++ = bun[k]; } break; } *kouho++ = 0; return (kouho); } void giji_hindoup (t_jc) int t_jc; { if (t_jc >= 0) return; switch (t_jc) { case WNN_NUM_HAN: case WNN_NUM_ZEN: case WNN_NUM_KAN: case WNN_NUM_KANSUUJI: case WNN_NUM_KANOLD: case WNN_NUM_HANCAN: case WNN_NUM_ZENCAN: c_env->giji.number = t_jc; break; case WNN_ALP_HAN: case WNN_ALP_ZEN: c_env->giji.eisuu = t_jc; break; case WNN_KIG_HAN: case WNN_KIG_JIS: case WNN_KIG_ASC: c_env->giji.kigou = t_jc; break; default: return; } }