12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445 |
- /*
- * CDE - Common Desktop Environment
- *
- * Copyright (c) 1993-2012, The Open Group. All rights reserved.
- *
- * These libraries and programs are free software; you can
- * redistribute them and/or modify them under the terms of the GNU
- * Lesser General Public License as published by the Free Software
- * Foundation; either version 2 of the License, or (at your option)
- * any later version.
- *
- * These libraries and programs are distributed in the hope that
- * they will be useful, but WITHOUT ANY WARRANTY; without even the
- * implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
- * PURPOSE. See the GNU Lesser General Public License for more
- * details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with these libraries and programs; if not, write
- * to the Free Software Foundation, Inc., 51 Franklin Street, Fifth
- * Floor, Boston, MA 02110-1301 USA
- */
- /* lcUTF.c 1.1 - Fujitsu source for CDEnext 95/11/06 20:32:41 */
- /* $XConsortium: _fallcUTF.c /main/2 1996/09/27 19:03:38 drk $ */
- /******************************************************************
- Copyright 1993 by SunSoft, Inc.
- Permission to use, copy, modify, distribute, and sell this software
- and its documentation for any purpose is hereby granted without fee,
- provided that the above copyright notice appear in all copies and
- that both that copyright notice and this permission notice appear
- in supporting documentation, and that the name of SunSoft, Inc.
- not be used in advertising or publicity pertaining to distribution
- of the software without specific, written prior permission.
- SunSoft, Inc. makes no representations about the suitability of
- this software for any purpose. It is provided "as is" without
- express or implied warranty.
- SunSoft Inc. DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
- SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS,
- IN NO EVENT SHALL SunSoft, Inc. BE LIABLE FOR ANY SPECIAL, INDIRECT
- OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS
- OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE
- OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE
- OR PERFORMANCE OF THIS SOFTWARE.
- Author: Hiromu Inukai (inukai@Japan.Sun.COM) SunSoft, inc.
- ******************************************************************/
- #include "_fallcUTF.h"
- #include <stdlib.h>
- static long getutfrune(char **read_from, int *from_len);
- static void our_wctomb(
- unsigned short r,
- char **bufptr,
- int *buf_len
- );
- static int our_mbtowc(
- unsigned long *p,
- char *s,
- size_t n
- );
- static void latin2rune(
- unsigned char c,
- Rune *r
- );
- static void jis02012rune(
- unsigned char c,
- Rune *r
- );
- static void jis02082rune(
- unsigned char c,
- Rune *r
- );
- static void ksc2rune(
- unsigned char c,
- Rune *r
- );
- static void gb2rune(
- unsigned char c,
- Rune *r
- );
- static void init_latin1tab(long *tbl, long fb_default);
- static void init_latin2tab(long *tbl, long fb_default);
- static void init_latin3tab(long *tbl, long fb_default);
- static void init_latin4tab(long *tbl, long fb_default);
- static void init_latin5tab(long *tbl, long fb_default);
- static void init_latin6tab(long *tbl, long fb_default);
- static void init_latin7tab(long *tbl, long fb_default);
- static void init_latin8tab(long *tbl, long fb_default);
- static void init_latin9tab(long *tbl, long fb_default);
- static void init_jis0201tab(long *tbl, long fb_default);
- static void init_jis0208tab(long *tbl, long fb_default);
- static void init_ksc5601tab(long *tbl, long fb_default);
- static void init_gb2312tab(long *tbl, long fb_default);
- static char *int_locale = NULL;
- static long *tabkuten = NULL;
- static long *tabksc5601 = NULL;
- static long *tabgb = NULL;
- static UtfData utfdata_list = (UtfData)NULL;
- static XlcUTFDataRec default_utf_data[] =
- {
- {"ISO8859-1", XlcGL, init_latin1tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin1tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin2tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin2tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin3tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin3tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin4tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin4tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin5tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin5tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin6tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin6tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin7tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin7tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin8tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin8tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGL, init_latin9tab, latin2rune, N11n_none, 0x20},
- {"ISO8859-1", XlcGR, init_latin9tab, latin2rune, N11n_none, 0x20},
- {"JISX0201.1976-0", XlcGL, init_jis0201tab, jis02012rune, N11n_none, 0x20},
- {"JISX0201.1976-0", XlcGR, init_jis0201tab, jis02012rune, N11n_none, 0x20},
- {"JISX0208.1983-0", XlcGL, init_jis0208tab, jis02082rune, N11n_ja, 0x2222},
- {"JISX0208.1983-0", XlcGR, init_jis0208tab, jis02082rune, N11n_ja, 0x2222},
- {"KSC5601.1987-0", XlcGL, init_ksc5601tab, ksc2rune, N11n_ko, 0x2160},
- {"KSC5601.1987-0", XlcGR, init_ksc5601tab, ksc2rune, N11n_ko, 0x2160},
- {"GB2312.1980-0", XlcGL, init_gb2312tab, gb2rune, N11n_zh, 0x2175},
- {"GB2312.1980-0", XlcGR, init_gb2312tab, gb2rune, N11n_zh, 0x2175},
- };
/*
 * Overwrite the first 0x1fff slots of `table` with `default_val`.
 * Slots from index 0x1fff onward are left untouched.
 */
static void
set_latin_nop(long *table, long default_val)
{
    long *slot = table;
    long *const stop = table + 0x1fff;

    while (slot != stop) {
        *slot++ = default_val;
    }
}
- static void
- set_latin_tab(FILE *fptr, long *table, long fb_default)
- {
- int i = 0;
- int j = 0;
- int rv = 0;
- long value;
- for(i = 0; i < NRUNE; i++)
- table[i] = -1;
- while((rv = fscanf(fptr, "%lx", (long unsigned *) &value)) != EOF) {
- if(rv != 0 && value >= 0) {
- table[value] = j++;
- } else {
- set_latin_nop(table, fb_default);
- return;
- }
- }
- }
- extern int _fallcResolveI18NPath();
- #define TBL_DATA_DIR "tbl_data"
- static void
- init_latin1tab(long *tbl, long fb_default)
- {
- FILE *fp = NULL;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_1);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin2tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_2);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin3tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_3);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin4tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_4);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin5tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_5);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin6tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_6);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin7tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_7);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin8tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_8);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_latin9tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, tab8859_9);
- fp = fopen(filename, "r");
- if(fp) {
- set_latin_tab(fp, tbl, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_latin_nop(tbl, fb_default);
- }
- }
- static void
- init_jis0201tab(long *tbl, long fb_default)
- {
- int i;
- for(i = 0; i < NRUNE; i++)
- tbl[i] = -1;
- }
/*
 * Store `default_val` into the first `to_max` slots of the table that
 * `*to_tbl` points at.  Nothing is touched when `to_max` is not positive.
 */
static void
set_cjk_nop(long **to_tbl, int to_max, long default_val)
{
    long *cell;
    int remaining;

    if (to_max <= 0)
        return;

    cell = *to_tbl;
    for (remaining = to_max; remaining > 0; remaining--)
        *cell++ = default_val;
}
- static void
- set_table(
- FILE *fptr,
- long **to_tbl,
- long *from_tbl,
- int to_max,
- long fb_default)
- {
- int i = 0;
- int j = 0;
- int rv = 0;
- long value;
- for(i = 0; i < NRUNE; i++)
- from_tbl[i] = -1;
- while((rv = fscanf(fptr, "%lx", (long unsigned *) &value)) != EOF) {
- if(rv != 0) {
- (*to_tbl)[j++] = value;
- } else {
- set_cjk_nop(to_tbl, to_max, fb_default);
- break;
- }
- }
- for(i = 0; i < to_max; i++) {
- if((value = (*to_tbl)[i]) != -1){
- from_tbl[abs(value)] = i;
- }
- }
- }
- static void
- init_jis0208tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- if((tabkuten = (long *)Xmalloc(KUTENMAX * sizeof(long))) == NULL) {
- return;
- }
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, jis0208);
- fp = fopen(filename, "r");
- if(fp) {
- set_table(fp, &tabkuten, tbl, KUTENMAX, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_cjk_nop(&tabkuten, KUTENMAX, fb_default);
- }
- }
- static void
- init_ksc5601tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- if((tabksc5601 = (long *)Xmalloc(KSCMAX * sizeof(long))) == NULL) {
- return;
- }
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, ksc5601);
- fp = fopen(filename, "r");
- if(fp) {
- set_table(fp, &tabksc5601, tbl, KSCMAX, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_cjk_nop(&tabksc5601, KSCMAX, fb_default);
- }
- }
- static void
- init_gb2312tab(long *tbl, long fb_default)
- {
- FILE *fp;
- char dirname[BUFSIZE];
- char filename[BUFSIZE];
- char *p, *q;
- if((tabgb = (long *)Xmalloc(GBMAX * sizeof(long))) == NULL) {
- return;
- }
- _fallcResolveI18NPath(dirname);
- p = dirname;
- while(p) {
- q = strchr(p, ':');
- if(q) {
- *q = '\0';
- }
- sprintf(filename, "%s/%s/%s", p, TBL_DATA_DIR, gb2312);
- fp = fopen(filename, "r");
- if(fp) {
- set_table(fp, &tabgb, tbl, GBMAX, fb_default);
- fclose(fp);
- return;
- }
- if(q) {
- p = q + 1;
- } else {
- p = q;
- }
- }
- if(!fp) {
- set_cjk_nop(&tabgb, GBMAX, fb_default);
- }
- }
- static UtfData
- make_entry(void)
- {
- UtfData tmp = (UtfData)Xmalloc(sizeof(UtfDataRec));
- bzero(tmp, sizeof(UtfDataRec));
- return tmp;
- }
- static int once = 0;
- static int
- _XlcInitUTFInfo(XLCd lcd)
- {
- if(!once) {
- int i;
- CodeSet *codeset_list = XLC_GENERIC(lcd, codeset_list);
- int codeset_num = XLC_GENERIC(lcd, codeset_num);
- UtfData pdata;
- if(!utfdata_list) {
- utfdata_list = make_entry();
- }
- pdata = utfdata_list;
- for(i=0; i < codeset_num; i++) {
- XlcCharSet charset = *codeset_list[i]->charset_list;
- while(pdata->next) {
- if(charset == pdata->charset) {
- break;
- }
- pdata = pdata->next;
- }
- if(pdata->next) {
- continue;
- } else {
- int j;
- for(j = 0; j < MAX_UTF_CHARSET; j++) {
- if(_fallcCompareISOLatin1(charset->encoding_name, default_utf_data[j].name) ||
- charset->side != default_utf_data[j].side) {
- continue;
- } else {
- pdata->initialize = default_utf_data[j].initialize;
- pdata->fromtbl = (long *)Xmalloc(NRUNE * sizeof(long));
- (*pdata->initialize)(pdata->fromtbl, default_utf_data[j].fallback_value);
- pdata->already_init = True;
- pdata->charset = charset;
- pdata->cstorune = default_utf_data[j].cstorune;
- pdata->type = default_utf_data[j].type;
- pdata->next = make_entry();
- break;
- }
- }
- }
- }
- once = 1;
- }
- return 1;
- }
- static int
- utftocs(
- XlcConv conv,
- char **from,
- int *from_left,
- char **to,
- int *to_left,
- XPointer *args,
- int num_args)
- {
- char *utfptr;
- char *bufptr;
- int utf_len, buf_len;
- long l;
- XlcCharSet tmpcharset = (XlcCharSet)NULL;
- UtfData pdata = utfdata_list;
- if (from == NULL || *from == NULL)
- return 0;
- utfptr = *from;
- bufptr = *to;
- utf_len = *from_left;
- buf_len = *to_left;
- while(utf_len > 0 && buf_len > 0) {
- char *p = utfptr;
- if((l = getutfrune(&p, &utf_len)) == -2) {
- return -1;
- } else {
- while(pdata->next) {
- long r;
- long *tbl;
- tbl = pdata->fromtbl;
- tbl += l;
- if((r = *tbl) == -1) {
- if(tmpcharset) {
- if((num_args > 0) && tmpcharset)
- *((XlcCharSet *) args[0]) = tmpcharset;
- *from_left -= utfptr - *from;
- *from = utfptr;
- *to_left -= bufptr - *to;
- *to = bufptr;
- return 0;
- } else {
- pdata = pdata->next;
- continue;
- }
- } else {
- utfptr = p;
- if(!tmpcharset) tmpcharset = pdata->charset;
- }
- if(r < 128) {
- *bufptr++ = r;
- buf_len--;
- } else {
- switch(pdata->type) {
- case N11n_ja:
- *bufptr++ = (r/100 + ' ');
- *bufptr++ = (r%100 + ' ');
- break;
- case N11n_ko:
- *bufptr++ = (r/94 + 0x21);
- *bufptr++ = (r%94 + 0x21);
- break;
- case N11n_zh:
- *bufptr++ = 0x20 + (r/100);
- *bufptr++ = 0x20 + (r%100);
- break;
- default:
- break;
- }
- buf_len -= 2;
- }
- break;
- }
- if(!tmpcharset) return (-1); /* Unknown Codepoint */
- }
- }
- }
- static int
- utf1tocs(
- XlcConv conv,
- char **from,
- int *from_left,
- char **to,
- int *to_left,
- XPointer *args,
- int num_args)
- {
- char **ptr = NULL;
- char char_ptr[UTFmax];
- int i = 0;
- unsigned long dummy = (unsigned long)0;
- if (from == NULL || *from == NULL)
- return utftocs(conv, from, from_left, to, to_left, args, num_args);
- ptr = from;
- for(i = 0; i < UTFmax; char_ptr[i++] = *(*ptr)++);
- i=0;
- while(our_mbtowc(&dummy, (char*)&char_ptr[0], i) <= 0)
- i++;
- utftocs(conv, from, &i, to, to_left, args, num_args);
- }
- static int
- ucstocs(
- XlcConv conv,
- XPointer *from,
- int *from_left,
- char **to,
- int *to_left,
- XPointer *args,
- int num_args)
- {
- wchar_t *ucsptr;
- char *bufptr;
- int ucs_len, buf_len;
- XlcCharSet tmpcharset = (XlcCharSet)NULL;
- UtfData pdata = utfdata_list;
- if (from == NULL || *from == NULL)
- return 0;
- ucsptr = (wchar_t *)*from;
- bufptr = *to;
- ucs_len = *from_left;
- buf_len = *to_left;
- while(ucs_len > 0 && buf_len > 0) {
- while(pdata->next) {
- long r;
- long *tbl;
- tbl = pdata->fromtbl;
- tbl += *ucsptr;
- if((r = *tbl) == -1) {
- if(tmpcharset) {
- if((num_args > 0) && tmpcharset)
- *((XlcCharSet *) args[0]) = tmpcharset;
- *from_left -= ucsptr - (wchar_t *)*from;
- *from = (XPointer)ucsptr;
- *to_left -= bufptr - *to;
- *to = bufptr;
- return 0;
- } else {
- pdata = pdata->next;
- continue;
- }
- } else {
- if(!tmpcharset) tmpcharset = pdata->charset;
- }
- ucsptr++;
- if(r < 128) {
- *bufptr++ = r;
- ucs_len--;
- buf_len--;
- } else {
- switch(pdata->type) {
- case N11n_ja:
- *bufptr++ = (r/100 + ' ');
- *bufptr++ = (r%100 + ' ');
- break;
- case N11n_ko:
- *bufptr++ = (r/94 + 0x21);
- *bufptr++ = (r%94 + 0x21);
- break;
- case N11n_zh:
- *bufptr++ = 0x20 + (r/100);
- *bufptr++ = 0x20 + (r%100);
- break;
- default:
- break;
- }
- ucs_len--;
- buf_len -= 2;
- }
- break;
- }
- if(!tmpcharset) return (-1); /* Unknown Codepoint */
- }
- }
- static long
- getutfrune(char **read_from, int *from_len)
- {
- int c, i;
- char str[UTFmax]; /* MB_LEN_MAX really */
- unsigned long l;
- int n;
- str[0] = '\0';
- for(i = 0; i <= UTFmax;) {
- c = **read_from;
- (*read_from)++;
- str[i++] = c;
- n = our_mbtowc(&l, str, i);
- if(n == -1)
- return(-2);
- if(n > 0) {
- *from_len -= n;
- return(l);
- }
- }
- return(-2);
- }
- static
- cstoutf(
- XlcConv conv,
- char **from,
- int *from_left,
- char **to,
- int *to_left,
- XPointer *args,
- int num_args)
- {
- XlcCharSet charset;
- char *csptr, *utfptr;
- int csstr_len, utf_len;
- int cmp_len = 0;
- void (*putrune)(
- unsigned char c,
- Rune *r
- ) = NULL;
- Rune r = (Rune)0;
- UtfData pdata = utfdata_list;
- if (from == NULL || *from == NULL)
- return 0;
- if (num_args < 1)
- return -1;
- csptr = *from;
- utfptr = *to;
- csstr_len = *from_left;
- utf_len = *to_left;
- charset = (XlcCharSet)args[0];
- cmp_len = strchr(charset->name, ':') - charset->name;
- while(pdata->next) {
- if(!_fallcNCompareISOLatin1(charset->name, pdata->charset->name, cmp_len)) {
- putrune = pdata->cstorune;
- break;
- } else {
- pdata = pdata->next;
- }
- }
- if(!putrune)
- return -1;
- while(csstr_len-- > 0 && utf_len > 0) {
- (*putrune)(*csptr++, &r);
- if(!r) {
- continue;
- }
- our_wctomb(r, &utfptr, &utf_len);
- r = 0;
- }
- *from_left -= csptr - *from;
- *from = csptr;
- *to_left -= utfptr - *to;
- *to = utfptr;
- return 0;
- }
- static
- cstoucs(
- XlcConv conv,
- char **from,
- int *from_left,
- XPointer *to,
- int *to_left,
- XPointer *args,
- int num_args)
- {
- XlcCharSet charset;
- char *csptr;
- wchar_t *ucsptr;
- int csstr_len, ucs_len;
- int cmp_len = 0;
- void (*putrune)(
- unsigned char c,
- Rune *r
- ) = NULL;
- Rune r = (Rune)0;
- UtfData pdata = utfdata_list;
- if (from == NULL || *from == NULL)
- return 0;
- if (num_args < 1)
- return -1;
- csptr = *from;
- ucsptr = (wchar_t *)*to;
- csstr_len = *from_left;
- ucs_len = *to_left;
- charset = (XlcCharSet)args[0];
- cmp_len = strchr(charset->name, ':') - charset->name;
- while(pdata->next) {
- if(!_fallcNCompareISOLatin1(charset->name, pdata->charset->name, cmp_len)) {
- putrune = pdata->cstorune;
- break;
- } else {
- pdata = pdata->next;
- }
- }
- if(!putrune)
- return -1;
- while(csstr_len-- > 0 && ucs_len > 0) {
- (*putrune)(*csptr++, &r);
- if(!r) {
- continue;
- }
- *ucsptr = (long)r;
- ucsptr++;
- ucs_len--;
- r = 0;
- }
- *from_left -= csptr - *from;
- *from = csptr;
- *to_left -= ucsptr - (wchar_t *)*to;
- *to = (XPointer)ucsptr;
- return 0;
- }
- static void
- our_wctomb(Rune r, char **utfptr, int *utf_len)
- {
- long l = (long)r;
- if(!utfptr || !*utfptr)
- return; /* no shift states */
- if(l & ~Wchar2) {
- if(l & ~Wchar4) {
- if(l & ~Wchar5) {
- /* 6 bytes */
- *(*utfptr)++ = T6 | ((l >> 5*Bitx) & Mask6);
- *(*utfptr)++ = Tx | ((l >> 4*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 3*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 2*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 1*Bitx) & Maskx);
- *(*utfptr)++ = Tx | (l & Maskx);
- *utf_len -= 6;
- return;
- }
- /* 5 bytes */
- *(*utfptr)++ = T5 | (l >> 4*Bitx);
- *(*utfptr)++ = Tx | ((l >> 3*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 2*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 1*Bitx) & Maskx);
- *(*utfptr)++ = Tx | (l & Maskx);
- *utf_len -= 5;
- return;
- }
- if(l & ~Wchar3) {
- /* 4 bytes */
- *(*utfptr)++ = T4 | (l >> 3*Bitx);
- *(*utfptr)++ = Tx | ((l >> 2*Bitx) & Maskx);
- *(*utfptr)++ = Tx | ((l >> 1*Bitx) & Maskx);
- *(*utfptr)++ = Tx | (l & Maskx);
- *utf_len -= 4;
- return;
- }
- /* 3 bytes */
- *(*utfptr)++ = T3 | (l >> 2*Bitx);
- *(*utfptr)++ = Tx | ((l >> 1*Bitx) & Maskx);
- *(*utfptr)++ = Tx | (l & Maskx);
- *utf_len -= 3;
- return;
- }
- if(l & ~Wchar1) {
- /* 2 bytes */
- *(*utfptr)++ = T2 | (l >> 1*Bitx);
- *(*utfptr)++ = Tx | (l & Maskx);
- *utf_len -= 2;
- return;
- }
- /* 1 byte */
- *(*utfptr)++ = T1 | l;
- *utf_len -= 1;
- return;
- }
- static void
- latin2rune(unsigned char c, Rune *r)
- {
- *r = (Rune)c;
- return;
- }
- static void
- ksc2rune(unsigned char c, Rune *r)
- {
- static enum { init, cs1last} state = init;
- static int korean646 = 1; /* fixed to 1 for now. */
- static int lastc;
- unsigned char ch = (c|0x80); /* XXX */
- int n;
- long l;
- switch(state)
- {
- case init:
- if (ch < 128){
- if(korean646 && (ch=='\\')){
- emit(0x20A9);
- } else {
- emit(ch);
- }
- }else{
- lastc = ch;
- state = cs1last;
- }
- return;
- case cs1last: /* 2nd byte of codeset 1 (KSC 5601) */
- n = ((lastc&0x7f)-33)*94 + (ch&0x7f)-33;
- if((l = tabksc5601[n]) == 0){
- emit(BADMAP);
- } else {
- emit(l);
- }
- state = init;
- return;
- }
- }
- static void
- jis02012rune(unsigned char c, Rune *r)
- {
- /* To Be Implemented */
- }
- static void
- gb2rune(unsigned char c, Rune *r)
- {
- static enum { state0, state1 } state = state0;
- static int lastc;
- long n, ch;
- unsigned char ch1 = (c|0x80); /* XXX */
- switch(state)
- {
- case state0: /* idle state */
- if(ch1 >= 0xA1){
- lastc = ch1;
- state = state1;
- return;
- }
- emit(ch1);
- return;
- case state1: /* seen a font spec */
- if(ch1 >= 0xA1)
- n = (lastc-0xA0)*100 + (ch1-0xA0);
- else {
- emit(BADMAP);
- state = state0;
- return;
- }
- ch = tabgb[n];
- if(ch < 0){
- emit(BADMAP);
- } else
- emit(ch);
- state = state0;
- }
- }
- static void
- jis02082rune(unsigned char c, Rune *r)
- {
- static enum { state0, state1} state = state0;
- static int lastc;
- unsigned char ch = (c|0x80); /* XXX */
- int n, again;
- long l;
- do {
- again = 0;
- switch(state)
- {
- case state0: /* idle state */
- lastc = ch;
- state = state1;
- return;
- case state1: /* two part char */
- if((lastc&0x80) != (ch&0x80)){
- emit(lastc);
- state = state0;
- again += 1;
- }
- if(CANS2J(lastc, ch)){
- int h = lastc, l = ch;
- S2J(h, l);
- n = h*100 + l - 3232;
- } else
- n = (lastc&0x7F)*100 + (ch&0x7f) - 3232; /* kuten */
- if((l = tabkuten[n]) == -1){
- emit(BADMAP);
- } else {
- if(l < 0){
- l = -l;
- }
- emit(l);
- }
- state = state0;
- }
- } while (again == 1);
- }
- static int
- our_mbtowc(unsigned long *p, char *s, size_t n)
- {
- unsigned char *us;
- int c0, c1, c2, c3, c4, c5;
- unsigned long wc;
- if(s == 0)
- return 0; /* no shift states */
- if(n < 1)
- return -2; /* bad length */
- us = (unsigned char*)s;
- c0 = us[0];
- if(c0 >= T3) {
- if(n < 3)
- return -2;
- c1 = us[1] ^ Tx;
- c2 = us[2] ^ Tx;
- if((c1|c2) & T2) {
- errno = EILSEQ;
- return -1;
- }
- if(c0 >= T5) {
- if(n < 5)
- return -2;
- c3 = us[3] ^ Tx;
- c4 = us[4] ^ Tx;
- if((c3|c4) & T2) {
- errno = EILSEQ;
- return -1;
- }
- if(c0 >= T6) {
- /* 6 bytes */
- if(n < 6)
- return -2;
- c5 = us[5] ^ Tx;
- if(c5 & T2) {
- errno = EILSEQ;
- return -1;
- }
- wc = ((((((((((c0 & Mask6) << Bitx) |
- c1) << Bitx) | c2) << Bitx) |
- c3) << Bitx) | c4) << Bitx) | c5;
- if(wc <= Wchar5) {
- errno = EILSEQ;
- return -1;
- }
- *p = wc;
- return 6;
- }
- /* 5 bytes */
- wc = ((((((((c0 & Mask5) << Bitx) |
- c1) << Bitx) | c2) << Bitx) |
- c3) << Bitx) | c4;
- if(wc <= Wchar4) {
- errno = EILSEQ;
- return -1;
- }
- *p = wc;
- return 5;
- }
- if(c0 >= T4) {
- /* 4 bytes */
- if(n < 4)
- return -2;
- c3 = us[3] ^ Tx;
- if(c3 & T2) {
- errno = EILSEQ;
- return -1;
- }
- wc = ((((((c0 & Mask4) << Bitx) |
- c1) << Bitx) | c2) << Bitx) |
- c3;
- if(wc <= Wchar3) {
- errno = EILSEQ;
- return -1;
- }
- *p = wc;
- return 4;
- }
- /* 3 bytes */
- wc = ((((c0 & Mask3) << Bitx) |
- c1) << Bitx) | c2;
- if(wc <= Wchar2) {
- errno = EILSEQ;
- return -1;
- }
- *p = wc;
- return 3;
- }
- if(c0 >= T2) {
- /* 2 bytes */
- if(n < 2)
- return -2;
- c1 = us[1] ^ Tx;
- if(c1 & T2) {
- errno = EILSEQ;
- return -1;
- }
- wc = ((c0 & Mask2) << Bitx) |
- c1;
- if(wc <= Wchar1) {
- errno = EILSEQ;
- return -1;
- }
- *p = wc;
- return 2;
- }
- /* 1 byte */
- if(c0 >= Tx) {
- errno = EILSEQ;
- return -1;
- }
- *p = c0;
- return 1;
- }
- static void
- close_converter(XlcConv conv)
- {
- Xfree((char *) conv);
- }
- static XlcConv
- create_conv(XLCd lcd, XlcConvMethods methods)
- {
- XlcConv conv;
- conv = (XlcConv) Xmalloc(sizeof(XlcConvRec));
- if (conv == (XlcConv) NULL)
- return (XlcConv) NULL;
- conv->methods = methods;
- conv->state = NULL;
- _XlcInitUTFInfo(lcd);
- return conv;
- /* if an error occurs somewhere
- close_converter(conv);
- return (XlcConv) NULL;
- */
- }
- static XlcConvMethodsRec mbtocs_methods = {
- close_converter,
- utf1tocs,
- NULL
- };
- static XlcConv
- open_mbtocs(XLCd from_lcd, char *from, XLCd to_lcd, char *to)
- {
- return create_conv(from_lcd, &mbtocs_methods);
- }
- static XlcConvMethodsRec mbstocs_methods = {
- close_converter,
- utftocs,
- NULL
- };
- static XlcConv
- open_mbstocs(XLCd from_lcd, char *from, XLCd to_lcd, char *to)
- {
- return create_conv(from_lcd, &mbstocs_methods);
- }
- static XlcConvMethodsRec wcstocs_methods = {
- close_converter,
- ucstocs,
- NULL
- };
- static XlcConv
- open_wcstocs(XLCd from_lcd, char *from, XLCd to_lcd, char *to)
- {
- return create_conv(from_lcd, &wcstocs_methods);
- }
- static XlcConvMethodsRec cstombs_methods = {
- close_converter,
- cstoutf,
- NULL
- };
- static XlcConv
- open_cstombs(XLCd from_lcd, char *from, XLCd to_lcd, char *to)
- {
- return create_conv(from_lcd, &cstombs_methods);
- }
- static XlcConvMethodsRec cstowcs_methods = {
- close_converter,
- cstoucs,
- NULL
- };
- static XlcConv
- open_cstowcs(XLCd from_lcd, char *from, XLCd to_lcd, char *to)
- {
- return create_conv(from_lcd, &cstowcs_methods);
- }
- XLCd
- _fallcUtfLoader(char *name)
- {
- XLCd lcd;
- lcd = _fallcCreateLC(name, _fallcGenericMethods);
- if (lcd == (XLCd) NULL)
- return lcd;
- if ((_fallcCompareISOLatin1(XLC_PUBLIC_PART(lcd)->codeset, "utf"))) {
- _fallcDestroyLC(lcd);
- return (XLCd) NULL;
- }
- _fallcSetConverter(lcd, XlcNMultiByte, lcd, XlcNCharSet, open_mbstocs);
- _fallcSetConverter(lcd, XlcNWideChar, lcd, XlcNCharSet, open_wcstocs);
- _fallcSetConverter(lcd, XlcNMultiByte, lcd, XlcNChar, open_mbtocs);
- _fallcSetConverter(lcd, XlcNCharSet, lcd, XlcNMultiByte, open_cstombs);
- _fallcSetConverter(lcd, XlcNCharSet, lcd, XlcNWideChar, open_cstowcs);
- return lcd;
- }
|