/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 1994 by Sun Microsystems, Inc.
 */
24*16d86563SAlexander Pyhalov
25*16d86563SAlexander Pyhalov
26*16d86563SAlexander Pyhalov #include <stdlib.h>
27*16d86563SAlexander Pyhalov #include <errno.h>
28*16d86563SAlexander Pyhalov #include "ktable.h"
29*16d86563SAlexander Pyhalov #include "utf_euc.h"
30*16d86563SAlexander Pyhalov
31*16d86563SAlexander Pyhalov
/**** _ I C V _ O P E N ****/
33*16d86563SAlexander Pyhalov
_icv_open()34*16d86563SAlexander Pyhalov void* _icv_open()
35*16d86563SAlexander Pyhalov {
36*16d86563SAlexander Pyhalov _conv_desc* cd = (_conv_desc*)malloc(sizeof(_conv_desc));
37*16d86563SAlexander Pyhalov
38*16d86563SAlexander Pyhalov if (cd == (_conv_desc*)NULL)
39*16d86563SAlexander Pyhalov {
40*16d86563SAlexander Pyhalov errno = ENOMEM;
41*16d86563SAlexander Pyhalov return((void*)-1);
42*16d86563SAlexander Pyhalov }
43*16d86563SAlexander Pyhalov
44*16d86563SAlexander Pyhalov RESET_CONV_DESC();
45*16d86563SAlexander Pyhalov
46*16d86563SAlexander Pyhalov return((void*)cd);
47*16d86563SAlexander Pyhalov } /* end of int _icv_open(). */
48*16d86563SAlexander Pyhalov
49*16d86563SAlexander Pyhalov
/**** _ I C V _ C L O S E ****/
51*16d86563SAlexander Pyhalov
/*
 * Release a conversion descriptor.
 *
 * A null descriptor is rejected by setting errno to EBADF; nothing is
 * freed in that case.  The function has no return value.
 */
void _icv_close(_conv_desc* cd)
{
	if (cd == NULL)
	{
		errno = EBADF;
		return;
	}

	free((void*)cd);
}  /* end of void _icv_close(_conv_desc*). */
59*16d86563SAlexander Pyhalov
60*16d86563SAlexander Pyhalov
/**** _ I C V _ I C O N V ****/
62*16d86563SAlexander Pyhalov
/*
 * Convert UTF-8 input into the 2-byte target encoding described by
 * utf82euc_tbl, composing conjoining Hangul jamo (leading consonant, vowel,
 * trailing consonant) into a single output code through the state kept
 * in cd.
 *
 * Parameters:
 *	cd		conversion descriptor; a null cd fails with EBADF.
 *	inbuf		in/out: address of the input cursor.  A null inbuf
 *			or null *inbuf only resets the descriptor state and
 *			returns 0.
 *	inbufleft	in/out: number of input bytes remaining.
 *	outbuf		in/out: address of the output cursor.
 *	outbufleft	in/out: number of free output bytes remaining.
 *
 * Returns the number of NON_IDENTICAL replacement bytes written, or
 * (size_t)-1 with errno set to
 *	EBADF	cd is null,
 *	EINVAL	the input ends in the middle of a multi-byte sequence,
 *	E2BIG	the output buffer is full.
 * Whenever the loop is entered (i.e. except on the EBADF and reset-only
 * paths) the four in/out arguments are updated to describe what was
 * consumed and produced, including on EINVAL and E2BIG.
 *
 * The locals cd, ib, ob, ibtail, obtail and ret_val keep their names and
 * PROCESS_PRIOR_CVC() is only ever invoked directly inside the while loop:
 * the macro is defined outside this file and presumably refers to those
 * names and may `break` out of the loop -- TODO confirm against utf_euc.h.
 */
size_t _icv_iconv(_conv_desc* cd, char** inbuf, size_t* inbufleft,
			char** outbuf, size_t* outbufleft)
{
	/* Not called directly here; presumably used by PROCESS_PRIOR_CVC(). */
	extern unsigned short _johap_to_wansung(unsigned short, unsigned short,
						unsigned short);
	size_t		ret_val = 0;
	unsigned char*	ib;
	unsigned char*	ob;
	unsigned char*	ibtail;
	unsigned char*	obtail;

	if (!cd)
	{
		errno = EBADF;
		return((size_t)-1);
	}

	if (!inbuf || !(*inbuf))
	{
		RESET_CONV_DESC();
		return((size_t)0);
	}

	ib = (unsigned char*)*inbuf;
	ob = (unsigned char*)*outbuf;
	ibtail = ib + *inbufleft;
	obtail = ob + *outbufleft;

	while (ib < ibtail)
	{
		if (!(*ib & 0x80))		/* 7 bits */
		{
			PROCESS_PRIOR_CVC();

			if (ob >= obtail)
			{
				errno = E2BIG;
				ret_val = (size_t)-1;
				break;
			}
			*ob++ = *ib++;
		}
		else if ((*ib & 0xF0) == 0xE0)	/* 16 bits */
		{
			unsigned long	utf;

			if ((ibtail - ib) < 3)
			{
				errno = EINVAL;
				ret_val = (size_t)-1;
				break;
			}

			/* Pack the three raw UTF-8 bytes into one key. */
			utf = ((unsigned long)(*ib) << 16) |
			      ((unsigned long)(*(ib + 1)) << 8) |
			      (unsigned long)(*(ib + 2));

			if (utf == 0xE1859F ||
			    (utf >= 0xE18480 && utf <= 0xE18492))  /* Ci */
			{
				/*
				 * Leading consonant: U+1100..U+1112, or the
				 * filler U+115F.  It always starts a new
				 * syllable, so flush whatever is pending.
				 */
				PROCESS_PRIOR_CVC();

				cd->ci = (utf == 0xE1859F) ? CVC_FILL
							   : utf - 0xE18480;
				cd->prev_state = CI;
			}
			else if (utf == 0xE185A0 ||
				 (utf >= 0xE185A1 && utf <= 0xE185B5))  /* V */
			{
				/*
				 * Vowel: U+1161..U+1175, or the filler
				 * U+1160.  It joins the pending syllable
				 * only when nothing or just a leading
				 * consonant has been seen so far.
				 */
				if (cd->prev_state != E && cd->prev_state != CI)
				{
					PROCESS_PRIOR_CVC();
				}

				cd->v = (utf == 0xE185A0) ? CVC_FILL
							  : utf - 0xE185A1;
				cd->prev_state = V;
			}
			else if ((utf >= 0xE186A8 && utf <= 0xE186BF) ||
				 (utf >= 0xE18780 && utf <= 0xE18782))  /* Cf */
			{
				/*
				 * Trailing consonant: U+11A8..U+11C2, split
				 * over two UTF-8 lead-byte pages.  The two
				 * subtrahends map both pages onto one
				 * contiguous index range, 2..28.
				 */
				if (cd->prev_state != E && cd->prev_state != V)
				{
					PROCESS_PRIOR_CVC();
				}

				cd->cf = utf - ((utf >= 0xE18780) ? 0xE18766
								  : 0xE186A6);
				cd->prev_state = CF;

				/* A trailing consonant completes the syllable. */
				PROCESS_PRIOR_CVC();
			}
			else if (utf >= 0xE082A1 && utf <= 0xEFBFA6)
			{
				int	h, l;
				int	i = 0;

				PROCESS_PRIOR_CVC();

				if ((obtail - ob) < 2)
				{
					errno = E2BIG;
					ret_val = (size_t)-1;
					break;
				}

				/*
				 * Binary search of utf82euc_tbl on the packed
				 * UTF-8 key.  Both end points are probed on
				 * every pass, so h is used as an inclusive
				 * index.
				 * NOTE(review): this reads
				 * utf82euc_tbl[MAX_U2E_NUM]; confirm in
				 * ktable.h that MAX_U2E_NUM is the last valid
				 * index and not the element count.
				 */
				for (l = 0, h = MAX_U2E_NUM; l < h; )
				{
					i = (l + h) / 2;
					if (utf82euc_tbl[i].utf8 == utf)
						break;
					else if (utf82euc_tbl[l].utf8 == utf)
					{
						i = l;
						break;
					}
					else if (utf82euc_tbl[h].utf8 == utf)
					{
						i = h;
						break;
					}
					else if (utf82euc_tbl[i].utf8 < utf)
						l = i + 1;
					else
						h = i - 1;
				}

				if (utf82euc_tbl[i].utf8 != utf)
				{
					/* Let's assume the code is
					 * non-identical. */
					*ob++ = NON_IDENTICAL;
					*ob++ = NON_IDENTICAL;
					ret_val += 2;
				}
				else
				{
					*ob++ = (char)((utf82euc_tbl[i].code
							>> 8) & 0xFF);
					*ob++ = (char)(utf82euc_tbl[i].code &
							0xFF);
				}
			}
			else
			{
				PROCESS_PRIOR_CVC();

				/* Let's assume the code is non-identical. */
				if ((obtail - ob) < 2)
				{
					errno = E2BIG;
					ret_val = (size_t)-1;
					break;
				}
				*ob++ = NON_IDENTICAL;
				*ob++ = NON_IDENTICAL;
				ret_val += 2;
			}
			ib += 3;
		}
		else  /* 11, 21, 26 & 31 bits codes won't be able to convert. */
		{
			int	in_len;		/* bytes in the input sequence */
			int	out_len;	/* replacement bytes to emit */

			PROCESS_PRIOR_CVC();

			/*
			 * The 3-byte (0xE0) lead byte is handled by the
			 * branch above and can never reach this point.
			 */
			if ((*ib & 0xE0) == 0xC0)		/* 11 */
				in_len = 2;
			else if ((*ib & 0xF8) == 0xF0)		/* 21 */
				in_len = 4;
			else if ((*ib & 0xFC) == 0xF8)		/* 26 */
				in_len = 5;
			else if ((*ib & 0xFE) == 0xFC)		/* 31 */
				in_len = 6;
			else				/* Illegal sequence. */
				in_len = 1;

			if ((ibtail - ib) < in_len)
			{
				errno = EINVAL;
				ret_val = (size_t)-1;
				break;
			}

			/* Let's assume the code is non-identical. */
			out_len = (in_len > 2) ? 2 : 1;

			/*
			 * Check the output space BEFORE consuming the input.
			 * Otherwise an E2BIG return would report the sequence
			 * as consumed although no replacement was written, and
			 * the caller's retry would silently drop it.
			 */
			if ((obtail - ob) < out_len)
			{
				errno = E2BIG;
				ret_val = (size_t)-1;
				break;
			}

			ib += in_len;
			*ob++ = NON_IDENTICAL;
			if (out_len > 1)
				*ob++ = NON_IDENTICAL;
			ret_val += out_len;
		}
	}

	/* Report progress to the caller, on success and on error alike. */
	*inbuf = (char*)ib;
	*inbufleft = ibtail - ib;
	*outbuf = (char*)ob;
	*outbufleft = obtail - ob;

	return(ret_val);
}  /* end of size_t _icv_iconv(_conv_desc*, char**, size_t*, char**, size_t*).*/
266