1*16d86563SAlexander Pyhalov /*
2*16d86563SAlexander Pyhalov  * CDDL HEADER START
3*16d86563SAlexander Pyhalov  *
4*16d86563SAlexander Pyhalov  * The contents of this file are subject to the terms of the
5*16d86563SAlexander Pyhalov  * Common Development and Distribution License (the "License").
6*16d86563SAlexander Pyhalov  * You may not use this file except in compliance with the License.
7*16d86563SAlexander Pyhalov  *
8*16d86563SAlexander Pyhalov  * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE
9*16d86563SAlexander Pyhalov  * or http://www.opensolaris.org/os/licensing.
10*16d86563SAlexander Pyhalov  * See the License for the specific language governing permissions
11*16d86563SAlexander Pyhalov  * and limitations under the License.
12*16d86563SAlexander Pyhalov  *
13*16d86563SAlexander Pyhalov  * When distributing Covered Code, include this CDDL HEADER in each
14*16d86563SAlexander Pyhalov  * file and include the License file at src/OPENSOLARIS.LICENSE.
15*16d86563SAlexander Pyhalov  * If applicable, add the following below this CDDL HEADER, with the
16*16d86563SAlexander Pyhalov  * fields enclosed by brackets "[]" replaced with your own identifying
17*16d86563SAlexander Pyhalov  * information: Portions Copyright [yyyy] [name of copyright owner]
18*16d86563SAlexander Pyhalov  *
19*16d86563SAlexander Pyhalov  * CDDL HEADER END
20*16d86563SAlexander Pyhalov  */
21*16d86563SAlexander Pyhalov /*
22*16d86563SAlexander Pyhalov  * Copyright (c) 1994 by Sun Microsystems, Inc.
23*16d86563SAlexander Pyhalov  */
24*16d86563SAlexander Pyhalov 
25*16d86563SAlexander Pyhalov 
26*16d86563SAlexander Pyhalov #include <stdlib.h>
27*16d86563SAlexander Pyhalov #include <errno.h>
28*16d86563SAlexander Pyhalov #include "ktable.h"
29*16d86563SAlexander Pyhalov #include "utf_nbyte.h"
30*16d86563SAlexander Pyhalov 
31*16d86563SAlexander Pyhalov 
32*16d86563SAlexander Pyhalov /****  _ I C V _ O P E N  ****/
33*16d86563SAlexander Pyhalov 
_icv_open()34*16d86563SAlexander Pyhalov void* _icv_open()
35*16d86563SAlexander Pyhalov {
36*16d86563SAlexander Pyhalov 	_conv_desc* cd = (_conv_desc*)malloc(sizeof(_conv_desc));
37*16d86563SAlexander Pyhalov 
38*16d86563SAlexander Pyhalov 	if (cd == (_conv_desc*)NULL)
39*16d86563SAlexander Pyhalov 	{
40*16d86563SAlexander Pyhalov 		errno = ENOMEM;
41*16d86563SAlexander Pyhalov 		return((void*)-1);
42*16d86563SAlexander Pyhalov 	}
43*16d86563SAlexander Pyhalov 
44*16d86563SAlexander Pyhalov 	RESET_CONV_DESC();
45*16d86563SAlexander Pyhalov 	cd->state = ASCII;
46*16d86563SAlexander Pyhalov 
47*16d86563SAlexander Pyhalov 	return((void*)cd);
48*16d86563SAlexander Pyhalov }  /* end of int _icv_open(). */
49*16d86563SAlexander Pyhalov 
50*16d86563SAlexander Pyhalov 
51*16d86563SAlexander Pyhalov /****  _ I C V _ C L O S E  ****/
52*16d86563SAlexander Pyhalov 
/*
 * _icv_close() - release a conversion descriptor.
 *
 * A NULL descriptor is rejected by setting errno to EBADF; otherwise
 * the descriptor is handed to free().  Nothing is returned.
 */
void _icv_close(_conv_desc* cd)
{
	if (cd == NULL)
	{
		errno = EBADF;
		return;
	}

	free(cd);
}  /* end of void _icv_close(_conv_desc*). */
60*16d86563SAlexander Pyhalov 
61*16d86563SAlexander Pyhalov 
62*16d86563SAlexander Pyhalov /****  _ I C V _ I C O N V  ****/
63*16d86563SAlexander Pyhalov 
/*
 * _icv_iconv() - convert a run of UTF-8 input bytes.
 *
 * cd		conversion descriptor; NULL fails with errno = EBADF.
 * inbuf	in/out: address of the next unread input byte.  If inbuf
 *		or *inbuf is NULL the descriptor is reset
 *		(RESET_CONV_DESC(), state = ASCII) and 0 is returned
 *		without touching the output buffer.
 * inbufleft	in/out: number of unread input bytes.
 * outbuf	in/out: address of the next free output byte.
 * outbufleft	in/out: number of free output bytes.
 *
 * Input is handled one UTF-8 sequence at a time:
 *   - 7-bit bytes are copied through, preceded by SI when the
 *     descriptor is in WANSUNG state;
 *   - 3-byte sequences for the conjoining jamo U+1100..U+1112, U+115F,
 *     U+1160..U+1175, U+11A8..U+11C2 are recorded in cd->ci / cd->v /
 *     cd->cf; the bytes for them are produced by PROCESS_PRIOR_CVC(),
 *     which is defined outside this file;
 *   - every other sequence is replaced by one or two NON_IDENTICAL
 *     bytes.
 *
 * Returns the number of NON_IDENTICAL bytes written by this function
 * (PROCESS_PRIOR_CVC() may also adjust the count - not visible here),
 * or (size_t)-1 with errno = E2BIG when the output buffer is too small
 * or errno = EINVAL when the input ends inside a multi-byte sequence.
 * On every return past the two argument checks the four in/out
 * arguments are updated; on error *inbuf is left at the sequence that
 * could not be processed.
 *
 * NOTE(review): the reset path writes no SI even if the descriptor is
 * still in WANSUNG state - confirm whether callers rely on that.
 */
size_t _icv_iconv(_conv_desc* cd, char** inbuf, size_t* inbufleft,
			char** outbuf, size_t* outbufleft)
{
	/*
	 * Both helpers are defined further down in this file.  These
	 * prototypes and the local names below (cd, ib, ob, ibtail, obtail,
	 * ret_val) are kept exactly as they were: PROCESS_PRIOR_CVC() is
	 * an argument-less macro and presumably refers to some of them.
	 */
	void		echo_vowel(char*, int*), echo_consonant(char*, int*);
	size_t		ret_val = 0;
	unsigned char*	ib;
	unsigned char*	ob;
	unsigned char*	ibtail;
	unsigned char*	obtail;

	if (!cd)
	{
		errno = EBADF;
		return((size_t)-1);
	}

	if (!inbuf || !(*inbuf))
	{
		RESET_CONV_DESC();
		cd->state = ASCII;
		return((size_t)0);
	}

	ib = (unsigned char*)*inbuf;
	ob = (unsigned char*)*outbuf;
	ibtail = ib + *inbufleft;
	obtail = ob + *outbufleft;

	/*
	 * PROCESS_PRIOR_CVC() must stay a direct statement of this loop:
	 * presumably it may "break" out of it on an output-space error -
	 * TODO confirm against the macro definition.
	 */
	while (ib < ibtail)
	{
		if (!(*ib & 0x80))		/* 7 bits */
		{
			PROCESS_PRIOR_CVC();

			/* In WANSUNG state an SI byte goes out first. */
			if ((obtail - ob) < (cd->state == WANSUNG ? 2 : 1))
			{
				errno = E2BIG;
				ret_val = (size_t)-1;
				break;
			}
			if (cd->state == WANSUNG)
			{
				*ob++ = SI;
				cd->state = ASCII;
			}
			*ob++ = *ib++;
		}
		else if ((*ib & 0xF0) == 0xE0)	/* 16 bits */
		{
			unsigned long	utf;

			if ((ibtail - ib) < 3)
			{
				errno = EINVAL;
				ret_val = (size_t)-1;
				break;
			}

			/* Pack the three raw bytes so ranges compare as one value. */
			utf = ((unsigned long)(*ib) << 16) |
			      ((unsigned long)(*(ib + 1)) << 8) |
			      (unsigned long)(*(ib + 2));
			if (utf == 0xE1859F ||
			    (utf >= 0xE18480 && utf <= 0xE18492))  /* Ci */
			{
				/* U+115F (filler) or U+1100..U+1112 -> ci 0..18. */
				PROCESS_PRIOR_CVC();

				cd->ci = (utf == 0xE1859F) ? CVC_FILL
							   : utf - 0xE18480;
				cd->prev_state = CI;
			}
			else if (utf == 0xE185A0 ||
				 (utf >= 0xE185A1 && utf <= 0xE185B5))  /* V */
			{
				/* U+1160 (filler) or U+1161..U+1175 -> v 0..20. */
				if (cd->prev_state != E && cd->prev_state != CI)
					PROCESS_PRIOR_CVC();

				cd->v = (utf == 0xE185A0) ? CVC_FILL
							  : utf - 0xE185A1;
				cd->prev_state = V;
			}
			else if ((utf >= 0xE186A8 && utf <= 0xE186BF) ||
				 (utf >= 0xE18780 && utf <= 0xE18782))  /* Cf */
			{
				if (cd->prev_state != E && cd->prev_state != V)
					PROCESS_PRIOR_CVC();

				/*
				 * U+11A8..U+11BF -> 2..25 and U+11C0..U+11C2
				 * -> 26..28: the two byte ranges are joined
				 * into one contiguous index.
				 */
				cd->cf = utf - ((utf >= 0xE18780) ? 0xE18766
								 : 0xE186A6);
				cd->prev_state = CF;

				/*
				 * NOTE(review): if this call leaves the loop,
				 * ib has not been advanced although cd->cf is
				 * already set - confirm that a retry does not
				 * emit the final consonant twice.
				 */
				PROCESS_PRIOR_CVC();
			}
			else
			{
				PROCESS_PRIOR_CVC();

				/* Let's assume the code is non-identical. */
				if ((obtail - ob) < 2)
				{
					errno = E2BIG;
					ret_val = (size_t)-1;
					break;
				}
				*ob++ = NON_IDENTICAL;
				*ob++ = NON_IDENTICAL;
				ret_val += 2;
			}
			ib += 3;
		}
		else  /* 11, 21, 26 & 31 bits codes won't be able to convert. */
		{
			int	seq_len;	/* input bytes in this sequence */
			int	fill_len;	/* NON_IDENTICAL bytes to write */

			PROCESS_PRIOR_CVC();

			/*
			 * 0xE0..0xEF lead bytes never get here (handled by
			 * the 16 bits branch above), so they are not tested.
			 */
			if ((*ib & 0xE0) == 0xC0)  /* 11 */
				seq_len = 2;
			else if ((*ib & 0xF8) == 0xF0)  /* 21 */
				seq_len = 4;
			else if ((*ib & 0xFC) == 0xF8)  /* 26 */
				seq_len = 5;
			else if ((*ib & 0xFE) == 0xFC)  /* 31 */
				seq_len = 6;
			else  /* Illegal sequence. */
				seq_len = 1;

			if ((ibtail - ib) < seq_len)
			{
				errno = EINVAL;
				ret_val = (size_t)-1;
				break;
			}

			/* Let's assume the code is non-identical. */
			fill_len = (seq_len > 2) ? 2 : 1;
			if ((obtail - ob) < fill_len)
			{
				errno = E2BIG;
				ret_val = (size_t)-1;
				break;
			}

			/*
			 * Consume the input only once the replacement is
			 * known to fit, so that an E2BIG return leaves *inbuf
			 * on this sequence and the caller can retry it.
			 */
			ib += seq_len;
			*ob++ = NON_IDENTICAL;
			if (fill_len > 1)
				*ob++ = NON_IDENTICAL;
			ret_val += fill_len;
		}
	}

	*inbuf = (char*)ib;
	*inbufleft = ibtail - ib;
	*outbuf = (char*)ob;
	*outbufleft = obtail - ob;

	return(ret_val);
}  /* end of size_t _icv_iconv(_conv_desc*, char**, size_t*, char**, size_t*).*/
222*16d86563SAlexander Pyhalov 
223*16d86563SAlexander Pyhalov 
224*16d86563SAlexander Pyhalov /****  E C H O _ V O W E L  ****/
225*16d86563SAlexander Pyhalov 
/*
 * echo_vowel() - split a compound vowel code into its two components.
 *
 * c	buffer holding the vowel code at index *i; when the code is a
 *	compound, c[*i] and c[*i + 1] are overwritten with the two
 *	component codes, so the caller must provide room for one more
 *	byte.
 * i	in/out index into c; advanced by 2 after a split, by 1 when the
 *	code at c[*i] is not one of the compounds listed below (the
 *	buffer is then left untouched).
 */
void echo_vowel(char* c,  int* i)
{
	int	pos = *i;
	char	head;
	char	tail;

	switch (c[pos])
	{
	case 'm':			/* _|_|- */
		head = 'l';		/* _|_ */
		tail = 'b';		/* |- */
		break;
	case 'n':			/* _|_H */
		head = 'l';		/* _|_ */
		tail = 'c';		/* H */
		break;
	case 'o':			/* _|_| */
		head = 'l';		/* _|_ */
		tail = '|';		/* | */
		break;
	case 't':			/* T-| */
		head = 's';		/* T */
		tail = 'f';		/* -| */
		break;
	case 'u':			/* T-|| */
		head = 's';		/* T */
		tail = 'g';		/* -|| */
		break;
	case 'v':			/* T| */
		head = 's';		/* T */
		tail = '|';		/* | */
		break;
	case '{':			/* _| */
		head = 'z';		/* __ */
		tail = '|';		/* | */
		break;
	default:
		/* Not a compound: just step over the code. */
		*i = pos + 1;
		return;
	}

	c[pos] = head;
	c[pos + 1] = tail;
	*i = pos + 2;
}  /* end of void echo_vowel(char*, int*). */
266*16d86563SAlexander Pyhalov 
267*16d86563SAlexander Pyhalov 
268*16d86563SAlexander Pyhalov /****  E C H O _ C O N S O N A N T  ****/
269*16d86563SAlexander Pyhalov 
/*
 * echo_consonant() - split a consonant-cluster code into its two
 * component consonants.
 *
 * c	buffer holding the consonant code at index *i; when the code is
 *	a cluster, c[*i] and c[*i + 1] are overwritten with the two
 *	component codes, so the caller must provide room for one more
 *	byte.
 * i	in/out index into c; advanced by 2 after a split, by 1 when the
 *	code at c[*i] is not one of the clusters listed below (the
 *	buffer is then left untouched).
 */
void echo_consonant(char* c,  int* i)
{
	int	pos = *i;
	char	head;
	char	tail;

	switch (c[pos])
	{
	case 'C':			/* gs */
		head = 'A';		/* g */
		tail = 'U';		/* s */
		break;
	case 'E':			/* nj */
		head = 'D';		/* n */
		tail = 'X';		/* j */
		break;
	case 'F':			/* nh */
		head = 'D';		/* n */
		tail = '^';		/* h */
		break;
	case 'J':			/* rg */
		head = 'I';		/* r */
		tail = 'A';		/* g */
		break;
	case 'K':			/* rm */
		head = 'I';		/* r */
		tail = 'Q';		/* m */
		break;
	case 'L':			/* rb */
		head = 'I';		/* r */
		tail = 'R';		/* b */
		break;
	case 'M':			/* rs */
		head = 'I';		/* r */
		tail = 'U';		/* s */
		break;
	case 'N':			/* rt */
		head = 'I';		/* r */
		tail = '\\';		/* t */
		break;
	case 'O':			/* rp */
		head = 'I';		/* r */
		tail = ']';		/* p */
		break;
	case 'P':			/* rh */
		head = 'I';		/* r */
		tail = '^';		/* h */
		break;
	case 'T':			/* bs */
		head = 'R';		/* b */
		tail = 'U';		/* s */
		break;
	default:
		/* Not a cluster: just step over the code. */
		*i = pos + 1;
		return;
	}

	c[pos] = head;
	c[pos + 1] = tail;
	*i = pos + 2;
}  /* end of void echo_consonant(char*, int*). */
330