1*16d86563SAlexander Pyhalov /*
2*16d86563SAlexander Pyhalov  * CDDL HEADER START
3*16d86563SAlexander Pyhalov  *
4*16d86563SAlexander Pyhalov  * The contents of this file are subject to the terms of the
5*16d86563SAlexander Pyhalov  * Common Development and Distribution License (the "License").
6*16d86563SAlexander Pyhalov  * You may not use this file except in compliance with the License.
7*16d86563SAlexander Pyhalov  *
8*16d86563SAlexander Pyhalov  * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE
9*16d86563SAlexander Pyhalov  * or http://www.opensolaris.org/os/licensing.
10*16d86563SAlexander Pyhalov  * See the License for the specific language governing permissions
11*16d86563SAlexander Pyhalov  * and limitations under the License.
12*16d86563SAlexander Pyhalov  *
13*16d86563SAlexander Pyhalov  * When distributing Covered Code, include this CDDL HEADER in each
14*16d86563SAlexander Pyhalov  * file and include the License file at src/OPENSOLARIS.LICENSE.
15*16d86563SAlexander Pyhalov  * If applicable, add the following below this CDDL HEADER, with the
16*16d86563SAlexander Pyhalov  * fields enclosed by brackets "[]" replaced with your own identifying
17*16d86563SAlexander Pyhalov  * information: Portions Copyright [yyyy] [name of copyright owner]
18*16d86563SAlexander Pyhalov  *
19*16d86563SAlexander Pyhalov  * CDDL HEADER END
20*16d86563SAlexander Pyhalov  */
21*16d86563SAlexander Pyhalov /*
22*16d86563SAlexander Pyhalov  * Copyright (c) 1996 by Sun Microsystems, Inc.
23*16d86563SAlexander Pyhalov  */
24*16d86563SAlexander Pyhalov 
25*16d86563SAlexander Pyhalov 
26*16d86563SAlexander Pyhalov #include <errno.h>
27*16d86563SAlexander Pyhalov #include <widec.h>
28*16d86563SAlexander Pyhalov #include "common_def.h"
29*16d86563SAlexander Pyhalov #include "common_han.h"
30*16d86563SAlexander Pyhalov #include "utf_euc_api.h"
31*16d86563SAlexander Pyhalov #include "common_defs.h"
32*16d86563SAlexander Pyhalov 
33*16d86563SAlexander Pyhalov /****  _ I C V _ O P E N  ****/
34*16d86563SAlexander Pyhalov 
_icv_open()35*16d86563SAlexander Pyhalov void* _icv_open()
36*16d86563SAlexander Pyhalov {
37*16d86563SAlexander Pyhalov         return((void*)MAGIC_NUMBER);
38*16d86563SAlexander Pyhalov }  /* end of int _icv_open(). */
39*16d86563SAlexander Pyhalov 
40*16d86563SAlexander Pyhalov 
41*16d86563SAlexander Pyhalov /****  _ I C V _ C L O S E  ****/
42*16d86563SAlexander Pyhalov 
_icv_close(int * cd)43*16d86563SAlexander Pyhalov void _icv_close(int* cd)
44*16d86563SAlexander Pyhalov {
45*16d86563SAlexander Pyhalov         if (!cd || cd != (int*)MAGIC_NUMBER)
46*16d86563SAlexander Pyhalov                 errno = EBADF;
47*16d86563SAlexander Pyhalov }  /* end of void _icv_close(int*). */
48*16d86563SAlexander Pyhalov 
49*16d86563SAlexander Pyhalov 
50*16d86563SAlexander Pyhalov /****  _ I C V _ I C O N V  ****/
51*16d86563SAlexander Pyhalov 
_icv_iconv(int * cd,char ** inbuf,size_t * inbufleft,char ** outbuf,size_t * outbufleft)52*16d86563SAlexander Pyhalov size_t _icv_iconv(int* cd, char** inbuf, size_t* inbufleft,
53*16d86563SAlexander Pyhalov 			char** outbuf, size_t* outbufleft)
54*16d86563SAlexander Pyhalov {
55*16d86563SAlexander Pyhalov 	size_t		ret_val = 0;
56*16d86563SAlexander Pyhalov 	unsigned char*	ib;
57*16d86563SAlexander Pyhalov 	unsigned char*	ob;
58*16d86563SAlexander Pyhalov 	unsigned char*	ibtail;
59*16d86563SAlexander Pyhalov 	unsigned char*	obtail;
60*16d86563SAlexander Pyhalov 
61*16d86563SAlexander Pyhalov 	if (!cd || cd != (int*)MAGIC_NUMBER)
62*16d86563SAlexander Pyhalov 	{
63*16d86563SAlexander Pyhalov 		errno = EBADF;
64*16d86563SAlexander Pyhalov 		return((size_t)-1);
65*16d86563SAlexander Pyhalov 	}
66*16d86563SAlexander Pyhalov 
67*16d86563SAlexander Pyhalov 	if (!inbuf || !(*inbuf))
68*16d86563SAlexander Pyhalov 		return((size_t)0);
69*16d86563SAlexander Pyhalov 
70*16d86563SAlexander Pyhalov 	ib = (unsigned char*)*inbuf;
71*16d86563SAlexander Pyhalov 	ob = (unsigned char*)*outbuf;
72*16d86563SAlexander Pyhalov 	ibtail = ib + *inbufleft;
73*16d86563SAlexander Pyhalov 	obtail = ob + *outbufleft;
74*16d86563SAlexander Pyhalov 
75*16d86563SAlexander Pyhalov 	while (ib < ibtail)
76*16d86563SAlexander Pyhalov 	{
77*16d86563SAlexander Pyhalov 		if (!(*ib & 0x80))		/* 1-byte sequence */
78*16d86563SAlexander Pyhalov 		{
79*16d86563SAlexander Pyhalov 			if (ob >= obtail)
80*16d86563SAlexander Pyhalov 			{
81*16d86563SAlexander Pyhalov 				errno = E2BIG;
82*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
83*16d86563SAlexander Pyhalov 				break;
84*16d86563SAlexander Pyhalov 			}
85*16d86563SAlexander Pyhalov 			*ob++ = *ib++;
86*16d86563SAlexander Pyhalov 		}
87*16d86563SAlexander Pyhalov                 else if((*ib & 0xF0) == 0xE0) /* 3-byte sequence */
88*16d86563SAlexander Pyhalov 		{
89*16d86563SAlexander Pyhalov 			hcode_type utf8_code, euc_code;
90*16d86563SAlexander Pyhalov 
91*16d86563SAlexander Pyhalov 			if ((ibtail - ib) < 3)
92*16d86563SAlexander Pyhalov 			{
93*16d86563SAlexander Pyhalov 				errno = EINVAL;
94*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
95*16d86563SAlexander Pyhalov 				break;
96*16d86563SAlexander Pyhalov 			}
97*16d86563SAlexander Pyhalov 
98*16d86563SAlexander Pyhalov 			if (!is_valid_utf8_string(ib, 3))
99*16d86563SAlexander Pyhalov 		        {
100*16d86563SAlexander Pyhalov 				errno = EILSEQ;
101*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
102*16d86563SAlexander Pyhalov 				break;
103*16d86563SAlexander Pyhalov 		        }
104*16d86563SAlexander Pyhalov 
105*16d86563SAlexander Pyhalov 			utf8_code.byte.byte1 = 0;
106*16d86563SAlexander Pyhalov 			utf8_code.byte.byte2 = *ib;
107*16d86563SAlexander Pyhalov 			utf8_code.byte.byte3 = *(ib + 1);
108*16d86563SAlexander Pyhalov 			utf8_code.byte.byte4 = *(ib + 2);
109*16d86563SAlexander Pyhalov 
110*16d86563SAlexander Pyhalov 			euc_code = _utf8_to_wansung(utf8_code);
111*16d86563SAlexander Pyhalov 
112*16d86563SAlexander Pyhalov 			if ((obtail - ob) < 2)
113*16d86563SAlexander Pyhalov 		        {
114*16d86563SAlexander Pyhalov 				errno = E2BIG;
115*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
116*16d86563SAlexander Pyhalov 				break;
117*16d86563SAlexander Pyhalov 		        }
118*16d86563SAlexander Pyhalov 
119*16d86563SAlexander Pyhalov 			if (euc_code.code != 0) {
120*16d86563SAlexander Pyhalov 				/* If find something -> EUC code */
121*16d86563SAlexander Pyhalov 				*ob++ = euc_code.byte.byte3;
122*16d86563SAlexander Pyhalov 				*ob++ = euc_code.byte.byte4;
123*16d86563SAlexander Pyhalov 			}
124*16d86563SAlexander Pyhalov 			else
125*16d86563SAlexander Pyhalov 			{
126*16d86563SAlexander Pyhalov 				/* Let's assume the code is non-identical. */
127*16d86563SAlexander Pyhalov 				*ob++ = NON_IDENTICAL;
128*16d86563SAlexander Pyhalov 				ret_val += 1;
129*16d86563SAlexander Pyhalov 			}
130*16d86563SAlexander Pyhalov 			ib += 3;
131*16d86563SAlexander Pyhalov 		}
132*16d86563SAlexander Pyhalov                 else if((*ib & 0xE0) == 0xC0)	/* 2-byte sequence */
133*16d86563SAlexander Pyhalov 		{
134*16d86563SAlexander Pyhalov 			hcode_type utf8_code, euc_code;
135*16d86563SAlexander Pyhalov 
136*16d86563SAlexander Pyhalov 			if ((ibtail - ib) < 2)
137*16d86563SAlexander Pyhalov 			{
138*16d86563SAlexander Pyhalov 				errno = EINVAL;
139*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
140*16d86563SAlexander Pyhalov 				break;
141*16d86563SAlexander Pyhalov 			}
142*16d86563SAlexander Pyhalov 
143*16d86563SAlexander Pyhalov 			if (!is_valid_utf8_string(ib, 2))
144*16d86563SAlexander Pyhalov 		        {
145*16d86563SAlexander Pyhalov 				errno = EILSEQ;
146*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
147*16d86563SAlexander Pyhalov 				break;
148*16d86563SAlexander Pyhalov 		        }
149*16d86563SAlexander Pyhalov 
150*16d86563SAlexander Pyhalov 			utf8_code.byte.byte1 = 0;
151*16d86563SAlexander Pyhalov 			utf8_code.byte.byte2 = 0;
152*16d86563SAlexander Pyhalov 			utf8_code.byte.byte3 = *ib;
153*16d86563SAlexander Pyhalov 			utf8_code.byte.byte4 = *(ib + 1);
154*16d86563SAlexander Pyhalov 
155*16d86563SAlexander Pyhalov 			euc_code = _utf8_to_wansung(utf8_code);
156*16d86563SAlexander Pyhalov 
157*16d86563SAlexander Pyhalov 			if ((obtail - ob) < 2)
158*16d86563SAlexander Pyhalov 		        {
159*16d86563SAlexander Pyhalov 				errno = E2BIG;
160*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
161*16d86563SAlexander Pyhalov 				break;
162*16d86563SAlexander Pyhalov 		        }
163*16d86563SAlexander Pyhalov 
164*16d86563SAlexander Pyhalov 			if (euc_code.code != 0) {
165*16d86563SAlexander Pyhalov 				*ob++ = euc_code.byte.byte3;
166*16d86563SAlexander Pyhalov 				*ob++ = euc_code.byte.byte4;
167*16d86563SAlexander Pyhalov 			}
168*16d86563SAlexander Pyhalov 			else
169*16d86563SAlexander Pyhalov 			{
170*16d86563SAlexander Pyhalov 			  *ob++ = NON_IDENTICAL;
171*16d86563SAlexander Pyhalov 			  ret_val += 1;
172*16d86563SAlexander Pyhalov 			}
173*16d86563SAlexander Pyhalov 			ib += 2;
174*16d86563SAlexander Pyhalov 		}
175*16d86563SAlexander Pyhalov 		else  /* 11, 21, 26 & 31 bits codes won't be able to convert. */
176*16d86563SAlexander Pyhalov 		{
177*16d86563SAlexander Pyhalov 			short int offset, offset2;
178*16d86563SAlexander Pyhalov 
179*16d86563SAlexander Pyhalov 			if ((*ib & 0xE0) == 0xC0)  /* 11 */
180*16d86563SAlexander Pyhalov 				offset = 2;
181*16d86563SAlexander Pyhalov 			else if ((*ib & 0xF0) == 0xE0)  /* 16 */
182*16d86563SAlexander Pyhalov 				offset = 3;
183*16d86563SAlexander Pyhalov 			else if ((*ib & 0xF8) == 0xF0)  /* 21 */
184*16d86563SAlexander Pyhalov 				offset = 4;
185*16d86563SAlexander Pyhalov 			else if ((*ib & 0xFC) == 0xF8)  /* 26 */
186*16d86563SAlexander Pyhalov 				offset = 5;
187*16d86563SAlexander Pyhalov 			else if ((*ib & 0xFE) == 0xFC)  /* 31 */
188*16d86563SAlexander Pyhalov 				offset = 6;
189*16d86563SAlexander Pyhalov 			else  /* Illegal sequence. */
190*16d86563SAlexander Pyhalov 				offset = 1;
191*16d86563SAlexander Pyhalov 
192*16d86563SAlexander Pyhalov 			if ((ibtail - ib) < offset)
193*16d86563SAlexander Pyhalov 			{
194*16d86563SAlexander Pyhalov 				errno = EINVAL;
195*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
196*16d86563SAlexander Pyhalov 				break;
197*16d86563SAlexander Pyhalov 			}
198*16d86563SAlexander Pyhalov 
199*16d86563SAlexander Pyhalov 			if (!is_valid_utf8_string(ib, offset))
200*16d86563SAlexander Pyhalov 		        {
201*16d86563SAlexander Pyhalov 				errno = EILSEQ;
202*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
203*16d86563SAlexander Pyhalov 				break;
204*16d86563SAlexander Pyhalov 		        }
205*16d86563SAlexander Pyhalov 
206*16d86563SAlexander Pyhalov 			/* Let's assume the code is non-identical. */
207*16d86563SAlexander Pyhalov 			offset2 = (offset > 2) ? 2 : 1;
208*16d86563SAlexander Pyhalov 			if ((obtail - ob) < offset2)
209*16d86563SAlexander Pyhalov 			{
210*16d86563SAlexander Pyhalov 				errno = E2BIG;
211*16d86563SAlexander Pyhalov 				ret_val = (size_t)-1;
212*16d86563SAlexander Pyhalov 				break;
213*16d86563SAlexander Pyhalov 			}
214*16d86563SAlexander Pyhalov 
215*16d86563SAlexander Pyhalov 			*ob++ = NON_IDENTICAL;
216*16d86563SAlexander Pyhalov 			if (offset2 > 1)
217*16d86563SAlexander Pyhalov 				*ob++ = NON_IDENTICAL;
218*16d86563SAlexander Pyhalov 
219*16d86563SAlexander Pyhalov 			ib += offset;
220*16d86563SAlexander Pyhalov 
221*16d86563SAlexander Pyhalov 			ret_val += offset2;
222*16d86563SAlexander Pyhalov 		}
223*16d86563SAlexander Pyhalov 	}
224*16d86563SAlexander Pyhalov 
225*16d86563SAlexander Pyhalov 	*inbuf = (char*)ib;
226*16d86563SAlexander Pyhalov 	*inbufleft = ibtail - ib;
227*16d86563SAlexander Pyhalov 	*outbuf = (char*)ob;
228*16d86563SAlexander Pyhalov 	*outbufleft = obtail - ob;
229*16d86563SAlexander Pyhalov 
230*16d86563SAlexander Pyhalov 	return(ret_val);
231*16d86563SAlexander Pyhalov }  /* end of size_t _icv_iconv(int*, char**, size_t*, char**, size_t*).*/
232