/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License (the "License"). * You may not use this file except in compliance with the License. * * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE * or http://www.opensolaris.org/os/licensing. * See the License for the specific language governing permissions * and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at src/OPENSOLARIS.LICENSE. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright (c) 1996 by Sun Microsystems, Inc. */ #include #include #include #include "common_han.h" #include "common_utf.h" #include "common_euc.h" #include "euc_utf_table.h" static int node_compare(const void *node1, const void *node2) { return(((int)(((const hcode_table *)node1)->code) - (int)(((const hcode_table *)node2)->code))); } /**** _ W A N S U N G _ T O _ U T F 8 ****/ hcode_type _wansung_to_utf8(hcode_type euc_code) { hcode_table *node_ptr, node; hcode_type utf_code; int udc_index; /* User Definable Area Check */ /* bugid 4701856 */ /* characters from 0xc9fa to 0xc9fe are not part of UDC */ /* Therefor, they need to be filtered out here... */ if ( (euc_code.code < 0xc9fa || euc_code.code > 0xc9fe) && ( (EUC_UDC_SEG1 == euc_code.byte.byte3) || (EUC_UDC_SEG2 == euc_code.byte.byte3) ) ){ if ((euc_code.byte.byte4 < EUC_UDC_OFFSET_START) || (EUC_UDC_OFFSET_END < euc_code.byte.byte4)) { /* beyond the UDC area */ utf_code.code = 0; return(utf_code); } udc_index = (euc_code.byte.byte3 == EUC_UDC_SEG1) ? 0 : EUC_UDC_SEG_GAP; udc_index += (int)(euc_code.byte.byte4 - EUC_UDC_OFFSET_START); utf_code = _udcidx_to_utf(udc_index); if (utf_code.code == UTF_UDC_ERROR) utf_code.code = UTF8_NON_ID_CHAR; /* Failed */ return(utf_code); } node.code = euc_code.word.low; node_ptr = bsearch( &node, euc2utf_tbl, sizeof(euc2utf_tbl)/sizeof(hcode_table), sizeof(hcode_table), node_compare); if (node_ptr != NULL) /* Success */ return(node_ptr->utf8); else { /* Failed */ utf_code.code = UTF8_NON_ID_CHAR; return(utf_code); } } /* end of hcode_type _wansung_to_utf8(hcode_type euc_code) */