1*16d86563SAlexander Pyhalov /*
2*16d86563SAlexander Pyhalov * CDDL HEADER START
3*16d86563SAlexander Pyhalov *
4*16d86563SAlexander Pyhalov * The contents of this file are subject to the terms of the
5*16d86563SAlexander Pyhalov * Common Development and Distribution License (the "License").
6*16d86563SAlexander Pyhalov * You may not use this file except in compliance with the License.
7*16d86563SAlexander Pyhalov *
8*16d86563SAlexander Pyhalov * You can obtain a copy of the license at src/OPENSOLARIS.LICENSE
9*16d86563SAlexander Pyhalov * or http://www.opensolaris.org/os/licensing.
10*16d86563SAlexander Pyhalov * See the License for the specific language governing permissions
11*16d86563SAlexander Pyhalov * and limitations under the License.
12*16d86563SAlexander Pyhalov *
13*16d86563SAlexander Pyhalov * When distributing Covered Code, include this CDDL HEADER in each
14*16d86563SAlexander Pyhalov * file and include the License file at src/OPENSOLARIS.LICENSE.
15*16d86563SAlexander Pyhalov * If applicable, add the following below this CDDL HEADER, with the
16*16d86563SAlexander Pyhalov * fields enclosed by brackets "[]" replaced with your own identifying
17*16d86563SAlexander Pyhalov * information: Portions Copyright [yyyy] [name of copyright owner]
18*16d86563SAlexander Pyhalov *
19*16d86563SAlexander Pyhalov * CDDL HEADER END
20*16d86563SAlexander Pyhalov */
21*16d86563SAlexander Pyhalov /*
22*16d86563SAlexander Pyhalov * Copyright (c) 1996 by Sun Microsystems, Inc.
23*16d86563SAlexander Pyhalov */
24*16d86563SAlexander Pyhalov
25*16d86563SAlexander Pyhalov
26*16d86563SAlexander Pyhalov #include <errno.h>
27*16d86563SAlexander Pyhalov #include <widec.h>
28*16d86563SAlexander Pyhalov #include "common_def.h"
29*16d86563SAlexander Pyhalov #include "common_thai.h"
30*16d86563SAlexander Pyhalov #include "utf_euc_api.h"
31*16d86563SAlexander Pyhalov
32*16d86563SAlexander Pyhalov #include "common_defs.h"
33*16d86563SAlexander Pyhalov /**** _ I C V _ O P E N ****/
34*16d86563SAlexander Pyhalov
_icv_open()35*16d86563SAlexander Pyhalov void* _icv_open()
36*16d86563SAlexander Pyhalov {
37*16d86563SAlexander Pyhalov return((void*)MAGIC_NUMBER);
38*16d86563SAlexander Pyhalov } /* end of int _icv_open(). */
39*16d86563SAlexander Pyhalov
40*16d86563SAlexander Pyhalov
41*16d86563SAlexander Pyhalov /**** _ I C V _ C L O S E ****/
42*16d86563SAlexander Pyhalov
_icv_close(int * cd)43*16d86563SAlexander Pyhalov void _icv_close(int* cd)
44*16d86563SAlexander Pyhalov {
45*16d86563SAlexander Pyhalov if (!cd || cd != (int*)MAGIC_NUMBER)
46*16d86563SAlexander Pyhalov errno = EBADF;
47*16d86563SAlexander Pyhalov } /* end of void _icv_close(int*). */
48*16d86563SAlexander Pyhalov
49*16d86563SAlexander Pyhalov
50*16d86563SAlexander Pyhalov /**** _ I C V _ I C O N V ****/
51*16d86563SAlexander Pyhalov
_icv_iconv(int * cd,char ** inbuf,size_t * inbufleft,char ** outbuf,size_t * outbufleft)52*16d86563SAlexander Pyhalov size_t _icv_iconv(int* cd, char** inbuf, size_t* inbufleft,
53*16d86563SAlexander Pyhalov char** outbuf, size_t* outbufleft)
54*16d86563SAlexander Pyhalov {
55*16d86563SAlexander Pyhalov size_t ret_val = 0;
56*16d86563SAlexander Pyhalov unsigned char* ib;
57*16d86563SAlexander Pyhalov unsigned char* ob;
58*16d86563SAlexander Pyhalov unsigned char* ibtail;
59*16d86563SAlexander Pyhalov unsigned char* obtail;
60*16d86563SAlexander Pyhalov
61*16d86563SAlexander Pyhalov if (!cd || cd != (int*)MAGIC_NUMBER)
62*16d86563SAlexander Pyhalov {
63*16d86563SAlexander Pyhalov errno = EBADF;
64*16d86563SAlexander Pyhalov return((size_t)-1);
65*16d86563SAlexander Pyhalov }
66*16d86563SAlexander Pyhalov
67*16d86563SAlexander Pyhalov if (!inbuf || !(*inbuf))
68*16d86563SAlexander Pyhalov return((size_t)0);
69*16d86563SAlexander Pyhalov
70*16d86563SAlexander Pyhalov ib = (unsigned char*)*inbuf;
71*16d86563SAlexander Pyhalov ob = (unsigned char*)*outbuf;
72*16d86563SAlexander Pyhalov ibtail = ib + *inbufleft;
73*16d86563SAlexander Pyhalov obtail = ob + *outbufleft;
74*16d86563SAlexander Pyhalov
75*16d86563SAlexander Pyhalov while (ib < ibtail)
76*16d86563SAlexander Pyhalov {
77*16d86563SAlexander Pyhalov if (!(*ib & 0x80)) /* 7 bits */
78*16d86563SAlexander Pyhalov {
79*16d86563SAlexander Pyhalov if (ob >= obtail)
80*16d86563SAlexander Pyhalov {
81*16d86563SAlexander Pyhalov errno = E2BIG;
82*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
83*16d86563SAlexander Pyhalov break;
84*16d86563SAlexander Pyhalov }
85*16d86563SAlexander Pyhalov *ob++ = *ib++;
86*16d86563SAlexander Pyhalov }
87*16d86563SAlexander Pyhalov else if ((*ib & 0xF0) == 0xE0) /* 16 bits */
88*16d86563SAlexander Pyhalov {
89*16d86563SAlexander Pyhalov hcode_type utf8_code, euc_code;
90*16d86563SAlexander Pyhalov
91*16d86563SAlexander Pyhalov if ((ibtail - ib) < 3)
92*16d86563SAlexander Pyhalov {
93*16d86563SAlexander Pyhalov errno = EINVAL;
94*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
95*16d86563SAlexander Pyhalov break;
96*16d86563SAlexander Pyhalov }
97*16d86563SAlexander Pyhalov
98*16d86563SAlexander Pyhalov /* UNICODE 3.2 :eliminate non-secure UTF-8 sequence */
99*16d86563SAlexander Pyhalov if (*(ib+1)<valid_min_2nd_byte[*ib] || *(ib+1)>valid_max_2nd_byte[*ib])
100*16d86563SAlexander Pyhalov {
101*16d86563SAlexander Pyhalov errno = EILSEQ;
102*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
103*16d86563SAlexander Pyhalov break;
104*16d86563SAlexander Pyhalov }
105*16d86563SAlexander Pyhalov else if ((*(ib+2)&0xC0)^0x80)
106*16d86563SAlexander Pyhalov {
107*16d86563SAlexander Pyhalov errno = EILSEQ;
108*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
109*16d86563SAlexander Pyhalov break;
110*16d86563SAlexander Pyhalov }
111*16d86563SAlexander Pyhalov else if (*ib==0xEF && *(ib+1)==0xBF && (*(ib+2)==0xBF || *(ib+2)==0xBE))
112*16d86563SAlexander Pyhalov { /*U+FFFE , U+FFFF*/
113*16d86563SAlexander Pyhalov errno = EILSEQ;
114*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
115*16d86563SAlexander Pyhalov break;
116*16d86563SAlexander Pyhalov }
117*16d86563SAlexander Pyhalov
118*16d86563SAlexander Pyhalov utf8_code.byte.byte1 = 0;
119*16d86563SAlexander Pyhalov utf8_code.byte.byte2 = *ib;
120*16d86563SAlexander Pyhalov utf8_code.byte.byte3 = *(ib + 1);
121*16d86563SAlexander Pyhalov utf8_code.byte.byte4 = *(ib + 2);
122*16d86563SAlexander Pyhalov
123*16d86563SAlexander Pyhalov euc_code = _utf8_to_eucTH(utf8_code);
124*16d86563SAlexander Pyhalov
125*16d86563SAlexander Pyhalov if (euc_code.code != 0) {
126*16d86563SAlexander Pyhalov /* If find something -> EUC code */
127*16d86563SAlexander Pyhalov *ob++ = euc_code.byte.byte4;
128*16d86563SAlexander Pyhalov }
129*16d86563SAlexander Pyhalov else
130*16d86563SAlexander Pyhalov {
131*16d86563SAlexander Pyhalov /* Let's assume the code is non-identical. */
132*16d86563SAlexander Pyhalov if ((obtail - ob) < 1)
133*16d86563SAlexander Pyhalov {
134*16d86563SAlexander Pyhalov errno = E2BIG;
135*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
136*16d86563SAlexander Pyhalov break;
137*16d86563SAlexander Pyhalov }
138*16d86563SAlexander Pyhalov *ob++ = NON_IDENTICAL;
139*16d86563SAlexander Pyhalov ret_val += 1;
140*16d86563SAlexander Pyhalov }
141*16d86563SAlexander Pyhalov ib += 3;
142*16d86563SAlexander Pyhalov }
143*16d86563SAlexander Pyhalov else /* 11, 21, 26 & 31 bits codes won't be able to convert. */
144*16d86563SAlexander Pyhalov {
145*16d86563SAlexander Pyhalov short int offset;
146*16d86563SAlexander Pyhalov
147*16d86563SAlexander Pyhalov errno = 0;
148*16d86563SAlexander Pyhalov offset = number_of_bytes_in_utf8_char[*ib];
149*16d86563SAlexander Pyhalov if (offset == ICV_TYPE_ILLEGAL_CHAR )
150*16d86563SAlexander Pyhalov {
151*16d86563SAlexander Pyhalov errno = EILSEQ;
152*16d86563SAlexander Pyhalov }
153*16d86563SAlexander Pyhalov else if (ibtail-ib < offset)
154*16d86563SAlexander Pyhalov {
155*16d86563SAlexander Pyhalov errno = EINVAL;
156*16d86563SAlexander Pyhalov }
157*16d86563SAlexander Pyhalov else if (*(ib+1)<valid_min_2nd_byte[*ib] || *(ib+1)>valid_max_2nd_byte[*ib])
158*16d86563SAlexander Pyhalov {
159*16d86563SAlexander Pyhalov errno = EILSEQ;
160*16d86563SAlexander Pyhalov }
161*16d86563SAlexander Pyhalov else /* check the remaining byte [0x80, 0xBF] */
162*16d86563SAlexander Pyhalov {
163*16d86563SAlexander Pyhalov int i;
164*16d86563SAlexander Pyhalov for(i=2;i<offset;i++)
165*16d86563SAlexander Pyhalov {
166*16d86563SAlexander Pyhalov if ((*(ib+i) & 0xC0) ^ 0x80)
167*16d86563SAlexander Pyhalov {
168*16d86563SAlexander Pyhalov errno = EILSEQ;
169*16d86563SAlexander Pyhalov break;
170*16d86563SAlexander Pyhalov }
171*16d86563SAlexander Pyhalov }
172*16d86563SAlexander Pyhalov }
173*16d86563SAlexander Pyhalov if(errno)
174*16d86563SAlexander Pyhalov {
175*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
176*16d86563SAlexander Pyhalov break;
177*16d86563SAlexander Pyhalov }
178*16d86563SAlexander Pyhalov
179*16d86563SAlexander Pyhalov ib += offset;
180*16d86563SAlexander Pyhalov
181*16d86563SAlexander Pyhalov /* Let's assume the code is non-identical. */
182*16d86563SAlexander Pyhalov offset = (offset > 2) ? 2 : 1;
183*16d86563SAlexander Pyhalov if ((obtail - ob) < offset)
184*16d86563SAlexander Pyhalov {
185*16d86563SAlexander Pyhalov errno = E2BIG;
186*16d86563SAlexander Pyhalov ret_val = (size_t)-1;
187*16d86563SAlexander Pyhalov break;
188*16d86563SAlexander Pyhalov }
189*16d86563SAlexander Pyhalov *ob++ = NON_IDENTICAL;
190*16d86563SAlexander Pyhalov if (offset > 1)
191*16d86563SAlexander Pyhalov *ob++ = NON_IDENTICAL;
192*16d86563SAlexander Pyhalov ret_val += offset;
193*16d86563SAlexander Pyhalov }
194*16d86563SAlexander Pyhalov }
195*16d86563SAlexander Pyhalov
196*16d86563SAlexander Pyhalov *inbuf = (char*)ib;
197*16d86563SAlexander Pyhalov *inbufleft = ibtail - ib;
198*16d86563SAlexander Pyhalov *outbuf = (char*)ob;
199*16d86563SAlexander Pyhalov *outbufleft = obtail - ob;
200*16d86563SAlexander Pyhalov
201*16d86563SAlexander Pyhalov return(ret_val);
202*16d86563SAlexander Pyhalov } /* end of size_t _icv_iconv(int*, char**, size_t*, char**, size_t*).*/
203