1 /* $NetBSD: gettext_iconv.c,v 1.8 2009/02/18 13:08:22 yamt Exp $ */
2
3 /*-
4 * Copyright (c) 2004 Citrus Project,
5 * All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 *
28 * $Citrus$
29 */
30
31
32 #include <sys/types.h>
33 #include <sys/param.h>
34
35 #include <errno.h>
36 #include <iconv.h>
37 #include <libintl.h>
38 #include <langinfo.h>
39 #include <search.h>
40 #include <stdlib.h>
41 #include <string.h>
42
43 #include "libintl_local.h"
44
/*
 * One entry of the conversion cache: pairs the address of an original
 * message with the address of its converted form.
 */
struct cache {
	const char *c_origmsg;		/* lookup key (compared by address) */
	const char *c_resultmsg;	/* converted text for c_origmsg */
};
49
/* conversion cache helpers; see the definitions below. */
static const struct cache *cache_find(const char *msg,
    struct domainbinding *db);
static int cache_enter(const char *origmsg, const char *resultmsg);
static int cache_cmp(const void *va, const void *vb);

/* root of the tsearch(3) tree holding every struct cache entry. */
static void *cacheroot;
55
56 /* ARGSUSED1 */
57 static const struct cache *
cache_find(const char * msg,struct domainbinding * db)58 cache_find(const char *msg, struct domainbinding *db)
59 {
60 struct cache key;
61 struct cache **c;
62
63 key.c_origmsg = msg;
64 c = tfind(&key, &cacheroot, cache_cmp);
65
66 return c ? *c : NULL;
67 }
68
69 static int
cache_enter(const char * origmsg,const char * resultmsg)70 cache_enter(const char *origmsg, const char *resultmsg)
71 {
72 struct cache *c;
73
74 c = malloc(sizeof(*c));
75 if (c == NULL)
76 return -1;
77
78 c->c_origmsg = origmsg;
79 c->c_resultmsg = resultmsg;
80
81 if (tsearch(c, &cacheroot, cache_cmp) == NULL) {
82 free(c);
83 return -1;
84 }
85
86 return 0;
87 }
88
89 static int
cache_cmp(const void * va,const void * vb)90 cache_cmp(const void *va, const void *vb)
91 {
92 const struct cache *a = va;
93 const struct cache *b = vb;
94 int result;
95
96 if (a->c_origmsg > b->c_origmsg) {
97 result = 1;
98 } else if (a->c_origmsg < b->c_origmsg) {
99 result = -1;
100 } else {
101 result = 0;
102 }
103
104 return result;
105 }
106
107 #define GETTEXT_ICONV_MALLOC_CHUNK (16 * 1024)
108
109 const char *
__gettext_iconv(const char * origmsg,struct domainbinding * db)110 __gettext_iconv(const char *origmsg, struct domainbinding *db)
111 {
112 const char *tocode;
113 const char *fromcode = db->mohandle.mo.mo_charset;
114 const struct cache *cache;
115 const char *result;
116 iconv_t cd;
117 const char *src;
118 char *dst;
119 size_t origlen;
120 size_t srclen;
121 size_t dstlen;
122 size_t nvalid;
123 int savederrno = errno;
124
125 /*
126 * static buffer for converted texts.
127 *
128 * note:
129 * we never free buffers once returned to callers.
130 * because of interface design of gettext, we can't know
131 * the lifetime of them.
132 */
133 static char *buffer;
134 static size_t bufferlen;
135
136 /*
137 * don't convert message if *.mo doesn't specify codeset.
138 */
139 if (fromcode == NULL)
140 return origmsg;
141
142 tocode = db->codeset;
143 if (tocode == NULL) {
144 /*
145 * codeset isn't specified explicitly by
146 * bind_textdomain_codeset().
147 * use current locale(LC_CTYPE)'s codeset.
148 *
149 * XXX maybe wrong; it can mismatch with
150 * environment variable setting.
151 */
152 tocode = nl_langinfo(CODESET);
153 }
154
155 /*
156 * shortcut if possible.
157 * XXX should handle aliases
158 */
159 if (!strcasecmp(tocode, fromcode))
160 return origmsg;
161
162 /* XXX LOCK */
163
164 /* XXX should detect change of tocode and purge caches? */
165
166 /*
167 * see if we have already converted this message.
168 */
169 cache = cache_find(origmsg, db);
170 if (cache) {
171 result = cache->c_resultmsg;
172 goto out;
173 }
174
175 origlen = strlen(origmsg) + 1;
176 again:
177 cd = iconv_open(tocode, fromcode);
178 if (cd == (iconv_t)-1) {
179 result = origmsg;
180 goto out;
181 }
182
183 src = origmsg;
184 srclen = origlen;
185 dst = buffer;
186 dstlen = bufferlen;
187 nvalid = iconv(cd, &src, &srclen, &dst, &dstlen);
188 iconv_close(cd);
189
190 if (nvalid == (size_t)-1) {
191 /*
192 * try to allocate a new buffer.
193 *
194 * just give up if GETTEXT_ICONV_MALLOC_CHUNK was not enough.
195 */
196 if (errno == E2BIG &&
197 bufferlen != GETTEXT_ICONV_MALLOC_CHUNK) {
198 buffer = malloc(GETTEXT_ICONV_MALLOC_CHUNK);
199 if (buffer) {
200 bufferlen = GETTEXT_ICONV_MALLOC_CHUNK;
201 goto again;
202 }
203 }
204
205 result = origmsg;
206 } else if (cache_enter(origmsg, buffer)) {
207 /*
208 * failed to enter cache. give up.
209 */
210 result = origmsg;
211 } else {
212 size_t resultlen = dst - buffer;
213
214 result = buffer;
215 bufferlen -= resultlen;
216 buffer += resultlen;
217 }
218
219 out:
220 /* XXX UNLOCK */
221 errno = savederrno;
222
223 return result;
224 }
225