1 // std::ctype implementation details, GNU version -*- C++ -*-
2 
3 // Copyright (C) 2001-2013 Free Software Foundation, Inc.
4 //
5 // This file is part of the GNU ISO C++ Library.  This library is free
6 // software; you can redistribute it and/or modify it under the
7 // terms of the GNU General Public License as published by the
8 // Free Software Foundation; either version 3, or (at your option)
9 // any later version.
10 
11 // This library is distributed in the hope that it will be useful,
12 // but WITHOUT ANY WARRANTY; without even the implied warranty of
13 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14 // GNU General Public License for more details.
15 
16 // Under Section 7 of GPL version 3, you are granted additional
17 // permissions described in the GCC Runtime Library Exception, version
18 // 3.1, as published by the Free Software Foundation.
19 
20 // You should have received a copy of the GNU General Public License and
21 // a copy of the GCC Runtime Library Exception along with this program;
22 // see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
23 // <http://www.gnu.org/licenses/>.
24 
25 //
26 // ISO C++ 14882: 22.2.1.1.2  ctype virtual functions.
27 //
28 
29 // Written by Benjamin Kosnik <bkoz@redhat.com>
30 
31 #include <locale>
32 #include <cstdio>
33 #include <bits/c++locale_internal.h>
34 
35 namespace std _GLIBCXX_VISIBILITY(default)
36 {
37 _GLIBCXX_BEGIN_NAMESPACE_VERSION
38 
39   // NB: The other ctype<char> specializations are in src/locale.cc and
40   // various /config/os/* files.
41   ctype_byname<char>::ctype_byname(const char* __s, size_t __refs)
42   : ctype<char>(0, false, __refs)
43   {
44     if (std::strcmp(__s, "C") != 0 && std::strcmp(__s, "POSIX") != 0)
45       {
46 	this->_S_destroy_c_locale(this->_M_c_locale_ctype);
47 	this->_S_create_c_locale(this->_M_c_locale_ctype, __s);
48 	this->_M_toupper = this->_M_c_locale_ctype->__ctype_toupper;
49 	this->_M_tolower = this->_M_c_locale_ctype->__ctype_tolower;
50 	this->_M_table = this->_M_c_locale_ctype->__ctype_b;
51       }
52   }
53 
54   ctype_byname<char>::~ctype_byname()
55   { }
56 
57 #ifdef _GLIBCXX_USE_WCHAR_T
58   ctype<wchar_t>::__wmask_type
59   ctype<wchar_t>::_M_convert_to_wmask(const mask __m) const throw()
60   {
61     __wmask_type __ret;
62     switch (__m)
63       {
64       case space:
65 	__ret = __wctype_l("space", _M_c_locale_ctype);
66 	break;
67       case print:
68 	__ret = __wctype_l("print", _M_c_locale_ctype);
69 	break;
70       case cntrl:
71 	__ret = __wctype_l("cntrl", _M_c_locale_ctype);
72 	break;
73       case upper:
74 	__ret = __wctype_l("upper", _M_c_locale_ctype);
75 	break;
76       case lower:
77 	__ret = __wctype_l("lower", _M_c_locale_ctype);
78 	break;
79       case alpha:
80 	__ret = __wctype_l("alpha", _M_c_locale_ctype);
81 	break;
82       case digit:
83 	__ret = __wctype_l("digit", _M_c_locale_ctype);
84 	break;
85       case punct:
86 	__ret = __wctype_l("punct", _M_c_locale_ctype);
87 	break;
88       case xdigit:
89 	__ret = __wctype_l("xdigit", _M_c_locale_ctype);
90 	break;
91       case alnum:
92 	__ret = __wctype_l("alnum", _M_c_locale_ctype);
93 	break;
94       case graph:
95 	__ret = __wctype_l("graph", _M_c_locale_ctype);
96 	break;
97       default:
98 	__ret = __wmask_type();
99       }
100     return __ret;
101   }
102 
103   wchar_t
104   ctype<wchar_t>::do_toupper(wchar_t __c) const
105   { return __towupper_l(__c, _M_c_locale_ctype); }
106 
107   const wchar_t*
108   ctype<wchar_t>::do_toupper(wchar_t* __lo, const wchar_t* __hi) const
109   {
110     while (__lo < __hi)
111       {
112         *__lo = __towupper_l(*__lo, _M_c_locale_ctype);
113         ++__lo;
114       }
115     return __hi;
116   }
117 
118   wchar_t
119   ctype<wchar_t>::do_tolower(wchar_t __c) const
120   { return __towlower_l(__c, _M_c_locale_ctype); }
121 
122   const wchar_t*
123   ctype<wchar_t>::do_tolower(wchar_t* __lo, const wchar_t* __hi) const
124   {
125     while (__lo < __hi)
126       {
127         *__lo = __towlower_l(*__lo, _M_c_locale_ctype);
128         ++__lo;
129       }
130     return __hi;
131   }
132 
133   bool
134   ctype<wchar_t>::
135   do_is(mask __m, wchar_t __c) const
136   {
137     // The case of __m == ctype_base::space is particularly important,
138     // due to its use in many istream functions.  Therefore we deal with
139     // it first, exploiting the knowledge that on GNU systems _M_bit[5]
140     // is the mask corresponding to ctype_base::space.  NB: an encoding
141     // change would not affect correctness!
142     bool __ret = false;
143     if (__m == _M_bit[5])
144       __ret = __iswctype_l(__c, _M_wmask[5], _M_c_locale_ctype);
145     else
146       {
147 	// Highest bitmask in ctype_base == 10, but extra in "C"
148 	// library for blank.
149 	const size_t __bitmasksize = 11;
150 	for (size_t __bitcur = 0; __bitcur <= __bitmasksize; ++__bitcur)
151 	  if (__m & _M_bit[__bitcur])
152 	    {
153 	      if (__iswctype_l(__c, _M_wmask[__bitcur], _M_c_locale_ctype))
154 		{
155 		  __ret = true;
156 		  break;
157 		}
158 	      else if (__m == _M_bit[__bitcur])
159 		break;
160 	    }
161       }
162     return __ret;
163   }
164 
165   const wchar_t*
166   ctype<wchar_t>::
167   do_is(const wchar_t* __lo, const wchar_t* __hi, mask* __vec) const
168   {
169     for (; __lo < __hi; ++__vec, ++__lo)
170       {
171 	// Highest bitmask in ctype_base == 10, but extra in "C"
172 	// library for blank.
173 	const size_t __bitmasksize = 11;
174 	mask __m = 0;
175 	for (size_t __bitcur = 0; __bitcur <= __bitmasksize; ++__bitcur)
176 	  if (__iswctype_l(*__lo, _M_wmask[__bitcur], _M_c_locale_ctype))
177 	    __m |= _M_bit[__bitcur];
178 	*__vec = __m;
179       }
180     return __hi;
181   }
182 
183   const wchar_t*
184   ctype<wchar_t>::
185   do_scan_is(mask __m, const wchar_t* __lo, const wchar_t* __hi) const
186   {
187     while (__lo < __hi && !this->do_is(__m, *__lo))
188       ++__lo;
189     return __lo;
190   }
191 
192   const wchar_t*
193   ctype<wchar_t>::
194   do_scan_not(mask __m, const char_type* __lo, const char_type* __hi) const
195   {
196     while (__lo < __hi && this->do_is(__m, *__lo) != 0)
197       ++__lo;
198     return __lo;
199   }
200 
201   wchar_t
202   ctype<wchar_t>::
203   do_widen(char __c) const
204   { return _M_widen[static_cast<unsigned char>(__c)]; }
205 
206   const char*
207   ctype<wchar_t>::
208   do_widen(const char* __lo, const char* __hi, wchar_t* __dest) const
209   {
210     while (__lo < __hi)
211       {
212 	*__dest = _M_widen[static_cast<unsigned char>(*__lo)];
213 	++__lo;
214 	++__dest;
215       }
216     return __hi;
217   }
218 
219   char
220   ctype<wchar_t>::
221   do_narrow(wchar_t __wc, char __dfault) const
222   {
223     if (__wc >= 0 && __wc < 128 && _M_narrow_ok)
224       return _M_narrow[__wc];
225 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
226     __c_locale __old = __uselocale(_M_c_locale_ctype);
227 #endif
228     const int __c = wctob(__wc);
229 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
230     __uselocale(__old);
231 #endif
232     return (__c == EOF ? __dfault : static_cast<char>(__c));
233   }
234 
235   const wchar_t*
236   ctype<wchar_t>::
237   do_narrow(const wchar_t* __lo, const wchar_t* __hi, char __dfault,
238 	    char* __dest) const
239   {
240 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
241     __c_locale __old = __uselocale(_M_c_locale_ctype);
242 #endif
243     if (_M_narrow_ok)
244       while (__lo < __hi)
245 	{
246 	  if (*__lo >= 0 && *__lo < 128)
247 	    *__dest = _M_narrow[*__lo];
248 	  else
249 	    {
250 	      const int __c = wctob(*__lo);
251 	      *__dest = (__c == EOF ? __dfault : static_cast<char>(__c));
252 	    }
253 	  ++__lo;
254 	  ++__dest;
255 	}
256     else
257       while (__lo < __hi)
258 	{
259 	  const int __c = wctob(*__lo);
260 	  *__dest = (__c == EOF ? __dfault : static_cast<char>(__c));
261 	  ++__lo;
262 	  ++__dest;
263 	}
264 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
265     __uselocale(__old);
266 #endif
267     return __hi;
268   }
269 
270   void
271   ctype<wchar_t>::_M_initialize_ctype() throw()
272   {
273 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
274     __c_locale __old = __uselocale(_M_c_locale_ctype);
275 #endif
276     wint_t __i;
277     for (__i = 0; __i < 128; ++__i)
278       {
279 	const int __c = wctob(__i);
280 	if (__c == EOF)
281 	  break;
282 	else
283 	  _M_narrow[__i] = static_cast<char>(__c);
284       }
285     if (__i == 128)
286       _M_narrow_ok = true;
287     else
288       _M_narrow_ok = false;
289     for (size_t __j = 0;
290 	 __j < sizeof(_M_widen) / sizeof(wint_t); ++__j)
291       _M_widen[__j] = btowc(__j);
292 
293     for (size_t __k = 0; __k <= 11; ++__k)
294       {
295 	_M_bit[__k] = static_cast<mask>(_ISbit(__k));
296 	_M_wmask[__k] = _M_convert_to_wmask(_M_bit[__k]);
297       }
298 #if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2)
299     __uselocale(__old);
300 #endif
301   }
302 #endif //  _GLIBCXX_USE_WCHAR_T
303 
304 _GLIBCXX_END_NAMESPACE_VERSION
305 } // namespace
306