1 /* libxml2 - Library for parsing XML documents
2  * Copyright (C) 2006-2019 Free Software Foundation, Inc.
3  *
4  * This file is not part of the GNU gettext program, but is used with
5  * GNU gettext.
6  *
7  * The original copyright notice is as follows:
8  */
9 
10 /*
11  * Copyright (C) 1998-2012 Daniel Veillard.  All Rights Reserved.
12  *
13  * Permission is hereby granted, free of charge, to any person obtaining a copy
14  * of this software and associated documentation files (the "Software"), to deal
15  * in the Software without restriction, including without limitation the rights
16  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
17  * copies of the Software, and to permit persons to whom the Software is fur-
18  * nished to do so, subject to the following conditions:
19  *
20  * The above copyright notice and this permission notice shall be included in
21  * all copies or substantial portions of the Software.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
24  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FIT-
25  * NESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
26  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
27  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
28  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
29  * THE SOFTWARE.
30  */
31 
32 /*
33  * chvalid.c:	this module implements the character range
34  *		validation APIs
35  *
36  * This file is automatically generated from the cvs source
37  * definition files using the genChRanges.py Python script
38  *
39  * Generation date: Mon Mar 27 11:09:48 2006
40  * Sources: chvalid.def
41  * William Brack <wbrack@mmm.com.hk>
42  */
43 
44 #define IN_LIBXML
45 #include "libxml.h"
46 #include <libxml/chvalid.h>
47 
48 /*
49  * The initial tables ({func_name}_tab) are used to validate whether a
50  * single-byte character is within the specified group.  Each table
51  * contains 256 bytes, with each byte representing one of the 256
52  * possible characters.  If the table byte is set, the character is
53  * allowed.
54  *
55  */
56 const unsigned char xmlIsPubidChar_tab[256] = {
57     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x01, 0x00,
58     0x00, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
59     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x01, 0x01, 0x00, 0x01,
60     0x01, 0x01, 0x00, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
61     0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
62     0x00, 0x01, 0x00, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
63     0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
64     0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x01,
65     0x00, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
66     0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
67     0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
68     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
69     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
70     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
71     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
72     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
73     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
74     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
75     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
76     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
77     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
78     0x00, 0x00, 0x00, 0x00 };
79 
80 static const xmlChSRange xmlIsBaseChar_srng[] = { {0x100, 0x131},
81     {0x134, 0x13e}, {0x141, 0x148}, {0x14a, 0x17e}, {0x180, 0x1c3},
82     {0x1cd, 0x1f0}, {0x1f4, 0x1f5}, {0x1fa, 0x217}, {0x250, 0x2a8},
83     {0x2bb, 0x2c1}, {0x386, 0x386}, {0x388, 0x38a}, {0x38c, 0x38c},
84     {0x38e, 0x3a1}, {0x3a3, 0x3ce}, {0x3d0, 0x3d6}, {0x3da, 0x3da},
85     {0x3dc, 0x3dc}, {0x3de, 0x3de}, {0x3e0, 0x3e0}, {0x3e2, 0x3f3},
86     {0x401, 0x40c}, {0x40e, 0x44f}, {0x451, 0x45c}, {0x45e, 0x481},
87     {0x490, 0x4c4}, {0x4c7, 0x4c8}, {0x4cb, 0x4cc}, {0x4d0, 0x4eb},
88     {0x4ee, 0x4f5}, {0x4f8, 0x4f9}, {0x531, 0x556}, {0x559, 0x559},
89     {0x561, 0x586}, {0x5d0, 0x5ea}, {0x5f0, 0x5f2}, {0x621, 0x63a},
90     {0x641, 0x64a}, {0x671, 0x6b7}, {0x6ba, 0x6be}, {0x6c0, 0x6ce},
91     {0x6d0, 0x6d3}, {0x6d5, 0x6d5}, {0x6e5, 0x6e6}, {0x905, 0x939},
92     {0x93d, 0x93d}, {0x958, 0x961}, {0x985, 0x98c}, {0x98f, 0x990},
93     {0x993, 0x9a8}, {0x9aa, 0x9b0}, {0x9b2, 0x9b2}, {0x9b6, 0x9b9},
94     {0x9dc, 0x9dd}, {0x9df, 0x9e1}, {0x9f0, 0x9f1}, {0xa05, 0xa0a},
95     {0xa0f, 0xa10}, {0xa13, 0xa28}, {0xa2a, 0xa30}, {0xa32, 0xa33},
96     {0xa35, 0xa36}, {0xa38, 0xa39}, {0xa59, 0xa5c}, {0xa5e, 0xa5e},
97     {0xa72, 0xa74}, {0xa85, 0xa8b}, {0xa8d, 0xa8d}, {0xa8f, 0xa91},
98     {0xa93, 0xaa8}, {0xaaa, 0xab0}, {0xab2, 0xab3}, {0xab5, 0xab9},
99     {0xabd, 0xabd}, {0xae0, 0xae0}, {0xb05, 0xb0c}, {0xb0f, 0xb10},
100     {0xb13, 0xb28}, {0xb2a, 0xb30}, {0xb32, 0xb33}, {0xb36, 0xb39},
101     {0xb3d, 0xb3d}, {0xb5c, 0xb5d}, {0xb5f, 0xb61}, {0xb85, 0xb8a},
102     {0xb8e, 0xb90}, {0xb92, 0xb95}, {0xb99, 0xb9a}, {0xb9c, 0xb9c},
103     {0xb9e, 0xb9f}, {0xba3, 0xba4}, {0xba8, 0xbaa}, {0xbae, 0xbb5},
104     {0xbb7, 0xbb9}, {0xc05, 0xc0c}, {0xc0e, 0xc10}, {0xc12, 0xc28},
105     {0xc2a, 0xc33}, {0xc35, 0xc39}, {0xc60, 0xc61}, {0xc85, 0xc8c},
106     {0xc8e, 0xc90}, {0xc92, 0xca8}, {0xcaa, 0xcb3}, {0xcb5, 0xcb9},
107     {0xcde, 0xcde}, {0xce0, 0xce1}, {0xd05, 0xd0c}, {0xd0e, 0xd10},
108     {0xd12, 0xd28}, {0xd2a, 0xd39}, {0xd60, 0xd61}, {0xe01, 0xe2e},
109     {0xe30, 0xe30}, {0xe32, 0xe33}, {0xe40, 0xe45}, {0xe81, 0xe82},
110     {0xe84, 0xe84}, {0xe87, 0xe88}, {0xe8a, 0xe8a}, {0xe8d, 0xe8d},
111     {0xe94, 0xe97}, {0xe99, 0xe9f}, {0xea1, 0xea3}, {0xea5, 0xea5},
112     {0xea7, 0xea7}, {0xeaa, 0xeab}, {0xead, 0xeae}, {0xeb0, 0xeb0},
113     {0xeb2, 0xeb3}, {0xebd, 0xebd}, {0xec0, 0xec4}, {0xf40, 0xf47},
114     {0xf49, 0xf69}, {0x10a0, 0x10c5}, {0x10d0, 0x10f6}, {0x1100, 0x1100},
115     {0x1102, 0x1103}, {0x1105, 0x1107}, {0x1109, 0x1109}, {0x110b, 0x110c},
116     {0x110e, 0x1112}, {0x113c, 0x113c}, {0x113e, 0x113e}, {0x1140, 0x1140},
117     {0x114c, 0x114c}, {0x114e, 0x114e}, {0x1150, 0x1150}, {0x1154, 0x1155},
118     {0x1159, 0x1159}, {0x115f, 0x1161}, {0x1163, 0x1163}, {0x1165, 0x1165},
119     {0x1167, 0x1167}, {0x1169, 0x1169}, {0x116d, 0x116e}, {0x1172, 0x1173},
120     {0x1175, 0x1175}, {0x119e, 0x119e}, {0x11a8, 0x11a8}, {0x11ab, 0x11ab},
121     {0x11ae, 0x11af}, {0x11b7, 0x11b8}, {0x11ba, 0x11ba}, {0x11bc, 0x11c2},
122     {0x11eb, 0x11eb}, {0x11f0, 0x11f0}, {0x11f9, 0x11f9}, {0x1e00, 0x1e9b},
123     {0x1ea0, 0x1ef9}, {0x1f00, 0x1f15}, {0x1f18, 0x1f1d}, {0x1f20, 0x1f45},
124     {0x1f48, 0x1f4d}, {0x1f50, 0x1f57}, {0x1f59, 0x1f59}, {0x1f5b, 0x1f5b},
125     {0x1f5d, 0x1f5d}, {0x1f5f, 0x1f7d}, {0x1f80, 0x1fb4}, {0x1fb6, 0x1fbc},
126     {0x1fbe, 0x1fbe}, {0x1fc2, 0x1fc4}, {0x1fc6, 0x1fcc}, {0x1fd0, 0x1fd3},
127     {0x1fd6, 0x1fdb}, {0x1fe0, 0x1fec}, {0x1ff2, 0x1ff4}, {0x1ff6, 0x1ffc},
128     {0x2126, 0x2126}, {0x212a, 0x212b}, {0x212e, 0x212e}, {0x2180, 0x2182},
129     {0x3041, 0x3094}, {0x30a1, 0x30fa}, {0x3105, 0x312c}, {0xac00, 0xd7a3}};
130 const xmlChRangeGroup xmlIsBaseCharGroup =
131 	{197, 0, xmlIsBaseChar_srng, (xmlChLRangePtr)0};
132 
133 static const xmlChSRange xmlIsChar_srng[] = { {0x100, 0xd7ff},
134     {0xe000, 0xfffd}};
135 static const xmlChLRange xmlIsChar_lrng[] = { {0x10000, 0x10ffff}};
136 const xmlChRangeGroup xmlIsCharGroup =
137 	{2, 1, xmlIsChar_srng, xmlIsChar_lrng};
138 
139 static const xmlChSRange xmlIsCombining_srng[] = { {0x300, 0x345},
140     {0x360, 0x361}, {0x483, 0x486}, {0x591, 0x5a1}, {0x5a3, 0x5b9},
141     {0x5bb, 0x5bd}, {0x5bf, 0x5bf}, {0x5c1, 0x5c2}, {0x5c4, 0x5c4},
142     {0x64b, 0x652}, {0x670, 0x670}, {0x6d6, 0x6dc}, {0x6dd, 0x6df},
143     {0x6e0, 0x6e4}, {0x6e7, 0x6e8}, {0x6ea, 0x6ed}, {0x901, 0x903},
144     {0x93c, 0x93c}, {0x93e, 0x94c}, {0x94d, 0x94d}, {0x951, 0x954},
145     {0x962, 0x963}, {0x981, 0x983}, {0x9bc, 0x9bc}, {0x9be, 0x9be},
146     {0x9bf, 0x9bf}, {0x9c0, 0x9c4}, {0x9c7, 0x9c8}, {0x9cb, 0x9cd},
147     {0x9d7, 0x9d7}, {0x9e2, 0x9e3}, {0xa02, 0xa02}, {0xa3c, 0xa3c},
148     {0xa3e, 0xa3e}, {0xa3f, 0xa3f}, {0xa40, 0xa42}, {0xa47, 0xa48},
149     {0xa4b, 0xa4d}, {0xa70, 0xa71}, {0xa81, 0xa83}, {0xabc, 0xabc},
150     {0xabe, 0xac5}, {0xac7, 0xac9}, {0xacb, 0xacd}, {0xb01, 0xb03},
151     {0xb3c, 0xb3c}, {0xb3e, 0xb43}, {0xb47, 0xb48}, {0xb4b, 0xb4d},
152     {0xb56, 0xb57}, {0xb82, 0xb83}, {0xbbe, 0xbc2}, {0xbc6, 0xbc8},
153     {0xbca, 0xbcd}, {0xbd7, 0xbd7}, {0xc01, 0xc03}, {0xc3e, 0xc44},
154     {0xc46, 0xc48}, {0xc4a, 0xc4d}, {0xc55, 0xc56}, {0xc82, 0xc83},
155     {0xcbe, 0xcc4}, {0xcc6, 0xcc8}, {0xcca, 0xccd}, {0xcd5, 0xcd6},
156     {0xd02, 0xd03}, {0xd3e, 0xd43}, {0xd46, 0xd48}, {0xd4a, 0xd4d},
157     {0xd57, 0xd57}, {0xe31, 0xe31}, {0xe34, 0xe3a}, {0xe47, 0xe4e},
158     {0xeb1, 0xeb1}, {0xeb4, 0xeb9}, {0xebb, 0xebc}, {0xec8, 0xecd},
159     {0xf18, 0xf19}, {0xf35, 0xf35}, {0xf37, 0xf37}, {0xf39, 0xf39},
160     {0xf3e, 0xf3e}, {0xf3f, 0xf3f}, {0xf71, 0xf84}, {0xf86, 0xf8b},
161     {0xf90, 0xf95}, {0xf97, 0xf97}, {0xf99, 0xfad}, {0xfb1, 0xfb7},
162     {0xfb9, 0xfb9}, {0x20d0, 0x20dc}, {0x20e1, 0x20e1}, {0x302a, 0x302f},
163     {0x3099, 0x3099}, {0x309a, 0x309a}};
164 const xmlChRangeGroup xmlIsCombiningGroup =
165 	{95, 0, xmlIsCombining_srng, (xmlChLRangePtr)0};
166 
167 static const xmlChSRange xmlIsDigit_srng[] = { {0x660, 0x669},
168     {0x6f0, 0x6f9}, {0x966, 0x96f}, {0x9e6, 0x9ef}, {0xa66, 0xa6f},
169     {0xae6, 0xaef}, {0xb66, 0xb6f}, {0xbe7, 0xbef}, {0xc66, 0xc6f},
170     {0xce6, 0xcef}, {0xd66, 0xd6f}, {0xe50, 0xe59}, {0xed0, 0xed9},
171     {0xf20, 0xf29}};
172 const xmlChRangeGroup xmlIsDigitGroup =
173 	{14, 0, xmlIsDigit_srng, (xmlChLRangePtr)0};
174 
175 static const xmlChSRange xmlIsExtender_srng[] = { {0x2d0, 0x2d0},
176     {0x2d1, 0x2d1}, {0x387, 0x387}, {0x640, 0x640}, {0xe46, 0xe46},
177     {0xec6, 0xec6}, {0x3005, 0x3005}, {0x3031, 0x3035}, {0x309d, 0x309e},
178     {0x30fc, 0x30fe}};
179 const xmlChRangeGroup xmlIsExtenderGroup =
180 	{10, 0, xmlIsExtender_srng, (xmlChLRangePtr)0};
181 
182 static const xmlChSRange xmlIsIdeographic_srng[] = { {0x3007, 0x3007},
183     {0x3021, 0x3029}, {0x4e00, 0x9fa5}};
184 const xmlChRangeGroup xmlIsIdeographicGroup =
185 	{3, 0, xmlIsIdeographic_srng, (xmlChLRangePtr)0};
186 
187 
188 /**
189  * xmlCharInRange:
190  * @val: character to be validated
191  * @rptr: pointer to range to be used to validate
192  *
193  * Does a binary search of the range table to determine if char
194  * is valid
195  *
196  * Returns: true if character valid, false otherwise
197  */
198 int
xmlCharInRange(unsigned int val,const xmlChRangeGroup * rptr)199 xmlCharInRange (unsigned int val, const xmlChRangeGroup *rptr) {
200     int low, high, mid;
201     const xmlChSRange *sptr;
202     const xmlChLRange *lptr;
203 
204     if (rptr == NULL) return(0);
205     if (val < 0x10000) {	/* is val in 'short' or 'long'  array? */
206 	if (rptr->nbShortRange == 0)
207 	    return 0;
208 	low = 0;
209 	high = rptr->nbShortRange - 1;
210 	sptr = rptr->shortRange;
211 	while (low <= high) {
212 	    mid = (low + high) / 2;
213 	    if ((unsigned short) val < sptr[mid].low) {
214 		high = mid - 1;
215 	    } else {
216 	        if ((unsigned short) val > sptr[mid].high) {
217 		    low = mid + 1;
218 		} else {
219 		    return 1;
220 		}
221 	    }
222 	}
223     } else {
224 	if (rptr->nbLongRange == 0) {
225 	    return 0;
226 	}
227 	low = 0;
228 	high = rptr->nbLongRange - 1;
229 	lptr = rptr->longRange;
230 	while (low <= high) {
231 	    mid = (low + high) / 2;
232 	    if (val < lptr[mid].low) {
233 		high = mid - 1;
234 	    } else {
235 	        if (val > lptr[mid].high) {
236 		    low = mid + 1;
237 		} else {
238 		    return 1;
239 		}
240 	    }
241 	}
242     }
243     return 0;
244 }
245 
246 
247 /**
248  * xmlIsBaseChar:
249  * @ch:  character to validate
250  *
251  * This function is DEPRECATED.
252  * Use xmlIsBaseChar_ch or xmlIsBaseCharQ instead
253  *
254  * Returns true if argument valid, false otherwise
255  */
256 int
xmlIsBaseChar(unsigned int ch)257 xmlIsBaseChar(unsigned int ch) {
258     return(xmlIsBaseCharQ(ch));
259 }
260 
261 
262 /**
263  * xmlIsBlank:
264  * @ch:  character to validate
265  *
266  * This function is DEPRECATED.
267  * Use xmlIsBlank_ch or xmlIsBlankQ instead
268  *
269  * Returns true if argument valid, false otherwise
270  */
271 int
xmlIsBlank(unsigned int ch)272 xmlIsBlank(unsigned int ch) {
273     return(xmlIsBlankQ(ch));
274 }
275 
276 
277 /**
278  * xmlIsChar:
279  * @ch:  character to validate
280  *
281  * This function is DEPRECATED.
282  * Use xmlIsChar_ch or xmlIsCharQ instead
283  *
284  * Returns true if argument valid, false otherwise
285  */
286 int
xmlIsChar(unsigned int ch)287 xmlIsChar(unsigned int ch) {
288     return(xmlIsCharQ(ch));
289 }
290 
291 
292 /**
293  * xmlIsCombining:
294  * @ch:  character to validate
295  *
296  * This function is DEPRECATED.
297  * Use xmlIsCombiningQ instead
298  *
299  * Returns true if argument valid, false otherwise
300  */
301 int
xmlIsCombining(unsigned int ch)302 xmlIsCombining(unsigned int ch) {
303     return(xmlIsCombiningQ(ch));
304 }
305 
306 
307 /**
308  * xmlIsDigit:
309  * @ch:  character to validate
310  *
311  * This function is DEPRECATED.
312  * Use xmlIsDigit_ch or xmlIsDigitQ instead
313  *
314  * Returns true if argument valid, false otherwise
315  */
316 int
xmlIsDigit(unsigned int ch)317 xmlIsDigit(unsigned int ch) {
318     return(xmlIsDigitQ(ch));
319 }
320 
321 
322 /**
323  * xmlIsExtender:
324  * @ch:  character to validate
325  *
326  * This function is DEPRECATED.
327  * Use xmlIsExtender_ch or xmlIsExtenderQ instead
328  *
329  * Returns true if argument valid, false otherwise
330  */
331 int
xmlIsExtender(unsigned int ch)332 xmlIsExtender(unsigned int ch) {
333     return(xmlIsExtenderQ(ch));
334 }
335 
336 
337 /**
338  * xmlIsIdeographic:
339  * @ch:  character to validate
340  *
341  * This function is DEPRECATED.
342  * Use xmlIsIdeographicQ instead
343  *
344  * Returns true if argument valid, false otherwise
345  */
346 int
xmlIsIdeographic(unsigned int ch)347 xmlIsIdeographic(unsigned int ch) {
348     return(xmlIsIdeographicQ(ch));
349 }
350 
351 
352 /**
353  * xmlIsPubidChar:
354  * @ch:  character to validate
355  *
356  * This function is DEPRECATED.
357  * Use xmlIsPubidChar_ch or xmlIsPubidCharQ instead
358  *
359  * Returns true if argument valid, false otherwise
360  */
361 int
xmlIsPubidChar(unsigned int ch)362 xmlIsPubidChar(unsigned int ch) {
363     return(xmlIsPubidCharQ(ch));
364 }
365 
366 #define bottom_chvalid
367 #include "elfgcchack.h"
368