xref: /freebsd/contrib/libucl/utils/chargen.c (revision 39ee7a7a)
1c99fb5f9SBaptiste Daroussin /* Copyright (c) 2013, Vsevolod Stakhov
2c99fb5f9SBaptiste Daroussin  * All rights reserved.
3c99fb5f9SBaptiste Daroussin  *
4c99fb5f9SBaptiste Daroussin  * Redistribution and use in source and binary forms, with or without
5c99fb5f9SBaptiste Daroussin  * modification, are permitted provided that the following conditions are met:
6c99fb5f9SBaptiste Daroussin  *       * Redistributions of source code must retain the above copyright
7c99fb5f9SBaptiste Daroussin  *         notice, this list of conditions and the following disclaimer.
8c99fb5f9SBaptiste Daroussin  *       * Redistributions in binary form must reproduce the above copyright
9c99fb5f9SBaptiste Daroussin  *         notice, this list of conditions and the following disclaimer in the
10c99fb5f9SBaptiste Daroussin  *         documentation and/or other materials provided with the distribution.
11c99fb5f9SBaptiste Daroussin  *
12c99fb5f9SBaptiste Daroussin  * THIS SOFTWARE IS PROVIDED ''AS IS'' AND ANY
13c99fb5f9SBaptiste Daroussin  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
14c99fb5f9SBaptiste Daroussin  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
15c99fb5f9SBaptiste Daroussin  * DISCLAIMED. IN NO EVENT SHALL AUTHOR BE LIABLE FOR ANY
16c99fb5f9SBaptiste Daroussin  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
17c99fb5f9SBaptiste Daroussin  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
18c99fb5f9SBaptiste Daroussin  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
19c99fb5f9SBaptiste Daroussin  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
20c99fb5f9SBaptiste Daroussin  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
21c99fb5f9SBaptiste Daroussin  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
22c99fb5f9SBaptiste Daroussin  */
23c99fb5f9SBaptiste Daroussin 
24c99fb5f9SBaptiste Daroussin /**
25c99fb5f9SBaptiste Daroussin  * @file this utility generates character table for ucl
26c99fb5f9SBaptiste Daroussin  */
27c99fb5f9SBaptiste Daroussin 
28c99fb5f9SBaptiste Daroussin #include <stdio.h>
29c99fb5f9SBaptiste Daroussin #include <ctype.h>
30c99fb5f9SBaptiste Daroussin #include <stdbool.h>
31c99fb5f9SBaptiste Daroussin 
32c99fb5f9SBaptiste Daroussin static inline int
print_flag(const char * flag,bool * need_or,char * val)33c99fb5f9SBaptiste Daroussin print_flag (const char *flag, bool *need_or, char *val)
34c99fb5f9SBaptiste Daroussin {
35c99fb5f9SBaptiste Daroussin 	int res;
36c99fb5f9SBaptiste Daroussin 	res = sprintf (val, "%s%s", *need_or ? "|" : "", flag);
37c99fb5f9SBaptiste Daroussin 
38c99fb5f9SBaptiste Daroussin 	*need_or |= true;
39c99fb5f9SBaptiste Daroussin 
40c99fb5f9SBaptiste Daroussin 	return res;
41c99fb5f9SBaptiste Daroussin }
42c99fb5f9SBaptiste Daroussin 
43c99fb5f9SBaptiste Daroussin int
main(int argc,char ** argv)44c99fb5f9SBaptiste Daroussin main (int argc, char **argv)
45c99fb5f9SBaptiste Daroussin {
46c99fb5f9SBaptiste Daroussin 	int i, col, r;
47c99fb5f9SBaptiste Daroussin 	const char *name = "ucl_chartable";
48c99fb5f9SBaptiste Daroussin 	bool need_or;
49c99fb5f9SBaptiste Daroussin 	char valbuf[2048];
50c99fb5f9SBaptiste Daroussin 
51c99fb5f9SBaptiste Daroussin 	col = 0;
52c99fb5f9SBaptiste Daroussin 
53c99fb5f9SBaptiste Daroussin 	if (argc > 1) {
54c99fb5f9SBaptiste Daroussin 		name = argv[1];
55c99fb5f9SBaptiste Daroussin 	}
56c99fb5f9SBaptiste Daroussin 
57*39ee7a7aSBaptiste Daroussin 	printf ("static const unsigned int %s[256] = {\n", name);
58c99fb5f9SBaptiste Daroussin 
59*39ee7a7aSBaptiste Daroussin 	for (i = 0; i < 256; i ++) {
60c99fb5f9SBaptiste Daroussin 		need_or = false;
61c99fb5f9SBaptiste Daroussin 		r = 0;
62c99fb5f9SBaptiste Daroussin 		/* UCL_CHARACTER_VALUE_END */
63c99fb5f9SBaptiste Daroussin 
64c99fb5f9SBaptiste Daroussin 		if (i == ' ' || i == '\t') {
65c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_WHITESPACE", &need_or, valbuf + r);
66c99fb5f9SBaptiste Daroussin 		}
67c99fb5f9SBaptiste Daroussin 		if (isspace (i)) {
68c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_WHITESPACE_UNSAFE", &need_or, valbuf + r);
69c99fb5f9SBaptiste Daroussin 		}
70c99fb5f9SBaptiste Daroussin 		if (isalnum (i) || i >= 0x80 || i == '/' || i == '_') {
71c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_KEY_START", &need_or, valbuf + r);
72c99fb5f9SBaptiste Daroussin 		}
73c99fb5f9SBaptiste Daroussin 		if (isalnum (i) || i == '-' || i == '_' || i == '/' || i == '.' || i >= 0x80) {
74c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_KEY", &need_or, valbuf + r);
75c99fb5f9SBaptiste Daroussin 		}
76c99fb5f9SBaptiste Daroussin 		if (i == 0 || i == '\r' || i == '\n' || i == ']' || i == '}' || i == ';' || i == ',' || i == '#') {
77c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_VALUE_END", &need_or, valbuf + r);
78c99fb5f9SBaptiste Daroussin 		}
79c99fb5f9SBaptiste Daroussin 		else {
80c99fb5f9SBaptiste Daroussin 			if (isprint (i) || i >= 0x80) {
81c99fb5f9SBaptiste Daroussin 				r += print_flag ("UCL_CHARACTER_VALUE_STR", &need_or, valbuf + r);
82c99fb5f9SBaptiste Daroussin 			}
83c99fb5f9SBaptiste Daroussin 			if (isdigit (i) || i == '-') {
84c99fb5f9SBaptiste Daroussin 				r += print_flag ("UCL_CHARACTER_VALUE_DIGIT_START", &need_or, valbuf + r);
85c99fb5f9SBaptiste Daroussin 			}
86c99fb5f9SBaptiste Daroussin 			if (isalnum (i) || i == '.' || i == '-' || i == '+') {
87c99fb5f9SBaptiste Daroussin 				r += print_flag ("UCL_CHARACTER_VALUE_DIGIT", &need_or, valbuf + r);
88c99fb5f9SBaptiste Daroussin 			}
89c99fb5f9SBaptiste Daroussin 		}
90c99fb5f9SBaptiste Daroussin 		if (i == '"' || i == '\\' || i == '/' || i == 'b' ||
91c99fb5f9SBaptiste Daroussin 			i == 'f' || i == 'n' || i == 'r' || i == 't' || i == 'u') {
92c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_ESCAPE", &need_or, valbuf + r);
93c99fb5f9SBaptiste Daroussin 		}
94c99fb5f9SBaptiste Daroussin 		if (i == ' ' || i == '\t' || i == ':' || i == '=') {
95c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_KEY_SEP", &need_or, valbuf + r);
96c99fb5f9SBaptiste Daroussin 		}
97c99fb5f9SBaptiste Daroussin 		if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
98c99fb5f9SBaptiste Daroussin 				i == '"' || i == '\f') {
99c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_JSON_UNSAFE", &need_or, valbuf + r);
100c99fb5f9SBaptiste Daroussin 		}
101c99fb5f9SBaptiste Daroussin 		if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
102c99fb5f9SBaptiste Daroussin 				i == '"' || i == '\f' || i == '=' || i == ':' || i == '{' || i == '[' || i == ' ') {
103c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_UCL_UNSAFE", &need_or, valbuf + r);
104c99fb5f9SBaptiste Daroussin 		}
105c99fb5f9SBaptiste Daroussin 
106c99fb5f9SBaptiste Daroussin 		if (!need_or) {
107c99fb5f9SBaptiste Daroussin 			r += print_flag ("UCL_CHARACTER_DENIED", &need_or, valbuf + r);
108c99fb5f9SBaptiste Daroussin 		}
109c99fb5f9SBaptiste Daroussin 
110c99fb5f9SBaptiste Daroussin 		if (isprint (i)) {
111c99fb5f9SBaptiste Daroussin 			r += sprintf (valbuf + r, " /* %c */", i);
112c99fb5f9SBaptiste Daroussin 		}
113*39ee7a7aSBaptiste Daroussin 		if (i != 255) {
114c99fb5f9SBaptiste Daroussin 			r += sprintf (valbuf + r, ", ");
115c99fb5f9SBaptiste Daroussin 		}
116c99fb5f9SBaptiste Daroussin 		col += r;
117c99fb5f9SBaptiste Daroussin 		if (col > 80) {
118c99fb5f9SBaptiste Daroussin 			printf ("\n%s", valbuf);
119c99fb5f9SBaptiste Daroussin 			col = r;
120c99fb5f9SBaptiste Daroussin 		}
121c99fb5f9SBaptiste Daroussin 		else {
122c99fb5f9SBaptiste Daroussin 			printf ("%s", valbuf);
123c99fb5f9SBaptiste Daroussin 		}
124c99fb5f9SBaptiste Daroussin 	}
125c99fb5f9SBaptiste Daroussin 	printf ("\n}\n");
126c99fb5f9SBaptiste Daroussin 
127c99fb5f9SBaptiste Daroussin 	return 0;
128c99fb5f9SBaptiste Daroussin }
129