1c99fb5f9SBaptiste Daroussin /* Copyright (c) 2013, Vsevolod Stakhov
2c99fb5f9SBaptiste Daroussin * All rights reserved.
3c99fb5f9SBaptiste Daroussin *
4c99fb5f9SBaptiste Daroussin * Redistribution and use in source and binary forms, with or without
5c99fb5f9SBaptiste Daroussin * modification, are permitted provided that the following conditions are met:
6c99fb5f9SBaptiste Daroussin * * Redistributions of source code must retain the above copyright
7c99fb5f9SBaptiste Daroussin * notice, this list of conditions and the following disclaimer.
8c99fb5f9SBaptiste Daroussin * * Redistributions in binary form must reproduce the above copyright
9c99fb5f9SBaptiste Daroussin * notice, this list of conditions and the following disclaimer in the
10c99fb5f9SBaptiste Daroussin * documentation and/or other materials provided with the distribution.
11c99fb5f9SBaptiste Daroussin *
12c99fb5f9SBaptiste Daroussin * THIS SOFTWARE IS PROVIDED ''AS IS'' AND ANY
13c99fb5f9SBaptiste Daroussin * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
14c99fb5f9SBaptiste Daroussin * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
15c99fb5f9SBaptiste Daroussin * DISCLAIMED. IN NO EVENT SHALL AUTHOR BE LIABLE FOR ANY
16c99fb5f9SBaptiste Daroussin * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
17c99fb5f9SBaptiste Daroussin * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
18c99fb5f9SBaptiste Daroussin * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
19c99fb5f9SBaptiste Daroussin * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
20c99fb5f9SBaptiste Daroussin * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
21c99fb5f9SBaptiste Daroussin * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
22c99fb5f9SBaptiste Daroussin */
23c99fb5f9SBaptiste Daroussin
24c99fb5f9SBaptiste Daroussin /**
25c99fb5f9SBaptiste Daroussin * @file this utility generates character table for ucl
26c99fb5f9SBaptiste Daroussin */
27c99fb5f9SBaptiste Daroussin
28c99fb5f9SBaptiste Daroussin #include <stdio.h>
29c99fb5f9SBaptiste Daroussin #include <ctype.h>
30c99fb5f9SBaptiste Daroussin #include <stdbool.h>
31c99fb5f9SBaptiste Daroussin
32c99fb5f9SBaptiste Daroussin static inline int
print_flag(const char * flag,bool * need_or,char * val)33c99fb5f9SBaptiste Daroussin print_flag (const char *flag, bool *need_or, char *val)
34c99fb5f9SBaptiste Daroussin {
35c99fb5f9SBaptiste Daroussin int res;
36c99fb5f9SBaptiste Daroussin res = sprintf (val, "%s%s", *need_or ? "|" : "", flag);
37c99fb5f9SBaptiste Daroussin
38c99fb5f9SBaptiste Daroussin *need_or |= true;
39c99fb5f9SBaptiste Daroussin
40c99fb5f9SBaptiste Daroussin return res;
41c99fb5f9SBaptiste Daroussin }
42c99fb5f9SBaptiste Daroussin
43c99fb5f9SBaptiste Daroussin int
main(int argc,char ** argv)44c99fb5f9SBaptiste Daroussin main (int argc, char **argv)
45c99fb5f9SBaptiste Daroussin {
46c99fb5f9SBaptiste Daroussin int i, col, r;
47c99fb5f9SBaptiste Daroussin const char *name = "ucl_chartable";
48c99fb5f9SBaptiste Daroussin bool need_or;
49c99fb5f9SBaptiste Daroussin char valbuf[2048];
50c99fb5f9SBaptiste Daroussin
51c99fb5f9SBaptiste Daroussin col = 0;
52c99fb5f9SBaptiste Daroussin
53c99fb5f9SBaptiste Daroussin if (argc > 1) {
54c99fb5f9SBaptiste Daroussin name = argv[1];
55c99fb5f9SBaptiste Daroussin }
56c99fb5f9SBaptiste Daroussin
57*39ee7a7aSBaptiste Daroussin printf ("static const unsigned int %s[256] = {\n", name);
58c99fb5f9SBaptiste Daroussin
59*39ee7a7aSBaptiste Daroussin for (i = 0; i < 256; i ++) {
60c99fb5f9SBaptiste Daroussin need_or = false;
61c99fb5f9SBaptiste Daroussin r = 0;
62c99fb5f9SBaptiste Daroussin /* UCL_CHARACTER_VALUE_END */
63c99fb5f9SBaptiste Daroussin
64c99fb5f9SBaptiste Daroussin if (i == ' ' || i == '\t') {
65c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_WHITESPACE", &need_or, valbuf + r);
66c99fb5f9SBaptiste Daroussin }
67c99fb5f9SBaptiste Daroussin if (isspace (i)) {
68c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_WHITESPACE_UNSAFE", &need_or, valbuf + r);
69c99fb5f9SBaptiste Daroussin }
70c99fb5f9SBaptiste Daroussin if (isalnum (i) || i >= 0x80 || i == '/' || i == '_') {
71c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_KEY_START", &need_or, valbuf + r);
72c99fb5f9SBaptiste Daroussin }
73c99fb5f9SBaptiste Daroussin if (isalnum (i) || i == '-' || i == '_' || i == '/' || i == '.' || i >= 0x80) {
74c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_KEY", &need_or, valbuf + r);
75c99fb5f9SBaptiste Daroussin }
76c99fb5f9SBaptiste Daroussin if (i == 0 || i == '\r' || i == '\n' || i == ']' || i == '}' || i == ';' || i == ',' || i == '#') {
77c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_VALUE_END", &need_or, valbuf + r);
78c99fb5f9SBaptiste Daroussin }
79c99fb5f9SBaptiste Daroussin else {
80c99fb5f9SBaptiste Daroussin if (isprint (i) || i >= 0x80) {
81c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_VALUE_STR", &need_or, valbuf + r);
82c99fb5f9SBaptiste Daroussin }
83c99fb5f9SBaptiste Daroussin if (isdigit (i) || i == '-') {
84c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_VALUE_DIGIT_START", &need_or, valbuf + r);
85c99fb5f9SBaptiste Daroussin }
86c99fb5f9SBaptiste Daroussin if (isalnum (i) || i == '.' || i == '-' || i == '+') {
87c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_VALUE_DIGIT", &need_or, valbuf + r);
88c99fb5f9SBaptiste Daroussin }
89c99fb5f9SBaptiste Daroussin }
90c99fb5f9SBaptiste Daroussin if (i == '"' || i == '\\' || i == '/' || i == 'b' ||
91c99fb5f9SBaptiste Daroussin i == 'f' || i == 'n' || i == 'r' || i == 't' || i == 'u') {
92c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_ESCAPE", &need_or, valbuf + r);
93c99fb5f9SBaptiste Daroussin }
94c99fb5f9SBaptiste Daroussin if (i == ' ' || i == '\t' || i == ':' || i == '=') {
95c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_KEY_SEP", &need_or, valbuf + r);
96c99fb5f9SBaptiste Daroussin }
97c99fb5f9SBaptiste Daroussin if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
98c99fb5f9SBaptiste Daroussin i == '"' || i == '\f') {
99c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_JSON_UNSAFE", &need_or, valbuf + r);
100c99fb5f9SBaptiste Daroussin }
101c99fb5f9SBaptiste Daroussin if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
102c99fb5f9SBaptiste Daroussin i == '"' || i == '\f' || i == '=' || i == ':' || i == '{' || i == '[' || i == ' ') {
103c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_UCL_UNSAFE", &need_or, valbuf + r);
104c99fb5f9SBaptiste Daroussin }
105c99fb5f9SBaptiste Daroussin
106c99fb5f9SBaptiste Daroussin if (!need_or) {
107c99fb5f9SBaptiste Daroussin r += print_flag ("UCL_CHARACTER_DENIED", &need_or, valbuf + r);
108c99fb5f9SBaptiste Daroussin }
109c99fb5f9SBaptiste Daroussin
110c99fb5f9SBaptiste Daroussin if (isprint (i)) {
111c99fb5f9SBaptiste Daroussin r += sprintf (valbuf + r, " /* %c */", i);
112c99fb5f9SBaptiste Daroussin }
113*39ee7a7aSBaptiste Daroussin if (i != 255) {
114c99fb5f9SBaptiste Daroussin r += sprintf (valbuf + r, ", ");
115c99fb5f9SBaptiste Daroussin }
116c99fb5f9SBaptiste Daroussin col += r;
117c99fb5f9SBaptiste Daroussin if (col > 80) {
118c99fb5f9SBaptiste Daroussin printf ("\n%s", valbuf);
119c99fb5f9SBaptiste Daroussin col = r;
120c99fb5f9SBaptiste Daroussin }
121c99fb5f9SBaptiste Daroussin else {
122c99fb5f9SBaptiste Daroussin printf ("%s", valbuf);
123c99fb5f9SBaptiste Daroussin }
124c99fb5f9SBaptiste Daroussin }
125c99fb5f9SBaptiste Daroussin printf ("\n}\n");
126c99fb5f9SBaptiste Daroussin
127c99fb5f9SBaptiste Daroussin return 0;
128c99fb5f9SBaptiste Daroussin }
129