1 #include <stdio.h>
2 #include <string.h>
3 #include <ctype.h>
4 #include <limits.h>
5 #include <stdlib.h>
6 #include <sys/types.h>
7 /* local headers */
8 #include "regex.h"
9 #include "utils.h"
10 #include "regex2.h"
11 
12 /* #include "debug.ih" // why generate this */
13 /* forward refs */
14 void regprint(regex_t *r, FILE *d);
15 static void s_print(register struct re_guts *g, FILE *d);
16 static char *regchar(int ch);
17 
18 /*
19  - regprint - print a regexp for debugging
20  == void regprint(regex_t *r, FILE *d);
21  */
22 void
regprint(r,d)23 regprint(r, d)
24 regex_t *r;
25 FILE *d;
26 {
27 	register struct re_guts *g = r->re_g;
28 	register int i;
29 	register int c;
30 	register int last;
31 	int nincat[NC];
32 
33 	fprintf(d, "%ld states, %d categories", (long)g->nstates,
34 							g->ncategories);
35 	fprintf(d, ", first %ld last %ld", (long)g->firststate,
36 						(long)g->laststate);
37 	if (g->iflags&USEBOL)
38 		fprintf(d, ", USEBOL");
39 	if (g->iflags&USEEOL)
40 		fprintf(d, ", USEEOL");
41 	if (g->iflags&BAD)
42 		fprintf(d, ", BAD");
43 	if (g->nsub > 0)
44 		fprintf(d, ", nsub=%ld", (long)g->nsub);
45 	if (g->must != NULL)
46 		fprintf(d, ", must(%ld) `%*s'", (long)g->mlen, (int)g->mlen,
47 								g->must);
48 	if (g->backrefs)
49 		fprintf(d, ", backrefs");
50 	if (g->nplus > 0)
51 		fprintf(d, ", nplus %ld", (long)g->nplus);
52 	fprintf(d, "\n");
53 	s_print(g, d);
54 	for (i = 0; i < g->ncategories; i++) {
55 		nincat[i] = 0;
56 		for (c = CHAR_MIN; c <= CHAR_MAX; c++)
57 			if (g->categories[c] == i)
58 				nincat[i]++;
59 	}
60 	fprintf(d, "cc0#%d", nincat[0]);
61 	for (i = 1; i < g->ncategories; i++)
62 		if (nincat[i] == 1) {
63 			for (c = CHAR_MIN; c <= CHAR_MAX; c++)
64 				if (g->categories[c] == i)
65 					break;
66 			fprintf(d, ", %d=%s", i, regchar(c));
67 		}
68 	fprintf(d, "\n");
69 	for (i = 1; i < g->ncategories; i++)
70 		if (nincat[i] != 1) {
71 			fprintf(d, "cc%d\t", i);
72 			last = -1;
73 			for (c = CHAR_MIN; c <= CHAR_MAX+1; c++)	/* +1 does flush */
74 				if (c <= CHAR_MAX && g->categories[c] == i) {
75 					if (last < 0) {
76 						fprintf(d, "%s", regchar(c));
77 						last = c;
78 					}
79 				} else {
80 					if (last >= 0) {
81 						if (last != c-1)
82 							fprintf(d, "-%s",
83 								regchar(c-1));
84 						last = -1;
85 					}
86 				}
87 			fprintf(d, "\n");
88 		}
89 }
90 
91 /*
92  - s_print - print the strip for debugging
93  == static void s_print(register struct re_guts *g, FILE *d);
94  */
95 static void
s_print(g,d)96 s_print(g, d)
97 register struct re_guts *g;
98 FILE *d;
99 {
100 	register sop *s;
101 	register cset *cs;
102 	register int i;
103 	register int done = 0;
104 	register sop opnd;
105 	register int col = 0;
106 	register int last;
107 	register sopno offset = 2;
108 #	define	GAP()	{	if (offset % 5 == 0) { \
109 					if (col > 40) { \
110 						fprintf(d, "\n\t"); \
111 						col = 0; \
112 					} else { \
113 						fprintf(d, " "); \
114 						col++; \
115 					} \
116 				} else \
117 					col++; \
118 				offset++; \
119 			}
120 
121 	if (OP(g->strip[0]) != OEND)
122 		fprintf(d, "missing initial OEND!\n");
123 	for (s = &g->strip[1]; !done; s++) {
124 		opnd = OPND(*s);
125 		switch (OP(*s)) {
126 		case OEND:
127 			fprintf(d, "\n");
128 			done = 1;
129 			break;
130 		case OCHAR:
131 			if (strchr("\\|()^$.[+*?{}!<> ", (char)opnd) != NULL)
132 				fprintf(d, "\\%c", (char)opnd);
133 			else
134 				fprintf(d, "%s", regchar((char)opnd));
135 			break;
136 		case OBOL:
137 			fprintf(d, "^");
138 			break;
139 		case OEOL:
140 			fprintf(d, "$");
141 			break;
142 		case OBOW:
143 			fprintf(d, "\\{");
144 			break;
145 		case OEOW:
146 			fprintf(d, "\\}");
147 			break;
148 		case OANY:
149 			fprintf(d, ".");
150 			break;
151 		case OANYOF:
152 			fprintf(d, "[(%ld)", (long)opnd);
153 			cs = &g->sets[opnd];
154 			last = -1;
155 			for (i = 0; i < g->csetsize+1; i++)	/* +1 flushes */
156 				if (CHIN(cs, i) && i < g->csetsize) {
157 					if (last < 0) {
158 						fprintf(d, "%s", regchar(i));
159 						last = i;
160 					}
161 				} else {
162 					if (last >= 0) {
163 						if (last != i-1)
164 							fprintf(d, "-%s",
165 								regchar(i-1));
166 						last = -1;
167 					}
168 				}
169 			fprintf(d, "]");
170 			break;
171 		case OBACK_:
172 			fprintf(d, "(\\<%ld>", (long)opnd);
173 			break;
174 		case O_BACK:
175 			fprintf(d, "<%ld>\\)", (long)opnd);
176 			break;
177 		case OPLUS_:
178 			fprintf(d, "(+");
179 			if (OP(*(s+opnd)) != O_PLUS)
180 				fprintf(d, "<%ld>", (long)opnd);
181 			break;
182 		case O_PLUS:
183 			if (OP(*(s-opnd)) != OPLUS_)
184 				fprintf(d, "<%ld>", (long)opnd);
185 			fprintf(d, "+)");
186 			break;
187 		case OQUEST_:
188 			fprintf(d, "(?");
189 			if (OP(*(s+opnd)) != O_QUEST)
190 				fprintf(d, "<%ld>", (long)opnd);
191 			break;
192 		case O_QUEST:
193 			if (OP(*(s-opnd)) != OQUEST_)
194 				fprintf(d, "<%ld>", (long)opnd);
195 			fprintf(d, "?)");
196 			break;
197 		case OLPAREN:
198 			fprintf(d, "((<%ld>", (long)opnd);
199 			break;
200 		case ORPAREN:
201 			fprintf(d, "<%ld>))", (long)opnd);
202 			break;
203 		case OCH_:
204 			fprintf(d, "<");
205 			if (OP(*(s+opnd)) != OOR2)
206 				fprintf(d, "<%ld>", (long)opnd);
207 			break;
208 		case OOR1:
209 			if (OP(*(s-opnd)) != OOR1 && OP(*(s-opnd)) != OCH_)
210 				fprintf(d, "<%ld>", (long)opnd);
211 			fprintf(d, "|");
212 			break;
213 		case OOR2:
214 			fprintf(d, "|");
215 			if (OP(*(s+opnd)) != OOR2 && OP(*(s+opnd)) != O_CH)
216 				fprintf(d, "<%ld>", (long)opnd);
217 			break;
218 		case O_CH:
219 			if (OP(*(s-opnd)) != OOR1)
220 				fprintf(d, "<%ld>", (long)opnd);
221 			fprintf(d, ">");
222 			break;
223 		default:
224 			fprintf(d, "!%d(%d)!", OP(*s), opnd);
225 			break;
226 		}
227 		if (!done)
228 			GAP();
229 	}
230 }
231 
/*
 - regchar - make a character printable
 == static char *regchar(int ch);
 *
 * Returns ch itself as a one-character string when it is a printing
 * character (space included), otherwise a backslash followed by its value
 * in octal.  ch is reduced to its unsigned char value first, so a negative
 * argument (a sign-extended plain char) yields e.g. "\200" instead of
 * reaching isprint() out of range or overrunning the buffer.
 *
 * The result points at a static buffer that the next call overwrites; copy
 * it if it must outlive that.
 */
static char *			/* -> representation */
regchar(int ch)
{
	static char buf[10];
	unsigned char uc = (unsigned char)ch;

	if (isprint(uc))
		snprintf(buf, sizeof buf, "%c", uc);
	else
		snprintf(buf, sizeof buf, "\\%o", (unsigned)uc);
	return(buf);
}
248