1*b30d1939SAndy Fiddaman /***********************************************************************
2*b30d1939SAndy Fiddaman * *
3*b30d1939SAndy Fiddaman * This software is part of the ast package *
4*b30d1939SAndy Fiddaman * Copyright (c) 1985-2011 AT&T Intellectual Property *
5*b30d1939SAndy Fiddaman * and is licensed under the *
6*b30d1939SAndy Fiddaman * Eclipse Public License, Version 1.0 *
7*b30d1939SAndy Fiddaman * by AT&T Intellectual Property *
8*b30d1939SAndy Fiddaman * *
9*b30d1939SAndy Fiddaman * A copy of the License is available at *
10*b30d1939SAndy Fiddaman * http://www.eclipse.org/org/documents/epl-v10.html *
11*b30d1939SAndy Fiddaman * (with md5 checksum b35adb5213ca9657e911e9befb180842) *
12*b30d1939SAndy Fiddaman * *
13*b30d1939SAndy Fiddaman * Information and Software Systems Research *
14*b30d1939SAndy Fiddaman * AT&T Research *
15*b30d1939SAndy Fiddaman * Florham Park NJ *
16*b30d1939SAndy Fiddaman * *
17*b30d1939SAndy Fiddaman * Glenn Fowler <gsf@research.att.com> *
18*b30d1939SAndy Fiddaman * David Korn <dgk@research.att.com> *
19*b30d1939SAndy Fiddaman * Phong Vo <kpv@research.att.com> *
20*b30d1939SAndy Fiddaman * *
21*b30d1939SAndy Fiddaman ***********************************************************************/
22*b30d1939SAndy Fiddaman #pragma prototyped
23*b30d1939SAndy Fiddaman /*
24*b30d1939SAndy Fiddaman * Glenn Fowler
25*b30d1939SAndy Fiddaman * AT&T Research
26*b30d1939SAndy Fiddaman *
27*b30d1939SAndy Fiddaman * return string with expanded escape chars
28*b30d1939SAndy Fiddaman */
29*b30d1939SAndy Fiddaman
30*b30d1939SAndy Fiddaman #include <ast.h>
31*b30d1939SAndy Fiddaman #include <ccode.h>
32*b30d1939SAndy Fiddaman #include <ctype.h>
33*b30d1939SAndy Fiddaman #if _hdr_wchar && _hdr_wctype
34*b30d1939SAndy Fiddaman #include <wchar.h>
35*b30d1939SAndy Fiddaman #include <wctype.h>
36*b30d1939SAndy Fiddaman #endif
37*b30d1939SAndy Fiddaman
38*b30d1939SAndy Fiddaman /*
39*b30d1939SAndy Fiddaman * quote string as of length n with qb...qe
40*b30d1939SAndy Fiddaman * (flags&FMT_ALWAYS) always quotes, otherwise quote output only if necessary
41*b30d1939SAndy Fiddaman * qe and the usual suspects are \... escaped
42*b30d1939SAndy Fiddaman * (flags&FMT_WIDE) doesn't escape 8 bit chars
43*b30d1939SAndy Fiddaman * (flags&FMT_ESCAPED) doesn't \... escape the usual suspects
44*b30d1939SAndy Fiddaman * (flags&FMT_SHELL) escape $`"#;~&|()<>[]*?
45*b30d1939SAndy Fiddaman */
46*b30d1939SAndy Fiddaman
47*b30d1939SAndy Fiddaman char*
fmtquote(const char * as,const char * qb,const char * qe,size_t n,int flags)48*b30d1939SAndy Fiddaman fmtquote(const char* as, const char* qb, const char* qe, size_t n, int flags)
49*b30d1939SAndy Fiddaman {
50*b30d1939SAndy Fiddaman register unsigned char* s = (unsigned char*)as;
51*b30d1939SAndy Fiddaman register unsigned char* e = s + n;
52*b30d1939SAndy Fiddaman register char* b;
53*b30d1939SAndy Fiddaman register int c;
54*b30d1939SAndy Fiddaman register int m;
55*b30d1939SAndy Fiddaman register int escaped;
56*b30d1939SAndy Fiddaman register int spaced;
57*b30d1939SAndy Fiddaman register int doublequote;
58*b30d1939SAndy Fiddaman register int singlequote;
59*b30d1939SAndy Fiddaman int shell;
60*b30d1939SAndy Fiddaman char* f;
61*b30d1939SAndy Fiddaman char* buf;
62*b30d1939SAndy Fiddaman
63*b30d1939SAndy Fiddaman c = 4 * (n + 1);
64*b30d1939SAndy Fiddaman if (qb)
65*b30d1939SAndy Fiddaman c += strlen((char*)qb);
66*b30d1939SAndy Fiddaman if (qe)
67*b30d1939SAndy Fiddaman c += strlen((char*)qe);
68*b30d1939SAndy Fiddaman b = buf = fmtbuf(c);
69*b30d1939SAndy Fiddaman shell = 0;
70*b30d1939SAndy Fiddaman doublequote = 0;
71*b30d1939SAndy Fiddaman singlequote = 0;
72*b30d1939SAndy Fiddaman if (qb)
73*b30d1939SAndy Fiddaman {
74*b30d1939SAndy Fiddaman if (qb[0] == '$' && qb[1] == '\'' && qb[2] == 0)
75*b30d1939SAndy Fiddaman shell = 1;
76*b30d1939SAndy Fiddaman else if ((flags & FMT_SHELL) && qb[1] == 0)
77*b30d1939SAndy Fiddaman {
78*b30d1939SAndy Fiddaman if (qb[0] == '"')
79*b30d1939SAndy Fiddaman doublequote = 1;
80*b30d1939SAndy Fiddaman else if (qb[0] == '\'')
81*b30d1939SAndy Fiddaman singlequote = 1;
82*b30d1939SAndy Fiddaman }
83*b30d1939SAndy Fiddaman while (*b = *qb++)
84*b30d1939SAndy Fiddaman b++;
85*b30d1939SAndy Fiddaman }
86*b30d1939SAndy Fiddaman else if (flags & FMT_SHELL)
87*b30d1939SAndy Fiddaman doublequote = 1;
88*b30d1939SAndy Fiddaman f = b;
89*b30d1939SAndy Fiddaman escaped = spaced = !!(flags & FMT_ALWAYS);
90*b30d1939SAndy Fiddaman while (s < e)
91*b30d1939SAndy Fiddaman {
92*b30d1939SAndy Fiddaman if ((m = mbsize(s)) > 1 && (s + m) <= e)
93*b30d1939SAndy Fiddaman {
94*b30d1939SAndy Fiddaman #if _hdr_wchar && _hdr_wctype
95*b30d1939SAndy Fiddaman c = mbchar(s);
96*b30d1939SAndy Fiddaman if (!spaced && !escaped && (iswspace(c) || iswcntrl(c)))
97*b30d1939SAndy Fiddaman spaced = 1;
98*b30d1939SAndy Fiddaman s -= m;
99*b30d1939SAndy Fiddaman #endif
100*b30d1939SAndy Fiddaman while (m--)
101*b30d1939SAndy Fiddaman *b++ = *s++;
102*b30d1939SAndy Fiddaman }
103*b30d1939SAndy Fiddaman else
104*b30d1939SAndy Fiddaman {
105*b30d1939SAndy Fiddaman c = *s++;
106*b30d1939SAndy Fiddaman if (!(flags & FMT_ESCAPED) && (iscntrl(c) || !isprint(c) || c == '\\'))
107*b30d1939SAndy Fiddaman {
108*b30d1939SAndy Fiddaman escaped = 1;
109*b30d1939SAndy Fiddaman *b++ = '\\';
110*b30d1939SAndy Fiddaman switch (c)
111*b30d1939SAndy Fiddaman {
112*b30d1939SAndy Fiddaman case CC_bel:
113*b30d1939SAndy Fiddaman c = 'a';
114*b30d1939SAndy Fiddaman break;
115*b30d1939SAndy Fiddaman case '\b':
116*b30d1939SAndy Fiddaman c = 'b';
117*b30d1939SAndy Fiddaman break;
118*b30d1939SAndy Fiddaman case '\f':
119*b30d1939SAndy Fiddaman c = 'f';
120*b30d1939SAndy Fiddaman break;
121*b30d1939SAndy Fiddaman case '\n':
122*b30d1939SAndy Fiddaman c = 'n';
123*b30d1939SAndy Fiddaman break;
124*b30d1939SAndy Fiddaman case '\r':
125*b30d1939SAndy Fiddaman c = 'r';
126*b30d1939SAndy Fiddaman break;
127*b30d1939SAndy Fiddaman case '\t':
128*b30d1939SAndy Fiddaman c = 't';
129*b30d1939SAndy Fiddaman break;
130*b30d1939SAndy Fiddaman case CC_vt:
131*b30d1939SAndy Fiddaman c = 'v';
132*b30d1939SAndy Fiddaman break;
133*b30d1939SAndy Fiddaman case CC_esc:
134*b30d1939SAndy Fiddaman c = 'E';
135*b30d1939SAndy Fiddaman break;
136*b30d1939SAndy Fiddaman case '\\':
137*b30d1939SAndy Fiddaman break;
138*b30d1939SAndy Fiddaman default:
139*b30d1939SAndy Fiddaman if (!(flags & FMT_WIDE) || !(c & 0200))
140*b30d1939SAndy Fiddaman {
141*b30d1939SAndy Fiddaman *b++ = '0' + ((c >> 6) & 07);
142*b30d1939SAndy Fiddaman *b++ = '0' + ((c >> 3) & 07);
143*b30d1939SAndy Fiddaman c = '0' + (c & 07);
144*b30d1939SAndy Fiddaman }
145*b30d1939SAndy Fiddaman else
146*b30d1939SAndy Fiddaman b--;
147*b30d1939SAndy Fiddaman break;
148*b30d1939SAndy Fiddaman }
149*b30d1939SAndy Fiddaman }
150*b30d1939SAndy Fiddaman else if (c == '\\')
151*b30d1939SAndy Fiddaman {
152*b30d1939SAndy Fiddaman escaped = 1;
153*b30d1939SAndy Fiddaman *b++ = c;
154*b30d1939SAndy Fiddaman if (*s)
155*b30d1939SAndy Fiddaman c = *s++;
156*b30d1939SAndy Fiddaman }
157*b30d1939SAndy Fiddaman else if (qe && strchr(qe, c))
158*b30d1939SAndy Fiddaman {
159*b30d1939SAndy Fiddaman if (singlequote && c == '\'')
160*b30d1939SAndy Fiddaman {
161*b30d1939SAndy Fiddaman spaced = 1;
162*b30d1939SAndy Fiddaman *b++ = '\'';
163*b30d1939SAndy Fiddaman *b++ = '\\';
164*b30d1939SAndy Fiddaman *b++ = '\'';
165*b30d1939SAndy Fiddaman c = '\'';
166*b30d1939SAndy Fiddaman }
167*b30d1939SAndy Fiddaman else
168*b30d1939SAndy Fiddaman {
169*b30d1939SAndy Fiddaman escaped = 1;
170*b30d1939SAndy Fiddaman *b++ = '\\';
171*b30d1939SAndy Fiddaman }
172*b30d1939SAndy Fiddaman }
173*b30d1939SAndy Fiddaman else if (c == '$' || c == '`')
174*b30d1939SAndy Fiddaman {
175*b30d1939SAndy Fiddaman if (c == '$' && (flags & FMT_PARAM) && (*s == '{' || *s == '('))
176*b30d1939SAndy Fiddaman {
177*b30d1939SAndy Fiddaman if (singlequote || shell)
178*b30d1939SAndy Fiddaman {
179*b30d1939SAndy Fiddaman escaped = 1;
180*b30d1939SAndy Fiddaman *b++ = '\'';
181*b30d1939SAndy Fiddaman *b++ = c;
182*b30d1939SAndy Fiddaman *b++ = *s++;
183*b30d1939SAndy Fiddaman if (shell)
184*b30d1939SAndy Fiddaman {
185*b30d1939SAndy Fiddaman spaced = 1;
186*b30d1939SAndy Fiddaman *b++ = '$';
187*b30d1939SAndy Fiddaman }
188*b30d1939SAndy Fiddaman c = '\'';
189*b30d1939SAndy Fiddaman }
190*b30d1939SAndy Fiddaman else
191*b30d1939SAndy Fiddaman {
192*b30d1939SAndy Fiddaman escaped = 1;
193*b30d1939SAndy Fiddaman *b++ = c;
194*b30d1939SAndy Fiddaman c = *s++;
195*b30d1939SAndy Fiddaman }
196*b30d1939SAndy Fiddaman }
197*b30d1939SAndy Fiddaman else if (doublequote)
198*b30d1939SAndy Fiddaman *b++ = '\\';
199*b30d1939SAndy Fiddaman else if (singlequote || (flags & FMT_SHELL))
200*b30d1939SAndy Fiddaman spaced = 1;
201*b30d1939SAndy Fiddaman }
202*b30d1939SAndy Fiddaman else if (!spaced && !escaped && (isspace(c) || ((flags & FMT_SHELL) || shell) && (strchr("\";~&|()<>[]*?", c) || c == '#' && (b == f || isspace(*(b - 1))))))
203*b30d1939SAndy Fiddaman spaced = 1;
204*b30d1939SAndy Fiddaman *b++ = c;
205*b30d1939SAndy Fiddaman }
206*b30d1939SAndy Fiddaman }
207*b30d1939SAndy Fiddaman if (qb)
208*b30d1939SAndy Fiddaman {
209*b30d1939SAndy Fiddaman if (!escaped)
210*b30d1939SAndy Fiddaman buf += shell + !spaced;
211*b30d1939SAndy Fiddaman if (qe && (escaped || spaced))
212*b30d1939SAndy Fiddaman while (*b = *qe++)
213*b30d1939SAndy Fiddaman b++;
214*b30d1939SAndy Fiddaman }
215*b30d1939SAndy Fiddaman *b = 0;
216*b30d1939SAndy Fiddaman return buf;
217*b30d1939SAndy Fiddaman }
218*b30d1939SAndy Fiddaman
219*b30d1939SAndy Fiddaman /*
220*b30d1939SAndy Fiddaman * escape the usual suspects and quote chars in qs
221*b30d1939SAndy Fiddaman * in length n string as
222*b30d1939SAndy Fiddaman */
223*b30d1939SAndy Fiddaman
224*b30d1939SAndy Fiddaman char*
fmtnesq(const char * as,const char * qs,size_t n)225*b30d1939SAndy Fiddaman fmtnesq(const char* as, const char* qs, size_t n)
226*b30d1939SAndy Fiddaman {
227*b30d1939SAndy Fiddaman return fmtquote(as, NiL, qs, n, 0);
228*b30d1939SAndy Fiddaman }
229*b30d1939SAndy Fiddaman
230*b30d1939SAndy Fiddaman /*
231*b30d1939SAndy Fiddaman * escape the usual suspects and quote chars in qs
232*b30d1939SAndy Fiddaman */
233*b30d1939SAndy Fiddaman
234*b30d1939SAndy Fiddaman char*
fmtesq(const char * as,const char * qs)235*b30d1939SAndy Fiddaman fmtesq(const char* as, const char* qs)
236*b30d1939SAndy Fiddaman {
237*b30d1939SAndy Fiddaman return fmtquote(as, NiL, qs, strlen((char*)as), 0);
238*b30d1939SAndy Fiddaman }
239*b30d1939SAndy Fiddaman
240*b30d1939SAndy Fiddaman /*
241*b30d1939SAndy Fiddaman * escape the usual suspects
242*b30d1939SAndy Fiddaman */
243*b30d1939SAndy Fiddaman
244*b30d1939SAndy Fiddaman char*
fmtesc(const char * as)245*b30d1939SAndy Fiddaman fmtesc(const char* as)
246*b30d1939SAndy Fiddaman {
247*b30d1939SAndy Fiddaman return fmtquote(as, NiL, NiL, strlen((char*)as), 0);
248*b30d1939SAndy Fiddaman }
249