1 /* quotearg.c - quote arguments for output
2 
3    Copyright (C) 1998-2002, 2004-2021 Free Software Foundation, Inc.
4 
5    This program is free software: you can redistribute it and/or modify
6    it under the terms of the GNU General Public License as published by
7    the Free Software Foundation; either version 3 of the License, or
8    (at your option) any later version.
9 
10    This program is distributed in the hope that it will be useful,
11    but WITHOUT ANY WARRANTY; without even the implied warranty of
12    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13    GNU General Public License for more details.
14 
15    You should have received a copy of the GNU General Public License
16    along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
17 
18 /* Written by Paul Eggert <eggert@twinsun.com> */
19 
20 /* Without this pragma, gcc 4.7.0 20111124 mistakenly suggests that
21    the quoting_options_from_style function might be candidate for
22    attribute 'pure'  */
23 #if (__GNUC__ == 4 && 6 <= __GNUC_MINOR__) || 4 < __GNUC__
24 # pragma GCC diagnostic ignored "-Wsuggest-attribute=pure"
25 #endif
26 
27 #include <config.h>
28 
29 #include "quotearg.h"
30 #include "quote.h"
31 
32 #include "attribute.h"
33 #include "minmax.h"
34 #include "xalloc.h"
35 #include "c-strcaseeq.h"
36 #include "localcharset.h"
37 
38 #include <ctype.h>
39 #include <errno.h>
40 #include <limits.h>
41 #include <stdbool.h>
42 #include <stdint.h>
43 #include <stdlib.h>
44 #include <string.h>
45 #include <wchar.h>
46 #include <wctype.h>
47 
48 #include "gettext.h"
49 #define _(msgid) gettext (msgid)
50 #define N_(msgid) msgid
51 
52 #ifndef SIZE_MAX
53 # define SIZE_MAX ((size_t) -1)
54 #endif
55 
56 #define INT_BITS (sizeof (int) * CHAR_BIT)
57 
58 struct quoting_options
59 {
60   /* Basic quoting style.  */
61   enum quoting_style style;
62 
63   /* Additional flags.  Bitwise combination of enum quoting_flags.  */
64   int flags;
65 
66   /* Quote the characters indicated by this bit vector even if the
67      quoting style would not normally require them to be quoted.  */
68   unsigned int quote_these_too[(UCHAR_MAX / INT_BITS) + 1];
69 
70   /* The left quote for custom_quoting_style.  */
71   char const *left_quote;
72 
73   /* The right quote for custom_quoting_style.  */
74   char const *right_quote;
75 };
76 
77 /* Names of quoting styles.  */
78 char const *const quoting_style_args[] =
79 {
80   "literal",
81   "shell",
82   "shell-always",
83   "shell-escape",
84   "shell-escape-always",
85   "c",
86   "c-maybe",
87   "escape",
88   "locale",
89   "clocale",
90   0
91 };
92 
93 /* Correspondences to quoting style names.  */
94 enum quoting_style const quoting_style_vals[] =
95 {
96   literal_quoting_style,
97   shell_quoting_style,
98   shell_always_quoting_style,
99   shell_escape_quoting_style,
100   shell_escape_always_quoting_style,
101   c_quoting_style,
102   c_maybe_quoting_style,
103   escape_quoting_style,
104   locale_quoting_style,
105   clocale_quoting_style
106 };
107 
108 /* The default quoting options.  */
109 static struct quoting_options default_quoting_options;
110 
111 /* Allocate a new set of quoting options, with contents initially identical
112    to O if O is not null, or to the default if O is null.
113    It is the caller's responsibility to free the result.  */
114 struct quoting_options *
clone_quoting_options(struct quoting_options * o)115 clone_quoting_options (struct quoting_options *o)
116 {
117   int e = errno;
118   struct quoting_options *p = xmemdup (o ? o : &default_quoting_options,
119                                        sizeof *o);
120   errno = e;
121   return p;
122 }
123 
124 /* Get the value of O's quoting style.  If O is null, use the default.  */
125 enum quoting_style
get_quoting_style(struct quoting_options const * o)126 get_quoting_style (struct quoting_options const *o)
127 {
128   return (o ? o : &default_quoting_options)->style;
129 }
130 
131 /* In O (or in the default if O is null),
132    set the value of the quoting style to S.  */
133 void
set_quoting_style(struct quoting_options * o,enum quoting_style s)134 set_quoting_style (struct quoting_options *o, enum quoting_style s)
135 {
136   (o ? o : &default_quoting_options)->style = s;
137 }
138 
139 /* In O (or in the default if O is null),
140    set the value of the quoting options for character C to I.
141    Return the old value.  Currently, the only values defined for I are
142    0 (the default) and 1 (which means to quote the character even if
143    it would not otherwise be quoted).  */
144 int
set_char_quoting(struct quoting_options * o,char c,int i)145 set_char_quoting (struct quoting_options *o, char c, int i)
146 {
147   unsigned char uc = c;
148   unsigned int *p =
149     (o ? o : &default_quoting_options)->quote_these_too + uc / INT_BITS;
150   int shift = uc % INT_BITS;
151   int r = (*p >> shift) & 1;
152   *p ^= ((i & 1) ^ r) << shift;
153   return r;
154 }
155 
156 /* In O (or in the default if O is null),
157    set the value of the quoting options flag to I, which can be a
158    bitwise combination of enum quoting_flags, or 0 for default
159    behavior.  Return the old value.  */
160 int
set_quoting_flags(struct quoting_options * o,int i)161 set_quoting_flags (struct quoting_options *o, int i)
162 {
163   int r;
164   if (!o)
165     o = &default_quoting_options;
166   r = o->flags;
167   o->flags = i;
168   return r;
169 }
170 
171 void
set_custom_quoting(struct quoting_options * o,char const * left_quote,char const * right_quote)172 set_custom_quoting (struct quoting_options *o,
173                     char const *left_quote, char const *right_quote)
174 {
175   if (!o)
176     o = &default_quoting_options;
177   o->style = custom_quoting_style;
178   if (!left_quote || !right_quote)
179     abort ();
180   o->left_quote = left_quote;
181   o->right_quote = right_quote;
182 }
183 
184 /* Return quoting options for STYLE, with no extra quoting.  */
185 static struct quoting_options /* NOT PURE!! */
quoting_options_from_style(enum quoting_style style)186 quoting_options_from_style (enum quoting_style style)
187 {
188   struct quoting_options o = { literal_quoting_style, 0, { 0 }, NULL, NULL };
189   if (style == custom_quoting_style)
190     abort ();
191   o.style = style;
192   return o;
193 }
194 
195 /* MSGID approximates a quotation mark.  Return its translation if it
196    has one; otherwise, return either it or "\"", depending on S.
197 
198    S is either clocale_quoting_style or locale_quoting_style.  */
199 static char const *
gettext_quote(char const * msgid,enum quoting_style s)200 gettext_quote (char const *msgid, enum quoting_style s)
201 {
202   char const *translation = _(msgid);
203   char const *locale_code;
204 
205   if (translation != msgid)
206     return translation;
207 
208   /* For UTF-8 and GB-18030, use single quotes U+2018 and U+2019.
209      Here is a list of other locales that include U+2018 and U+2019:
210 
211         ISO-8859-7   0xA1                 KOI8-T       0x91
212         CP869        0x8B                 CP874        0x91
213         CP932        0x81 0x65            CP936        0xA1 0xAE
214         CP949        0xA1 0xAE            CP950        0xA1 0xA5
215         CP1250       0x91                 CP1251       0x91
216         CP1252       0x91                 CP1253       0x91
217         CP1254       0x91                 CP1255       0x91
218         CP1256       0x91                 CP1257       0x91
219         EUC-JP       0xA1 0xC6            EUC-KR       0xA1 0xAE
220         EUC-TW       0xA1 0xE4            BIG5         0xA1 0xA5
221         BIG5-HKSCS   0xA1 0xA5            EUC-CN       0xA1 0xAE
222         GBK          0xA1 0xAE            Georgian-PS  0x91
223         PT154        0x91
224 
225      None of these is still in wide use; using iconv is overkill.  */
226   locale_code = locale_charset ();
227   if (STRCASEEQ (locale_code, "UTF-8", 'U','T','F','-','8',0,0,0,0))
228     return msgid[0] == '`' ? "\xe2\x80\x98": "\xe2\x80\x99";
229   if (STRCASEEQ (locale_code, "GB18030", 'G','B','1','8','0','3','0',0,0))
230     return msgid[0] == '`' ? "\xa1\ae": "\xa1\xaf";
231 
232   return (s == clocale_quoting_style ? "\"" : "'");
233 }
234 
235 /* Place into buffer BUFFER (of size BUFFERSIZE) a quoted version of
236    argument ARG (of size ARGSIZE), using QUOTING_STYLE, FLAGS, and
237    QUOTE_THESE_TOO to control quoting.
238    Terminate the output with a null character, and return the written
239    size of the output, not counting the terminating null.
240    If BUFFERSIZE is too small to store the output string, return the
241    value that would have been returned had BUFFERSIZE been large enough.
242    If ARGSIZE is SIZE_MAX, use the string length of the argument for ARGSIZE.
243 
244    This function acts like quotearg_buffer (BUFFER, BUFFERSIZE, ARG,
245    ARGSIZE, O), except it breaks O into its component pieces and is
246    not careful about errno.  */
247 
248 static size_t
quotearg_buffer_restyled(char * buffer,size_t buffersize,char const * arg,size_t argsize,enum quoting_style quoting_style,int flags,unsigned int const * quote_these_too,char const * left_quote,char const * right_quote)249 quotearg_buffer_restyled (char *buffer, size_t buffersize,
250                           char const *arg, size_t argsize,
251                           enum quoting_style quoting_style, int flags,
252                           unsigned int const *quote_these_too,
253                           char const *left_quote,
254                           char const *right_quote)
255 {
256   size_t i;
257   size_t len = 0;
258   size_t orig_buffersize = 0;
259   char const *quote_string = 0;
260   size_t quote_string_len = 0;
261   bool backslash_escapes = false;
262   bool unibyte_locale = MB_CUR_MAX == 1;
263   bool elide_outer_quotes = (flags & QA_ELIDE_OUTER_QUOTES) != 0;
264   bool pending_shell_escape_end = false;
265   bool encountered_single_quote = false;
266   bool all_c_and_shell_quote_compat = true;
267 
268 #define STORE(c) \
269     do \
270       { \
271         if (len < buffersize) \
272           buffer[len] = (c); \
273         len++; \
274       } \
275     while (0)
276 
277 #define START_ESC() \
278     do \
279       { \
280         if (elide_outer_quotes) \
281           goto force_outer_quoting_style; \
282         escaping = true; \
283         if (quoting_style == shell_always_quoting_style \
284             && ! pending_shell_escape_end) \
285           { \
286             STORE ('\''); \
287             STORE ('$'); \
288             STORE ('\''); \
289             pending_shell_escape_end = true; \
290           } \
291         STORE ('\\'); \
292       } \
293     while (0)
294 
295 #define END_ESC() \
296     do \
297       { \
298         if (pending_shell_escape_end && ! escaping) \
299           { \
300             STORE ('\''); \
301             STORE ('\''); \
302             pending_shell_escape_end = false; \
303           } \
304       } \
305     while (0)
306 
307  process_input:
308 
309   switch (quoting_style)
310     {
311     case c_maybe_quoting_style:
312       quoting_style = c_quoting_style;
313       elide_outer_quotes = true;
314       FALLTHROUGH;
315     case c_quoting_style:
316       if (!elide_outer_quotes)
317         STORE ('"');
318       backslash_escapes = true;
319       quote_string = "\"";
320       quote_string_len = 1;
321       break;
322 
323     case escape_quoting_style:
324       backslash_escapes = true;
325       elide_outer_quotes = false;
326       break;
327 
328     case locale_quoting_style:
329     case clocale_quoting_style:
330     case custom_quoting_style:
331       {
332         if (quoting_style != custom_quoting_style)
333           {
334             /* TRANSLATORS:
335                Get translations for open and closing quotation marks.
336                The message catalog should translate "`" to a left
337                quotation mark suitable for the locale, and similarly for
338                "'".  For example, a French Unicode local should translate
339                these to U+00AB (LEFT-POINTING DOUBLE ANGLE
340                QUOTATION MARK), and U+00BB (RIGHT-POINTING DOUBLE ANGLE
341                QUOTATION MARK), respectively.
342 
343                If the catalog has no translation, we will try to
344                use Unicode U+2018 (LEFT SINGLE QUOTATION MARK) and
345                Unicode U+2019 (RIGHT SINGLE QUOTATION MARK).  If the
346                current locale is not Unicode, locale_quoting_style
347                will quote 'like this', and clocale_quoting_style will
348                quote "like this".  You should always include translations
349                for "`" and "'" even if U+2018 and U+2019 are appropriate
350                for your locale.
351 
352                If you don't know what to put here, please see
353                <https://en.wikipedia.org/wiki/Quotation_marks_in_other_languages>
354                and use glyphs suitable for your language.  */
355             left_quote = gettext_quote (N_("`"), quoting_style);
356             right_quote = gettext_quote (N_("'"), quoting_style);
357           }
358         if (!elide_outer_quotes)
359           for (quote_string = left_quote; *quote_string; quote_string++)
360             STORE (*quote_string);
361         backslash_escapes = true;
362         quote_string = right_quote;
363         quote_string_len = strlen (quote_string);
364       }
365       break;
366 
367     case shell_escape_quoting_style:
368       backslash_escapes = true;
369       FALLTHROUGH;
370     case shell_quoting_style:
371       elide_outer_quotes = true;
372       FALLTHROUGH;
373     case shell_escape_always_quoting_style:
374       if (!elide_outer_quotes)
375         backslash_escapes = true;
376       FALLTHROUGH;
377     case shell_always_quoting_style:
378       quoting_style = shell_always_quoting_style;
379       if (!elide_outer_quotes)
380         STORE ('\'');
381       quote_string = "'";
382       quote_string_len = 1;
383       break;
384 
385     case literal_quoting_style:
386       elide_outer_quotes = false;
387       break;
388 
389     default:
390       abort ();
391     }
392 
393   for (i = 0;  ! (argsize == SIZE_MAX ? arg[i] == '\0' : i == argsize);  i++)
394     {
395       unsigned char c;
396       unsigned char esc;
397       bool is_right_quote = false;
398       bool escaping = false;
399       bool c_and_shell_quote_compat = false;
400 
401       if (backslash_escapes
402           && quoting_style != shell_always_quoting_style
403           && quote_string_len
404           && (i + quote_string_len
405               <= (argsize == SIZE_MAX && 1 < quote_string_len
406                   /* Use strlen only if we must: when argsize is SIZE_MAX,
407                      and when the quote string is more than 1 byte long.
408                      If we do call strlen, save the result.  */
409                   ? (argsize = strlen (arg)) : argsize))
410           && memcmp (arg + i, quote_string, quote_string_len) == 0)
411         {
412           if (elide_outer_quotes)
413             goto force_outer_quoting_style;
414           is_right_quote = true;
415         }
416 
417       c = arg[i];
418       switch (c)
419         {
420         case '\0':
421           if (backslash_escapes)
422             {
423               START_ESC ();
424               /* If quote_string were to begin with digits, we'd need to
425                  test for the end of the arg as well.  However, it's
426                  hard to imagine any locale that would use digits in
427                  quotes, and set_custom_quoting is documented not to
428                  accept them.  Use only a single \0 with shell-escape
429                  as currently digits are not printed within $'...'  */
430               if (quoting_style != shell_always_quoting_style
431                   && i + 1 < argsize && '0' <= arg[i + 1] && arg[i + 1] <= '9')
432                 {
433                   STORE ('0');
434                   STORE ('0');
435                 }
436               c = '0';
437               /* We don't have to worry that this last '0' will be
438                  backslash-escaped because, again, quote_string should
439                  not start with it and because quote_these_too is
440                  documented as not accepting it.  */
441             }
442           else if (flags & QA_ELIDE_NULL_BYTES)
443             continue;
444           break;
445 
446         case '?':
447           switch (quoting_style)
448             {
449             case shell_always_quoting_style:
450               if (elide_outer_quotes)
451                 goto force_outer_quoting_style;
452               break;
453 
454             case c_quoting_style:
455               if ((flags & QA_SPLIT_TRIGRAPHS)
456                   && i + 2 < argsize && arg[i + 1] == '?')
457                 switch (arg[i + 2])
458                   {
459                   case '!': case '\'':
460                   case '(': case ')': case '-': case '/':
461                   case '<': case '=': case '>':
462                     /* Escape the second '?' in what would otherwise be
463                        a trigraph.  */
464                     if (elide_outer_quotes)
465                       goto force_outer_quoting_style;
466                     c = arg[i + 2];
467                     i += 2;
468                     STORE ('?');
469                     STORE ('"');
470                     STORE ('"');
471                     STORE ('?');
472                     break;
473 
474                   default:
475                     break;
476                   }
477               break;
478 
479             default:
480               break;
481             }
482           break;
483 
484         case '\a': esc = 'a'; goto c_escape;
485         case '\b': esc = 'b'; goto c_escape;
486         case '\f': esc = 'f'; goto c_escape;
487         case '\n': esc = 'n'; goto c_and_shell_escape;
488         case '\r': esc = 'r'; goto c_and_shell_escape;
489         case '\t': esc = 't'; goto c_and_shell_escape;
490         case '\v': esc = 'v'; goto c_escape;
491         case '\\': esc = c;
492           /* Never need to escape '\' in shell case.  */
493           if (quoting_style == shell_always_quoting_style)
494             {
495               if (elide_outer_quotes)
496                 goto force_outer_quoting_style;
497               goto store_c;
498             }
499 
500           /* No need to escape the escape if we are trying to elide
501              outer quotes and nothing else is problematic.  */
502           if (backslash_escapes && elide_outer_quotes && quote_string_len)
503             goto store_c;
504 
505         c_and_shell_escape:
506           if (quoting_style == shell_always_quoting_style
507               && elide_outer_quotes)
508             goto force_outer_quoting_style;
509           /* fall through */
510         c_escape:
511           if (backslash_escapes)
512             {
513               c = esc;
514               goto store_escape;
515             }
516           break;
517 
518         case '{': case '}': /* sometimes special if isolated */
519           if (! (argsize == SIZE_MAX ? arg[1] == '\0' : argsize == 1))
520             break;
521           FALLTHROUGH;
522         case '#': case '~':
523           if (i != 0)
524             break;
525           FALLTHROUGH;
526         case ' ':
527           c_and_shell_quote_compat = true;
528           FALLTHROUGH;
529         case '!': /* special in bash */
530         case '"': case '$': case '&':
531         case '(': case ')': case '*': case ';':
532         case '<':
533         case '=': /* sometimes special in 0th or (with "set -k") later args */
534         case '>': case '[':
535         case '^': /* special in old /bin/sh, e.g. SunOS 4.1.4 */
536         case '`': case '|':
537           /* A shell special character.  In theory, '$' and '`' could
538              be the first bytes of multibyte characters, which means
539              we should check them with mbrtowc, but in practice this
540              doesn't happen so it's not worth worrying about.  */
541           if (quoting_style == shell_always_quoting_style
542               && elide_outer_quotes)
543             goto force_outer_quoting_style;
544           break;
545 
546         case '\'':
547           encountered_single_quote = true;
548           c_and_shell_quote_compat = true;
549           if (quoting_style == shell_always_quoting_style)
550             {
551               if (elide_outer_quotes)
552                 goto force_outer_quoting_style;
553 
554               if (buffersize && ! orig_buffersize)
555                 {
556                   /* Just scan string to see if supports a more concise
557                      representation, rather than writing a longer string
558                      but returning the length of the more concise form.  */
559                   orig_buffersize = buffersize;
560                   buffersize = 0;
561                 }
562 
563               STORE ('\'');
564               STORE ('\\');
565               STORE ('\'');
566               pending_shell_escape_end = false;
567             }
568           break;
569 
570         case '%': case '+': case ',': case '-': case '.': case '/':
571         case '0': case '1': case '2': case '3': case '4': case '5':
572         case '6': case '7': case '8': case '9': case ':':
573         case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
574         case 'G': case 'H': case 'I': case 'J': case 'K': case 'L':
575         case 'M': case 'N': case 'O': case 'P': case 'Q': case 'R':
576         case 'S': case 'T': case 'U': case 'V': case 'W': case 'X':
577         case 'Y': case 'Z': case ']': case '_': case 'a': case 'b':
578         case 'c': case 'd': case 'e': case 'f': case 'g': case 'h':
579         case 'i': case 'j': case 'k': case 'l': case 'm': case 'n':
580         case 'o': case 'p': case 'q': case 'r': case 's': case 't':
581         case 'u': case 'v': case 'w': case 'x': case 'y': case 'z':
582           /* These characters don't cause problems, no matter what the
583              quoting style is.  They cannot start multibyte sequences.
584              A digit or a special letter would cause trouble if it
585              appeared at the beginning of quote_string because we'd then
586              escape by prepending a backslash.  However, it's hard to
587              imagine any locale that would use digits or letters as
588              quotes, and set_custom_quoting is documented not to accept
589              them.  Also, a digit or a special letter would cause
590              trouble if it appeared in quote_these_too, but that's also
591              documented as not accepting them.  */
592           c_and_shell_quote_compat = true;
593           break;
594 
595         default:
596           /* If we have a multibyte sequence, copy it until we reach
597              its end, find an error, or come back to the initial shift
598              state.  For C-like styles, if the sequence has
599              unprintable characters, escape the whole sequence, since
600              we can't easily escape single characters within it.  */
601           {
602             /* Length of multibyte sequence found so far.  */
603             size_t m;
604 
605             bool printable;
606 
607             if (unibyte_locale)
608               {
609                 m = 1;
610                 printable = isprint (c) != 0;
611               }
612             else
613               {
614                 mbstate_t mbstate;
615                 memset (&mbstate, 0, sizeof mbstate);
616 
617                 m = 0;
618                 printable = true;
619                 if (argsize == SIZE_MAX)
620                   argsize = strlen (arg);
621 
622                 do
623                   {
624                     wchar_t w;
625                     size_t bytes = mbrtowc (&w, &arg[i + m],
626                                             argsize - (i + m), &mbstate);
627                     if (bytes == 0)
628                       break;
629                     else if (bytes == (size_t) -1)
630                       {
631                         printable = false;
632                         break;
633                       }
634                     else if (bytes == (size_t) -2)
635                       {
636                         printable = false;
637                         while (i + m < argsize && arg[i + m])
638                           m++;
639                         break;
640                       }
641                     else
642                       {
643                         /* Work around a bug with older shells that "see" a '\'
644                            that is really the 2nd byte of a multibyte character.
645                            In practice the problem is limited to ASCII
646                            chars >= '@' that are shell special chars.  */
647                         if ('[' == 0x5b && elide_outer_quotes
648                             && quoting_style == shell_always_quoting_style)
649                           {
650                             size_t j;
651                             for (j = 1; j < bytes; j++)
652                               switch (arg[i + m + j])
653                                 {
654                                 case '[': case '\\': case '^':
655                                 case '`': case '|':
656                                   goto force_outer_quoting_style;
657 
658                                 default:
659                                   break;
660                                 }
661                           }
662 
663                         if (! iswprint (w))
664                           printable = false;
665                         m += bytes;
666                       }
667                   }
668                 while (! mbsinit (&mbstate));
669               }
670 
671             c_and_shell_quote_compat = printable;
672 
673             if (1 < m || (backslash_escapes && ! printable))
674               {
675                 /* Output a multibyte sequence, or an escaped
676                    unprintable unibyte character.  */
677                 size_t ilim = i + m;
678 
679                 for (;;)
680                   {
681                     if (backslash_escapes && ! printable)
682                       {
683                         START_ESC ();
684                         STORE ('0' + (c >> 6));
685                         STORE ('0' + ((c >> 3) & 7));
686                         c = '0' + (c & 7);
687                       }
688                     else if (is_right_quote)
689                       {
690                         STORE ('\\');
691                         is_right_quote = false;
692                       }
693                     if (ilim <= i + 1)
694                       break;
695                     END_ESC ();
696                     STORE (c);
697                     c = arg[++i];
698                   }
699 
700                 goto store_c;
701               }
702           }
703         }
704 
705       if (! (((backslash_escapes && quoting_style != shell_always_quoting_style)
706               || elide_outer_quotes)
707              && quote_these_too
708              && quote_these_too[c / INT_BITS] >> (c % INT_BITS) & 1)
709           && !is_right_quote)
710         goto store_c;
711 
712     store_escape:
713       START_ESC ();
714 
715     store_c:
716       END_ESC ();
717       STORE (c);
718 
719       if (! c_and_shell_quote_compat)
720         all_c_and_shell_quote_compat = false;
721     }
722 
723   if (len == 0 && quoting_style == shell_always_quoting_style
724       && elide_outer_quotes)
725     goto force_outer_quoting_style;
726 
727   /* Single shell quotes (') are commonly enough used as an apostrophe,
728      that we attempt to minimize the quoting in this case.  Note itʼs
729      better to use the apostrophe modifier "\u02BC" if possible, as that
730      renders better and works with the word match regex \W+ etc.  */
731   if (quoting_style == shell_always_quoting_style && ! elide_outer_quotes
732       && encountered_single_quote)
733     {
734       if (all_c_and_shell_quote_compat)
735         return quotearg_buffer_restyled (buffer, orig_buffersize, arg, argsize,
736                                          c_quoting_style,
737                                          flags, quote_these_too,
738                                          left_quote, right_quote);
739       else if (! buffersize && orig_buffersize)
740         {
741           /* Disable read-only scan, and reprocess to write quoted string.  */
742           buffersize = orig_buffersize;
743           len = 0;
744           goto process_input;
745         }
746     }
747 
748   if (quote_string && !elide_outer_quotes)
749     for (; *quote_string; quote_string++)
750       STORE (*quote_string);
751 
752   if (len < buffersize)
753     buffer[len] = '\0';
754   return len;
755 
756  force_outer_quoting_style:
757   /* Don't reuse quote_these_too, since the addition of outer quotes
758      sufficiently quotes the specified characters.  */
759   if (quoting_style == shell_always_quoting_style && backslash_escapes)
760     quoting_style = shell_escape_always_quoting_style;
761   return quotearg_buffer_restyled (buffer, buffersize, arg, argsize,
762                                    quoting_style,
763                                    flags & ~QA_ELIDE_OUTER_QUOTES, NULL,
764                                    left_quote, right_quote);
765 }
766 
767 /* Place into buffer BUFFER (of size BUFFERSIZE) a quoted version of
768    argument ARG (of size ARGSIZE), using O to control quoting.
769    If O is null, use the default.
770    Terminate the output with a null character, and return the written
771    size of the output, not counting the terminating null.
772    If BUFFERSIZE is too small to store the output string, return the
773    value that would have been returned had BUFFERSIZE been large enough.
774    If ARGSIZE is SIZE_MAX, use the string length of the argument for
775    ARGSIZE.  */
776 size_t
quotearg_buffer(char * buffer,size_t buffersize,char const * arg,size_t argsize,struct quoting_options const * o)777 quotearg_buffer (char *buffer, size_t buffersize,
778                  char const *arg, size_t argsize,
779                  struct quoting_options const *o)
780 {
781   struct quoting_options const *p = o ? o : &default_quoting_options;
782   int e = errno;
783   size_t r = quotearg_buffer_restyled (buffer, buffersize, arg, argsize,
784                                        p->style, p->flags, p->quote_these_too,
785                                        p->left_quote, p->right_quote);
786   errno = e;
787   return r;
788 }
789 
790 char *
quotearg_alloc(char const * arg,size_t argsize,struct quoting_options const * o)791 quotearg_alloc (char const *arg, size_t argsize,
792                 struct quoting_options const *o)
793 {
794   return quotearg_alloc_mem (arg, argsize, NULL, o);
795 }
796 
797 /* Like quotearg_buffer (..., ARG, ARGSIZE, O), except return newly
798    allocated storage containing the quoted string, and store the
799    resulting size into *SIZE, if non-NULL.  The result can contain
800    embedded null bytes only if ARGSIZE is not SIZE_MAX, SIZE is not
801    NULL, and set_quoting_flags has not set the null byte elision
802    flag.  */
803 char *
quotearg_alloc_mem(char const * arg,size_t argsize,size_t * size,struct quoting_options const * o)804 quotearg_alloc_mem (char const *arg, size_t argsize, size_t *size,
805                     struct quoting_options const *o)
806 {
807   struct quoting_options const *p = o ? o : &default_quoting_options;
808   int e = errno;
809   /* Elide embedded null bytes if we can't return a size.  */
810   int flags = p->flags | (size ? 0 : QA_ELIDE_NULL_BYTES);
811   size_t bufsize = quotearg_buffer_restyled (0, 0, arg, argsize, p->style,
812                                              flags, p->quote_these_too,
813                                              p->left_quote,
814                                              p->right_quote) + 1;
815   char *buf = xcharalloc (bufsize);
816   quotearg_buffer_restyled (buf, bufsize, arg, argsize, p->style, flags,
817                             p->quote_these_too,
818                             p->left_quote, p->right_quote);
819   errno = e;
820   if (size)
821     *size = bufsize - 1;
822   return buf;
823 }
824 
825 /* A storage slot with size and pointer to a value.  */
826 struct slotvec
827 {
828   size_t size;
829   char *val;
830 };
831 
832 /* Preallocate a slot 0 buffer, so that the caller can always quote
833    one small component of a "memory exhausted" message in slot 0.  */
834 static char slot0[256];
835 static int nslots = 1;
836 static struct slotvec slotvec0 = {sizeof slot0, slot0};
837 static struct slotvec *slotvec = &slotvec0;
838 
839 void
quotearg_free(void)840 quotearg_free (void)
841 {
842   struct slotvec *sv = slotvec;
843   int i;
844   for (i = 1; i < nslots; i++)
845     free (sv[i].val);
846   if (sv[0].val != slot0)
847     {
848       free (sv[0].val);
849       slotvec0.size = sizeof slot0;
850       slotvec0.val = slot0;
851     }
852   if (sv != &slotvec0)
853     {
854       free (sv);
855       slotvec = &slotvec0;
856     }
857   nslots = 1;
858 }
859 
860 /* Use storage slot N to return a quoted version of argument ARG.
861    ARG is of size ARGSIZE, but if that is SIZE_MAX, ARG is a
862    null-terminated string.
863    OPTIONS specifies the quoting options.
864    The returned value points to static storage that can be
865    reused by the next call to this function with the same value of N.
866    N must be nonnegative; it is typically small, and must be
867    less than MIN (INT_MAX, IDX_MAX).  The type of N is signed
868    to allow for future extensions (using negative values).  */
869 static char *
quotearg_n_options(int n,char const * arg,size_t argsize,struct quoting_options const * options)870 quotearg_n_options (int n, char const *arg, size_t argsize,
871                     struct quoting_options const *options)
872 {
873   int e = errno;
874 
875   struct slotvec *sv = slotvec;
876 
877   int nslots_max = MIN (INT_MAX, IDX_MAX);
878   if (! (0 <= n && n < nslots_max))
879     abort ();
880 
881   if (nslots <= n)
882     {
883       bool preallocated = (sv == &slotvec0);
884       idx_t new_nslots = nslots;
885 
886       slotvec = sv = xpalloc (preallocated ? NULL : sv, &new_nslots,
887                               n - nslots + 1, nslots_max, sizeof *sv);
888       if (preallocated)
889         *sv = slotvec0;
890       memset (sv + nslots, 0, (new_nslots - nslots) * sizeof *sv);
891       nslots = new_nslots;
892     }
893 
894   {
895     size_t size = sv[n].size;
896     char *val = sv[n].val;
897     /* Elide embedded null bytes since we don't return a size.  */
898     int flags = options->flags | QA_ELIDE_NULL_BYTES;
899     size_t qsize = quotearg_buffer_restyled (val, size, arg, argsize,
900                                              options->style, flags,
901                                              options->quote_these_too,
902                                              options->left_quote,
903                                              options->right_quote);
904 
905     if (size <= qsize)
906       {
907         sv[n].size = size = qsize + 1;
908         if (val != slot0)
909           free (val);
910         sv[n].val = val = xcharalloc (size);
911         quotearg_buffer_restyled (val, size, arg, argsize, options->style,
912                                   flags, options->quote_these_too,
913                                   options->left_quote,
914                                   options->right_quote);
915       }
916 
917     errno = e;
918     return val;
919   }
920 }
921 
922 char *
quotearg_n(int n,char const * arg)923 quotearg_n (int n, char const *arg)
924 {
925   return quotearg_n_options (n, arg, SIZE_MAX, &default_quoting_options);
926 }
927 
928 char *
quotearg_n_mem(int n,char const * arg,size_t argsize)929 quotearg_n_mem (int n, char const *arg, size_t argsize)
930 {
931   return quotearg_n_options (n, arg, argsize, &default_quoting_options);
932 }
933 
934 char *
quotearg(char const * arg)935 quotearg (char const *arg)
936 {
937   return quotearg_n (0, arg);
938 }
939 
940 char *
quotearg_mem(char const * arg,size_t argsize)941 quotearg_mem (char const *arg, size_t argsize)
942 {
943   return quotearg_n_mem (0, arg, argsize);
944 }
945 
946 char *
quotearg_n_style(int n,enum quoting_style s,char const * arg)947 quotearg_n_style (int n, enum quoting_style s, char const *arg)
948 {
949   struct quoting_options const o = quoting_options_from_style (s);
950   return quotearg_n_options (n, arg, SIZE_MAX, &o);
951 }
952 
953 char *
quotearg_n_style_mem(int n,enum quoting_style s,char const * arg,size_t argsize)954 quotearg_n_style_mem (int n, enum quoting_style s,
955                       char const *arg, size_t argsize)
956 {
957   struct quoting_options const o = quoting_options_from_style (s);
958   return quotearg_n_options (n, arg, argsize, &o);
959 }
960 
961 char *
quotearg_style(enum quoting_style s,char const * arg)962 quotearg_style (enum quoting_style s, char const *arg)
963 {
964   return quotearg_n_style (0, s, arg);
965 }
966 
967 char *
quotearg_style_mem(enum quoting_style s,char const * arg,size_t argsize)968 quotearg_style_mem (enum quoting_style s, char const *arg, size_t argsize)
969 {
970   return quotearg_n_style_mem (0, s, arg, argsize);
971 }
972 
973 char *
quotearg_char_mem(char const * arg,size_t argsize,char ch)974 quotearg_char_mem (char const *arg, size_t argsize, char ch)
975 {
976   struct quoting_options options;
977   options = default_quoting_options;
978   set_char_quoting (&options, ch, 1);
979   return quotearg_n_options (0, arg, argsize, &options);
980 }
981 
982 char *
quotearg_char(char const * arg,char ch)983 quotearg_char (char const *arg, char ch)
984 {
985   return quotearg_char_mem (arg, SIZE_MAX, ch);
986 }
987 
988 char *
quotearg_colon(char const * arg)989 quotearg_colon (char const *arg)
990 {
991   return quotearg_char (arg, ':');
992 }
993 
994 char *
quotearg_colon_mem(char const * arg,size_t argsize)995 quotearg_colon_mem (char const *arg, size_t argsize)
996 {
997   return quotearg_char_mem (arg, argsize, ':');
998 }
999 
1000 char *
quotearg_n_style_colon(int n,enum quoting_style s,char const * arg)1001 quotearg_n_style_colon (int n, enum quoting_style s, char const *arg)
1002 {
1003   struct quoting_options options;
1004   options = quoting_options_from_style (s);
1005   set_char_quoting (&options, ':', 1);
1006   return quotearg_n_options (n, arg, SIZE_MAX, &options);
1007 }
1008 
1009 char *
quotearg_n_custom(int n,char const * left_quote,char const * right_quote,char const * arg)1010 quotearg_n_custom (int n, char const *left_quote,
1011                    char const *right_quote, char const *arg)
1012 {
1013   return quotearg_n_custom_mem (n, left_quote, right_quote, arg,
1014                                 SIZE_MAX);
1015 }
1016 
1017 char *
quotearg_n_custom_mem(int n,char const * left_quote,char const * right_quote,char const * arg,size_t argsize)1018 quotearg_n_custom_mem (int n, char const *left_quote,
1019                        char const *right_quote,
1020                        char const *arg, size_t argsize)
1021 {
1022   struct quoting_options o = default_quoting_options;
1023   set_custom_quoting (&o, left_quote, right_quote);
1024   return quotearg_n_options (n, arg, argsize, &o);
1025 }
1026 
1027 char *
quotearg_custom(char const * left_quote,char const * right_quote,char const * arg)1028 quotearg_custom (char const *left_quote, char const *right_quote,
1029                  char const *arg)
1030 {
1031   return quotearg_n_custom (0, left_quote, right_quote, arg);
1032 }
1033 
1034 char *
quotearg_custom_mem(char const * left_quote,char const * right_quote,char const * arg,size_t argsize)1035 quotearg_custom_mem (char const *left_quote, char const *right_quote,
1036                      char const *arg, size_t argsize)
1037 {
1038   return quotearg_n_custom_mem (0, left_quote, right_quote, arg,
1039                                 argsize);
1040 }
1041 
1042 
1043 /* The quoting option used by the functions of quote.h.  */
1044 struct quoting_options quote_quoting_options =
1045   {
1046     locale_quoting_style,
1047     0,
1048     { 0 },
1049     NULL, NULL
1050   };
1051 
1052 char const *
quote_n_mem(int n,char const * arg,size_t argsize)1053 quote_n_mem (int n, char const *arg, size_t argsize)
1054 {
1055   return quotearg_n_options (n, arg, argsize, &quote_quoting_options);
1056 }
1057 
1058 char const *
quote_mem(char const * arg,size_t argsize)1059 quote_mem (char const *arg, size_t argsize)
1060 {
1061   return quote_n_mem (0, arg, argsize);
1062 }
1063 
1064 char const *
quote_n(int n,char const * arg)1065 quote_n (int n, char const *arg)
1066 {
1067   return quote_n_mem (n, arg, SIZE_MAX);
1068 }
1069 
1070 char const *
quote(char const * arg)1071 quote (char const *arg)
1072 {
1073   return quote_n (0, arg);
1074 }
1075 
1076 /*
1077  * Hey Emacs!
1078  * Local Variables:
1079  * coding: utf-8
1080  * End:
1081  */
1082