xref: /qemu/util/keyval.c (revision f9734d5d)
1 /*
2  * Parsing KEY=VALUE,... strings
3  *
4  * Copyright (C) 2017 Red Hat Inc.
5  *
6  * Authors:
7  *  Markus Armbruster <armbru@redhat.com>,
8  *
9  * This work is licensed under the terms of the GNU GPL, version 2 or later.
10  * See the COPYING file in the top-level directory.
11  */
12 
13 /*
14  * KEY=VALUE,... syntax:
15  *
16  *   key-vals     = [ key-val { ',' key-val } [ ',' ] ]
17  *   key-val      = key '=' val | help
18  *   key          = key-fragment { '.' key-fragment }
19  *   key-fragment = / [^=,.]+ /
20  *   val          = { / [^,]+ / | ',,' }
21  *   help         = 'help' | '?'
22  *
23  * Semantics defined by reduction to JSON:
24  *
25  *   key-vals specifies a JSON object, i.e. a tree whose root is an
26  *   object, inner nodes other than the root are objects or arrays,
27  *   and leaves are strings.
28  *
29  *   Each key-val = key-fragment '.' ... '=' val specifies a path from
30  *   root to a leaf (left of '='), and the leaf's value (right of
31  *   '=').
32  *
33  *   A path from the root is defined recursively:
34  *       L '.' key-fragment is a child of the node denoted by path L
35  *       key-fragment is a child of the tree root
36  *   If key-fragment is numeric, the parent is an array and the child
37  *   is its key-fragment-th member, counting from zero.
38  *   Else, the parent is an object, and the child is its member named
39  *   key-fragment.
40  *
41  *   This constrains inner nodes to be either array or object.  The
42  *   constraints must be satisfiable.  Counter-example: a.b=1,a=2 is
43  *   not, because root.a must be an object to satisfy a.b=1 and a
44  *   string to satisfy a=2.
45  *
46  *   Array subscripts can occur in any order, but the set of
47  *   subscripts must not have gaps.  For instance, a.1=v is not okay,
48  *   because root.a[0] is missing.
49  *
50  *   If multiple key-val denote the same leaf, the last one determines
51  *   the value.
52  *
53  * Key-fragments must be valid QAPI names or consist only of decimal
54  * digits.
55  *
56  * The length of any key-fragment must be between 1 and 127.
57  *
58  * If any key-val is help, the object is to be treated as a help
59  * request.
60  *
61  * Design flaw: there is no way to denote an empty array or non-root
62  * object.  While interpreting "key absent" as empty seems natural
63  * (removing a key-val from the input string removes the member when
64  * there are more, so why not when it's the last), it doesn't work:
65  * "key absent" already means "optional object/array absent", which
66  * isn't the same as "empty object/array present".
67  *
68  * Design flaw: scalar values can only be strings; there is no way to
69  * denote numbers, true, false or null.  The special QObject input
70  * visitor returned by qobject_input_visitor_new_keyval() mostly hides
71  * this by automatically converting strings to the type the visitor
72  * expects.  Breaks down for type 'any', where the visitor's
73  * expectation isn't clear.  Code visiting 'any' needs to do the
74  * conversion itself, but only when using this keyval visitor.
75  * Awkward.  Note that we carefully restrict alternate types to avoid
76  * similar ambiguity.
77  *
78  * Alternative syntax for use with an implied key:
79  *
80  *   key-vals     = [ key-val-1st { ',' key-val } [ ',' ] ]
81  *   key-val-1st  = val-no-key | key-val
82  *   val-no-key   = / [^=,]+ / - help
83  *
84  * where val-no-key is syntactic sugar for implied-key=val-no-key.
85  *
86  * Note that you can't use the sugared form when the value contains
87  * '=' or ','.
88  */
89 
90 #include "qemu/osdep.h"
91 #include "qapi/error.h"
92 #include "qapi/qmp/qdict.h"
93 #include "qapi/qmp/qlist.h"
94 #include "qapi/qmp/qstring.h"
95 #include "qemu/cutils.h"
96 #include "qemu/help_option.h"
97 #include "qemu/option.h"
98 
99 /*
100  * Convert @key to a list index.
101  * Convert all leading decimal digits to a (non-negative) number,
102  * capped at INT_MAX.
103  * If @end is non-null, assign a pointer to the first character after
104  * the number to *@end.
105  * Else, fail if any characters follow.
106  * On success, return the converted number.
107  * On failure, return a negative value.
108  * Note: since only digits are converted, no two keys can map to the
109  * same number, except by overflow to INT_MAX.
110  */
111 static int key_to_index(const char *key, const char **end)
112 {
113     int ret;
114     unsigned long index;
115 
116     if (*key < '0' || *key > '9') {
117         return -EINVAL;
118     }
119     ret = qemu_strtoul(key, end, 10, &index);
120     if (ret) {
121         return ret == -ERANGE ? INT_MAX : ret;
122     }
123     return index <= INT_MAX ? index : INT_MAX;
124 }
125 
126 /*
127  * Ensure @cur maps @key_in_cur the right way.
128  * If @value is null, it needs to map to a QDict, else to this
129  * QString.
130  * If @cur doesn't have @key_in_cur, put an empty QDict or @value,
131  * respectively.
132  * Else, if it needs to map to a QDict, and already does, do nothing.
133  * Else, if it needs to map to this QString, and already maps to a
134  * QString, replace it by @value.
135  * Else, fail because we have conflicting needs on how to map
136  * @key_in_cur.
137  * In any case, take over the reference to @value, i.e. if the caller
138  * wants to hold on to a reference, it needs to qobject_ref().
139  * Use @key up to @key_cursor to identify the key in error messages.
140  * On success, return the mapped value.
141  * On failure, store an error through @errp and return NULL.
142  */
143 static QObject *keyval_parse_put(QDict *cur,
144                                  const char *key_in_cur, QString *value,
145                                  const char *key, const char *key_cursor,
146                                  Error **errp)
147 {
148     QObject *old, *new;
149 
150     old = qdict_get(cur, key_in_cur);
151     if (old) {
152         if (qobject_type(old) != (value ? QTYPE_QSTRING : QTYPE_QDICT)) {
153             error_setg(errp, "Parameters '%.*s.*' used inconsistently",
154                        (int)(key_cursor - key), key);
155             qobject_unref(value);
156             return NULL;
157         }
158         if (!value) {
159             return old;         /* already QDict, do nothing */
160         }
161         new = QOBJECT(value);   /* replacement */
162     } else {
163         new = value ? QOBJECT(value) : QOBJECT(qdict_new());
164     }
165     qdict_put_obj(cur, key_in_cur, new);
166     return new;
167 }
168 
169 /*
170  * Parse one parameter from @params.
171  *
172  * If we're looking at KEY=VALUE, store result in @qdict.
173  * The first fragment of KEY applies to @qdict.  Subsequent fragments
174  * apply to nested QDicts, which are created on demand.  @implied_key
175  * is as in keyval_parse().
176  *
177  * If we're looking at "help" or "?", set *help to true.
178  *
179  * On success, return a pointer to the next parameter, or else to '\0'.
180  * On failure, return NULL.
181  */
182 static const char *keyval_parse_one(QDict *qdict, const char *params,
183                                     const char *implied_key, bool *help,
184                                     Error **errp)
185 {
186     const char *key, *key_end, *val_end, *s, *end;
187     size_t len;
188     char key_in_cur[128];
189     QDict *cur;
190     int ret;
191     QObject *next;
192     GString *val;
193 
194     key = params;
195     val_end = NULL;
196     len = strcspn(params, "=,");
197     if (len && key[len] != '=') {
198         if (starts_with_help_option(key) == len) {
199             *help = true;
200             s = key + len;
201             if (*s == ',') {
202                 s++;
203             }
204             return s;
205         }
206         if (implied_key) {
207             /* Desugar implied key */
208             key = implied_key;
209             val_end = params + len;
210             len = strlen(implied_key);
211         }
212     }
213     key_end = key + len;
214 
215     /*
216      * Loop over key fragments: @s points to current fragment, it
217      * applies to @cur.  @key_in_cur[] holds the previous fragment.
218      */
219     cur = qdict;
220     s = key;
221     for (;;) {
222         /* Want a key index (unless it's first) or a QAPI name */
223         if (s != key && key_to_index(s, &end) >= 0) {
224             len = end - s;
225         } else {
226             ret = parse_qapi_name(s, false);
227             len = ret < 0 ? 0 : ret;
228         }
229         assert(s + len <= key_end);
230         if (!len || (s + len < key_end && s[len] != '.')) {
231             assert(key != implied_key);
232             error_setg(errp, "Invalid parameter '%.*s'",
233                        (int)(key_end - key), key);
234             return NULL;
235         }
236         if (len >= sizeof(key_in_cur)) {
237             assert(key != implied_key);
238             error_setg(errp, "Parameter%s '%.*s' is too long",
239                        s != key || s + len != key_end ? " fragment" : "",
240                        (int)len, s);
241             return NULL;
242         }
243 
244         if (s != key) {
245             next = keyval_parse_put(cur, key_in_cur, NULL,
246                                     key, s - 1, errp);
247             if (!next) {
248                 return NULL;
249             }
250             cur = qobject_to(QDict, next);
251             assert(cur);
252         }
253 
254         memcpy(key_in_cur, s, len);
255         key_in_cur[len] = 0;
256         s += len;
257 
258         if (*s != '.') {
259             break;
260         }
261         s++;
262     }
263 
264     if (key == implied_key) {
265         assert(!*s);
266         val = g_string_new_len(params, val_end - params);
267         s = val_end;
268         if (*s == ',') {
269             s++;
270         }
271     } else {
272         if (*s != '=') {
273             error_setg(errp, "Expected '=' after parameter '%.*s'",
274                        (int)(s - key), key);
275             return NULL;
276         }
277         s++;
278 
279         val = g_string_new(NULL);
280         for (;;) {
281             if (!*s) {
282                 break;
283             } else if (*s == ',') {
284                 s++;
285                 if (*s != ',') {
286                     break;
287                 }
288             }
289             g_string_append_c(val, *s++);
290         }
291     }
292 
293     if (!keyval_parse_put(cur, key_in_cur, qstring_from_gstring(val),
294                           key, key_end, errp)) {
295         return NULL;
296     }
297     return s;
298 }
299 
300 static char *reassemble_key(GSList *key)
301 {
302     GString *s = g_string_new("");
303     GSList *p;
304 
305     for (p = key; p; p = p->next) {
306         g_string_prepend_c(s, '.');
307         g_string_prepend(s, (char *)p->data);
308     }
309 
310     return g_string_free(s, FALSE);
311 }
312 
313 /*
314  * Recursive worker for keyval_merge.
315  *
316  * @str is the path that led to the * current dictionary (to be used for
317  * error messages).  It is modified internally but restored before the
318  * function returns.
319  */
320 static void keyval_do_merge(QDict *dest, const QDict *merged, GString *str, Error **errp)
321 {
322     size_t save_len = str->len;
323     const QDictEntry *ent;
324     QObject *old_value;
325 
326     for (ent = qdict_first(merged); ent; ent = qdict_next(merged, ent)) {
327         old_value = qdict_get(dest, ent->key);
328         if (old_value) {
329             if (qobject_type(old_value) != qobject_type(ent->value)) {
330                 error_setg(errp, "Parameter '%s%s' used inconsistently",
331                            str->str, ent->key);
332                 return;
333             } else if (qobject_type(ent->value) == QTYPE_QDICT) {
334                 /* Merge sub-dictionaries.  */
335                 g_string_append(str, ent->key);
336                 g_string_append_c(str, '.');
337                 keyval_do_merge(qobject_to(QDict, old_value),
338                                 qobject_to(QDict, ent->value),
339                                 str, errp);
340                 g_string_truncate(str, save_len);
341                 continue;
342             } else if (qobject_type(ent->value) == QTYPE_QLIST) {
343                 /* Append to old list.  */
344                 QList *old = qobject_to(QList, old_value);
345                 QList *new = qobject_to(QList, ent->value);
346                 const QListEntry *item;
347                 QLIST_FOREACH_ENTRY(new, item) {
348                     qobject_ref(item->value);
349                     qlist_append_obj(old, item->value);
350                 }
351                 continue;
352             } else {
353                 assert(qobject_type(ent->value) == QTYPE_QSTRING);
354             }
355         }
356 
357         qobject_ref(ent->value);
358         qdict_put_obj(dest, ent->key, ent->value);
359     }
360 }
361 
362 /* Merge the @merged dictionary into @dest.
363  *
364  * The dictionaries are expected to be returned by the keyval parser, and
365  * therefore the only expected scalar type is the string.  In case the same
366  * path is present in both @dest and @merged, the semantics are as follows:
367  *
368  * - lists are concatenated
369  *
370  * - dictionaries are merged recursively
371  *
372  * - for scalar values, @merged wins
373  *
374  * In case an error is reported, @dest may already have been modified.
375  *
376  * This function can be used to implement semantics analogous to QemuOpts's
377  * .merge_lists = true case, or to implement -set for options backed by QDicts.
378  *
379  * Note: while QemuOpts is commonly used so that repeated keys overwrite
380  * ("last one wins"), it can also be used so that repeated keys build up
381  * a list. keyval_merge() can only be used when the options' semantics are
382  * the former, not the latter.
383  */
384 void keyval_merge(QDict *dest, const QDict *merged, Error **errp)
385 {
386     GString *str;
387 
388     str = g_string_new("");
389     keyval_do_merge(dest, merged, str, errp);
390     g_string_free(str, TRUE);
391 }
392 
393 /*
394  * Listify @cur recursively.
395  * Replace QDicts whose keys are all valid list indexes by QLists.
396  * @key_of_cur is the list of key fragments leading up to @cur.
397  * On success, return either @cur or its replacement.
398  * On failure, store an error through @errp and return NULL.
399  */
400 static QObject *keyval_listify(QDict *cur, GSList *key_of_cur, Error **errp)
401 {
402     GSList key_node;
403     bool has_index, has_member;
404     const QDictEntry *ent;
405     QDict *qdict;
406     QObject *val;
407     char *key;
408     size_t nelt;
409     QObject **elt;
410     int index, max_index, i;
411     QList *list;
412 
413     key_node.next = key_of_cur;
414 
415     /*
416      * Recursively listify @cur's members, and figure out whether @cur
417      * itself is to be listified.
418      */
419     has_index = false;
420     has_member = false;
421     for (ent = qdict_first(cur); ent; ent = qdict_next(cur, ent)) {
422         if (key_to_index(ent->key, NULL) >= 0) {
423             has_index = true;
424         } else {
425             has_member = true;
426         }
427 
428         qdict = qobject_to(QDict, ent->value);
429         if (!qdict) {
430             continue;
431         }
432 
433         key_node.data = ent->key;
434         val = keyval_listify(qdict, &key_node, errp);
435         if (!val) {
436             return NULL;
437         }
438         if (val != ent->value) {
439             qdict_put_obj(cur, ent->key, val);
440         }
441     }
442 
443     if (has_index && has_member) {
444         key = reassemble_key(key_of_cur);
445         error_setg(errp, "Parameters '%s*' used inconsistently", key);
446         g_free(key);
447         return NULL;
448     }
449     if (!has_index) {
450         return QOBJECT(cur);
451     }
452 
453     /* Copy @cur's values to @elt[] */
454     nelt = qdict_size(cur) + 1; /* one extra, for use as sentinel */
455     elt = g_new0(QObject *, nelt);
456     max_index = -1;
457     for (ent = qdict_first(cur); ent; ent = qdict_next(cur, ent)) {
458         index = key_to_index(ent->key, NULL);
459         assert(index >= 0);
460         if (index > max_index) {
461             max_index = index;
462         }
463         /*
464          * We iterate @nelt times.  If we get one exceeding @nelt
465          * here, we will put less than @nelt values into @elt[],
466          * triggering the error in the next loop.
467          */
468         if ((size_t)index >= nelt - 1) {
469             continue;
470         }
471         /* Even though dict keys are distinct, indexes need not be */
472         elt[index] = ent->value;
473     }
474 
475     /*
476      * Make a list from @elt[], reporting the first missing element,
477      * if any.
478      * If we dropped an index >= nelt in the previous loop, this loop
479      * will run into the sentinel and report index @nelt missing.
480      */
481     list = qlist_new();
482     assert(!elt[nelt-1]);       /* need the sentinel to be null */
483     for (i = 0; i < MIN(nelt, max_index + 1); i++) {
484         if (!elt[i]) {
485             key = reassemble_key(key_of_cur);
486             error_setg(errp, "Parameter '%s%d' missing", key, i);
487             g_free(key);
488             g_free(elt);
489             qobject_unref(list);
490             return NULL;
491         }
492         qobject_ref(elt[i]);
493         qlist_append_obj(list, elt[i]);
494     }
495 
496     g_free(elt);
497     return QOBJECT(list);
498 }
499 
500 /*
501  * Parse @params in QEMU's traditional KEY=VALUE,... syntax.
502  *
503  * If @implied_key, the first KEY= can be omitted.  @implied_key is
504  * implied then, and VALUE can't be empty or contain ',' or '='.
505  *
506  * A parameter "help" or "?" without a value isn't added to the
507  * resulting dictionary, but instead is interpreted as help request.
508  * All other options are parsed and returned normally so that context
509  * specific help can be printed.
510  *
511  * If @p_help is not NULL, store whether help is requested there.
512  * If @p_help is NULL and help is requested, fail.
513  *
514  * On success, return @dict, now filled with the parsed keys and values.
515  *
516  * On failure, store an error through @errp and return NULL.  Any keys
517  * and values parsed so far will be in @dict nevertheless.
518  */
519 QDict *keyval_parse_into(QDict *qdict, const char *params, const char *implied_key,
520                          bool *p_help, Error **errp)
521 {
522     QObject *listified;
523     const char *s;
524     bool help = false;
525 
526     s = params;
527     while (*s) {
528         s = keyval_parse_one(qdict, s, implied_key, &help, errp);
529         if (!s) {
530             return NULL;
531         }
532         implied_key = NULL;
533     }
534 
535     if (p_help) {
536         *p_help = help;
537     } else if (help) {
538         error_setg(errp, "Help is not available for this option");
539         return NULL;
540     }
541 
542     listified = keyval_listify(qdict, NULL, errp);
543     if (!listified) {
544         return NULL;
545     }
546     assert(listified == QOBJECT(qdict));
547     return qdict;
548 }
549 
550 /*
551  * Parse @params in QEMU's traditional KEY=VALUE,... syntax.
552  *
553  * If @implied_key, the first KEY= can be omitted.  @implied_key is
554  * implied then, and VALUE can't be empty or contain ',' or '='.
555  *
556  * A parameter "help" or "?" without a value isn't added to the
557  * resulting dictionary, but instead is interpreted as help request.
558  * All other options are parsed and returned normally so that context
559  * specific help can be printed.
560  *
561  * If @p_help is not NULL, store whether help is requested there.
562  * If @p_help is NULL and help is requested, fail.
563  *
564  * On success, return a dictionary of the parsed keys and values.
565  * On failure, store an error through @errp and return NULL.
566  */
567 QDict *keyval_parse(const char *params, const char *implied_key,
568                     bool *p_help, Error **errp)
569 {
570     QDict *qdict = qdict_new();
571     QDict *ret = keyval_parse_into(qdict, params, implied_key, p_help, errp);
572 
573     if (!ret) {
574         qobject_unref(qdict);
575     }
576     return ret;
577 }
578