1 /* CPP Library.
2    Copyright (C) 1986-2018 Free Software Foundation, Inc.
3    Contributed by Per Bothner, 1994-95.
4    Based on CCCP program by Paul Rubin, June 1986
5    Adapted to ANSI C, Richard Stallman, Jan 1987
6 
7 This program is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published by the
9 Free Software Foundation; either version 3, or (at your option) any
10 later version.
11 
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 GNU General Public License for more details.
16 
17 You should have received a copy of the GNU General Public License
18 along with this program; see the file COPYING3.  If not see
19 <http://www.gnu.org/licenses/>.  */
20 
21 #include "config.h"
22 #include "system.h"
23 #include "cpplib.h"
24 #include "internal.h"
25 #include "mkdeps.h"
26 #include "localedir.h"
27 #include "filenames.h"
28 
/* Default for the canonical_system_headers option set up by
   cpp_create_reader: 1 when HAVE_DOS_BASED_FILE_SYSTEM is defined,
   0 otherwise.  A value supplied by the build is left alone.  */
#if !defined (ENABLE_CANONICAL_SYSTEM_HEADERS)
# if defined (HAVE_DOS_BASED_FILE_SYSTEM)
#  define ENABLE_CANONICAL_SYSTEM_HEADERS 1
# else
#  define ENABLE_CANONICAL_SYSTEM_HEADERS 0
# endif
#endif
36 
37 static void init_library (void);
38 static void mark_named_operators (cpp_reader *, int);
39 static void read_original_filename (cpp_reader *);
40 static void read_original_directory (cpp_reader *);
41 static void post_options (cpp_reader *);
42 
43 /* If we have designated initializers (GCC >2.7) these tables can be
44    initialized, constant data.  Otherwise, they have to be filled in at
45    runtime.  */
46 #if HAVE_DESIGNATED_INITIALIZERS
47 
48 #define init_trigraph_map()  /* Nothing.  */
49 #define TRIGRAPH_MAP \
50 __extension__ const uchar _cpp_trigraph_map[UCHAR_MAX + 1] = {
51 
52 #define END };
53 #define s(p, v) [p] = v,
54 
55 #else
56 
57 #define TRIGRAPH_MAP uchar _cpp_trigraph_map[UCHAR_MAX + 1] = { 0 }; \
58  static void init_trigraph_map (void) { \
59  unsigned char *x = _cpp_trigraph_map;
60 
61 #define END }
62 #define s(p, v) x[p] = v;
63 
64 #endif
65 
66 TRIGRAPH_MAP
67   s('=', '#')	s(')', ']')	s('!', '|')
68   s('(', '[')	s('\'', '^')	s('>', '}')
69   s('/', '\\')	s('<', '{')	s('-', '~')
70 END
71 
72 #undef s
73 #undef END
74 #undef TRIGRAPH_MAP
75 
/* Per-language preprocessor feature switches.  Every member is a
   boolean (0 or 1) which cpp_set_lang copies into the reader option
   of the same name.  The member order matters: the rows of
   lang_defaults are positional initializers.  */
struct lang_flags
{
  char c99;
  char cplusplus;
  char extended_numbers;
  char extended_identifiers;
  char c11_identifiers;
  char std;
  char digraphs;
  char uliterals;
  char rliterals;
  char user_literals;
  char binary_constants;
  char digit_separators;
  char trigraphs;
  char utf8_char_literals;
  char va_opt;
};

/* Default switches for each source language.  cpp_set_lang indexes
   this table with the enum c_lang value cast to int, so rows must not
   be reordered; the trailing comment on each row is the language label
   it was written for.  Columns, left to right, are the members of
   struct lang_flags in declaration order:

     c99 c++ xnum xid c11 std digr ulit rlit udlit bincst digsep trig
     u8chlit vaopt  */
static const struct lang_flags lang_defaults[] =
{
  { 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1 },  /* GNUC89   */
  { 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1 },  /* GNUC99   */
  { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1 },  /* GNUC11   */
  { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1 },  /* GNUC17   */
  { 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0 },  /* STDC89   */
  { 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0 },  /* STDC94   */
  { 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0 },  /* STDC99   */
  { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0 },  /* STDC11   */
  { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0 },  /* STDC17   */
  { 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1 },  /* GNUCXX   */
  { 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0 },  /* CXX98    */
  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1 },  /* GNUCXX11 */
  { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0 },  /* CXX11    */
  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1 },  /* GNUCXX14 */
  { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0 },  /* CXX14    */
  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1 },  /* GNUCXX17 */
  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0 },  /* CXX17    */
  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1 },  /* GNUCXX2A */
  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1 },  /* CXX2A    */
  { 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }   /* ASM      */
};
120 
121 /* Sets internal flags correctly for a given language.  */
122 void
cpp_set_lang(cpp_reader * pfile,enum c_lang lang)123 cpp_set_lang (cpp_reader *pfile, enum c_lang lang)
124 {
125   const struct lang_flags *l = &lang_defaults[(int) lang];
126 
127   CPP_OPTION (pfile, lang) = lang;
128 
129   CPP_OPTION (pfile, c99)			 = l->c99;
130   CPP_OPTION (pfile, cplusplus)			 = l->cplusplus;
131   CPP_OPTION (pfile, extended_numbers)		 = l->extended_numbers;
132   CPP_OPTION (pfile, extended_identifiers)	 = l->extended_identifiers;
133   CPP_OPTION (pfile, c11_identifiers)		 = l->c11_identifiers;
134   CPP_OPTION (pfile, std)			 = l->std;
135   CPP_OPTION (pfile, digraphs)			 = l->digraphs;
136   CPP_OPTION (pfile, uliterals)			 = l->uliterals;
137   CPP_OPTION (pfile, rliterals)			 = l->rliterals;
138   CPP_OPTION (pfile, user_literals)		 = l->user_literals;
139   CPP_OPTION (pfile, binary_constants)		 = l->binary_constants;
140   CPP_OPTION (pfile, digit_separators)		 = l->digit_separators;
141   CPP_OPTION (pfile, trigraphs)			 = l->trigraphs;
142   CPP_OPTION (pfile, utf8_char_literals)	 = l->utf8_char_literals;
143   CPP_OPTION (pfile, va_opt)			 = l->va_opt;
144 }
145 
/* One-time setup of the library's global state.  The first call runs
   _cpp_init_lexer, fills in the trigraph map if that has to happen at
   run time and, with ENABLE_NLS, binds the message domain; later calls
   return immediately.  */
static void
init_library (void)
{
  static int initialized = 0;

  if (initialized)
    return;
  initialized = 1;

  _cpp_init_lexer ();

  /* Expands to nothing when the trigraph map could be initialized
     statically with designated initializers.  */
  init_trigraph_map ();

#ifdef ENABLE_NLS
  (void) bindtextdomain (PACKAGE, LOCALEDIR);
#endif
}
168 
169 /* Initialize a cpp_reader structure.  */
170 cpp_reader *
cpp_create_reader(enum c_lang lang,cpp_hash_table * table,struct line_maps * line_table)171 cpp_create_reader (enum c_lang lang, cpp_hash_table *table,
172 		   struct line_maps *line_table)
173 {
174   cpp_reader *pfile;
175 
176   /* Initialize this instance of the library if it hasn't been already.  */
177   init_library ();
178 
179   pfile = XCNEW (cpp_reader);
180   memset (&pfile->base_context, 0, sizeof (pfile->base_context));
181 
182   cpp_set_lang (pfile, lang);
183   CPP_OPTION (pfile, warn_multichar) = 1;
184   CPP_OPTION (pfile, discard_comments) = 1;
185   CPP_OPTION (pfile, discard_comments_in_macro_exp) = 1;
186   CPP_OPTION (pfile, tabstop) = 8;
187   CPP_OPTION (pfile, operator_names) = 1;
188   CPP_OPTION (pfile, warn_trigraphs) = 2;
189   CPP_OPTION (pfile, warn_endif_labels) = 1;
190   CPP_OPTION (pfile, cpp_warn_c90_c99_compat) = -1;
191   CPP_OPTION (pfile, cpp_warn_cxx11_compat) = 0;
192   CPP_OPTION (pfile, cpp_warn_deprecated) = 1;
193   CPP_OPTION (pfile, cpp_warn_long_long) = 0;
194   CPP_OPTION (pfile, dollars_in_ident) = 1;
195   CPP_OPTION (pfile, warn_dollars) = 1;
196   CPP_OPTION (pfile, warn_variadic_macros) = 1;
197   CPP_OPTION (pfile, warn_builtin_macro_redefined) = 1;
198   CPP_OPTION (pfile, cpp_warn_implicit_fallthrough) = 0;
199   /* By default, track locations of tokens resulting from macro
200      expansion.  The '2' means, track the locations with the highest
201      accuracy.  Read the comments for struct
202      cpp_options::track_macro_expansion to learn about the other
203      values.  */
204   CPP_OPTION (pfile, track_macro_expansion) = 2;
205   CPP_OPTION (pfile, warn_normalize) = normalized_C;
206   CPP_OPTION (pfile, warn_literal_suffix) = 1;
207   CPP_OPTION (pfile, canonical_system_headers)
208       = ENABLE_CANONICAL_SYSTEM_HEADERS;
209   CPP_OPTION (pfile, ext_numeric_literals) = 1;
210   CPP_OPTION (pfile, warn_date_time) = 0;
211 
212   /* Default CPP arithmetic to something sensible for the host for the
213      benefit of dumb users like fix-header.  */
214   CPP_OPTION (pfile, precision) = CHAR_BIT * sizeof (long);
215   CPP_OPTION (pfile, char_precision) = CHAR_BIT;
216   CPP_OPTION (pfile, wchar_precision) = CHAR_BIT * sizeof (int);
217   CPP_OPTION (pfile, int_precision) = CHAR_BIT * sizeof (int);
218   CPP_OPTION (pfile, unsigned_char) = 0;
219   CPP_OPTION (pfile, unsigned_wchar) = 1;
220   CPP_OPTION (pfile, bytes_big_endian) = 1;  /* does not matter */
221 
222   /* Default to no charset conversion.  */
223   CPP_OPTION (pfile, narrow_charset) = _cpp_default_encoding ();
224   CPP_OPTION (pfile, wide_charset) = 0;
225 
226   /* Default the input character set to UTF-8.  */
227   CPP_OPTION (pfile, input_charset) = _cpp_default_encoding ();
228 
229   /* A fake empty "directory" used as the starting point for files
230      looked up without a search path.  Name cannot be '/' because we
231      don't want to prepend anything at all to filenames using it.  All
232      other entries are correct zero-initialized.  */
233   pfile->no_search_path.name = (char *) "";
234 
235   /* Initialize the line map.  */
236   pfile->line_table = line_table;
237 
238   /* Initialize lexer state.  */
239   pfile->state.save_comments = ! CPP_OPTION (pfile, discard_comments);
240 
241   /* Set up static tokens.  */
242   pfile->avoid_paste.type = CPP_PADDING;
243   pfile->avoid_paste.val.source = NULL;
244   pfile->eof.type = CPP_EOF;
245   pfile->eof.flags = 0;
246 
247   /* Create a token buffer for the lexer.  */
248   _cpp_init_tokenrun (&pfile->base_run, 250);
249   pfile->cur_run = &pfile->base_run;
250   pfile->cur_token = pfile->base_run.base;
251 
252   /* Initialize the base context.  */
253   pfile->context = &pfile->base_context;
254   pfile->base_context.c.macro = 0;
255   pfile->base_context.prev = pfile->base_context.next = 0;
256 
257   /* Aligned and unaligned storage.  */
258   pfile->a_buff = _cpp_get_buff (pfile, 0);
259   pfile->u_buff = _cpp_get_buff (pfile, 0);
260 
261   /* Initialize table for push_macro/pop_macro.  */
262   pfile->pushed_macros = 0;
263 
264   /* Do not force token locations by default.  */
265   pfile->forced_token_location_p = NULL;
266 
267   /* Initialize source_date_epoch to -2 (not yet set).  */
268   pfile->source_date_epoch = (time_t) -2;
269 
270   /* The expression parser stack.  */
271   _cpp_expand_op_stack (pfile);
272 
273   /* Initialize the buffer obstack.  */
274   obstack_specify_allocation (&pfile->buffer_ob, 0, 0, xmalloc, free);
275 
276   _cpp_init_files (pfile);
277 
278   _cpp_init_hashtable (pfile, table);
279 
280   return pfile;
281 }
282 
283 /* Set the line_table entry in PFILE.  This is called after reading a
284    PCH file, as the old line_table will be incorrect.  */
285 void
cpp_set_line_map(cpp_reader * pfile,struct line_maps * line_table)286 cpp_set_line_map (cpp_reader *pfile, struct line_maps *line_table)
287 {
288   pfile->line_table = line_table;
289 }
290 
291 /* Free resources used by PFILE.  Accessing PFILE after this function
292    returns leads to undefined behavior.  Returns the error count.  */
293 void
cpp_destroy(cpp_reader * pfile)294 cpp_destroy (cpp_reader *pfile)
295 {
296   cpp_context *context, *contextn;
297   struct def_pragma_macro *pmacro;
298   tokenrun *run, *runn;
299   int i;
300 
301   free (pfile->op_stack);
302 
303   while (CPP_BUFFER (pfile) != NULL)
304     _cpp_pop_buffer (pfile);
305 
306   free (pfile->out.base);
307 
308   if (pfile->macro_buffer)
309     {
310       free (pfile->macro_buffer);
311       pfile->macro_buffer = NULL;
312       pfile->macro_buffer_len = 0;
313     }
314 
315   if (pfile->deps)
316     deps_free (pfile->deps);
317   obstack_free (&pfile->buffer_ob, 0);
318 
319   _cpp_destroy_hashtable (pfile);
320   _cpp_cleanup_files (pfile);
321   _cpp_destroy_iconv (pfile);
322 
323   _cpp_free_buff (pfile->a_buff);
324   _cpp_free_buff (pfile->u_buff);
325   _cpp_free_buff (pfile->free_buffs);
326 
327   for (run = &pfile->base_run; run; run = runn)
328     {
329       runn = run->next;
330       free (run->base);
331       if (run != &pfile->base_run)
332 	free (run);
333     }
334 
335   for (context = pfile->base_context.next; context; context = contextn)
336     {
337       contextn = context->next;
338       free (context);
339     }
340 
341   if (pfile->comments.entries)
342     {
343       for (i = 0; i < pfile->comments.count; i++)
344 	free (pfile->comments.entries[i].comment);
345 
346       free (pfile->comments.entries);
347     }
348   if (pfile->pushed_macros)
349     {
350       do
351 	{
352 	  pmacro = pfile->pushed_macros;
353 	  pfile->pushed_macros = pmacro->next;
354 	  free (pmacro->name);
355 	  free (pmacro);
356 	}
357       while (pfile->pushed_macros);
358     }
359 
360   free (pfile);
361 }
362 
363 /* This structure defines one built-in identifier.  A node will be
364    entered in the hash table under the name NAME, with value VALUE.
365 
366    There are two tables of these.  builtin_array holds all the
367    "builtin" macros: these are handled by builtin_macro() in
368    macro.c.  Builtin is somewhat of a misnomer -- the property of
369    interest is that these macros require special code to compute their
370    expansions.  The value is a "cpp_builtin_type" enumerator.
371 
372    operator_array holds the C++ named operators.  These are keywords
373    which act as aliases for punctuators.  In C++, they cannot be
374    altered through #define, and #if recognizes them as operators.  In
375    C, these are not entered into the hash table at all (but see
376    <iso646.h>).  The value is a token-type enumerator.  */
377 struct builtin_macro
378 {
379   const uchar *const name;
380   const unsigned short len;
381   const unsigned short value;
382   const bool always_warn_if_redefined;
383 };
384 
385 #define B(n, t, f)    { DSC(n), t, f }
386 static const struct builtin_macro builtin_array[] =
387 {
388   B("__TIMESTAMP__",	 BT_TIMESTAMP,     false),
389   B("__TIME__",		 BT_TIME,          false),
390   B("__DATE__",		 BT_DATE,          false),
391   B("__FILE__",		 BT_FILE,          false),
392   B("__BASE_FILE__",	 BT_BASE_FILE,     false),
393   B("__LINE__",		 BT_SPECLINE,      true),
394   B("__INCLUDE_LEVEL__", BT_INCLUDE_LEVEL, true),
395   B("__COUNTER__",	 BT_COUNTER,       true),
396   B("__has_attribute",	 BT_HAS_ATTRIBUTE, true),
397   B("__has_cpp_attribute", BT_HAS_ATTRIBUTE, true),
398   /* Keep builtins not used for -traditional-cpp at the end, and
399      update init_builtins() if any more are added.  */
400   B("_Pragma",		 BT_PRAGMA,        true),
401   B("__STDC__",		 BT_STDC,          true),
402 };
403 #undef B
404 
405 struct builtin_operator
406 {
407   const uchar *const name;
408   const unsigned short len;
409   const unsigned short value;
410 };
411 
412 #define B(n, t)    { DSC(n), t }
413 static const struct builtin_operator operator_array[] =
414 {
415   B("and",	CPP_AND_AND),
416   B("and_eq",	CPP_AND_EQ),
417   B("bitand",	CPP_AND),
418   B("bitor",	CPP_OR),
419   B("compl",	CPP_COMPL),
420   B("not",	CPP_NOT),
421   B("not_eq",	CPP_NOT_EQ),
422   B("or",	CPP_OR_OR),
423   B("or_eq",	CPP_OR_EQ),
424   B("xor",	CPP_XOR),
425   B("xor_eq",	CPP_XOR_EQ)
426 };
427 #undef B
428 
429 /* Mark the C++ named operators in the hash table.  */
430 static void
mark_named_operators(cpp_reader * pfile,int flags)431 mark_named_operators (cpp_reader *pfile, int flags)
432 {
433   const struct builtin_operator *b;
434 
435   for (b = operator_array;
436        b < (operator_array + ARRAY_SIZE (operator_array));
437        b++)
438     {
439       cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
440       hp->flags |= flags;
441       hp->is_directive = 0;
442       hp->directive_index = b->value;
443     }
444 }
445 
446 /* Helper function of cpp_type2name. Return the string associated with
447    named operator TYPE.  */
448 const char *
cpp_named_operator2name(enum cpp_ttype type)449 cpp_named_operator2name (enum cpp_ttype type)
450 {
451   const struct builtin_operator *b;
452 
453   for (b = operator_array;
454        b < (operator_array + ARRAY_SIZE (operator_array));
455        b++)
456     {
457       if (type == b->value)
458 	return (const char *) b->name;
459     }
460 
461   return NULL;
462 }
463 
464 void
cpp_init_special_builtins(cpp_reader * pfile)465 cpp_init_special_builtins (cpp_reader *pfile)
466 {
467   const struct builtin_macro *b;
468   size_t n = ARRAY_SIZE (builtin_array);
469 
470   if (CPP_OPTION (pfile, traditional))
471     n -= 2;
472   else if (! CPP_OPTION (pfile, stdc_0_in_system_headers)
473 	   || CPP_OPTION (pfile, std))
474     n--;
475 
476   for (b = builtin_array; b < builtin_array + n; b++)
477     {
478       if (b->value == BT_HAS_ATTRIBUTE
479 	  && (CPP_OPTION (pfile, lang) == CLK_ASM
480 	      || pfile->cb.has_attribute == NULL))
481 	continue;
482       cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
483       hp->type = NT_MACRO;
484       hp->flags |= NODE_BUILTIN;
485       if (b->always_warn_if_redefined)
486 	hp->flags |= NODE_WARN;
487       hp->value.builtin = (enum cpp_builtin_type) b->value;
488     }
489 }
490 
491 /* Restore macro C to builtin macro definition.  */
492 
493 void
_cpp_restore_special_builtin(cpp_reader * pfile,struct def_pragma_macro * c)494 _cpp_restore_special_builtin (cpp_reader *pfile, struct def_pragma_macro *c)
495 {
496   size_t len = strlen (c->name);
497 
498   for (const struct builtin_macro *b = builtin_array;
499        b < builtin_array + ARRAY_SIZE (builtin_array); b++)
500     if (b->len == len && memcmp (c->name, b->name, len + 1) == 0)
501       {
502 	cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
503 	hp->type = NT_MACRO;
504 	hp->flags |= NODE_BUILTIN;
505 	if (b->always_warn_if_redefined)
506 	  hp->flags |= NODE_WARN;
507 	hp->value.builtin = (enum cpp_builtin_type) b->value;
508       }
509 }
510 
511 /* Read the builtins table above and enter them, and language-specific
512    macros, into the hash table.  HOSTED is true if this is a hosted
513    environment.  */
514 void
cpp_init_builtins(cpp_reader * pfile,int hosted)515 cpp_init_builtins (cpp_reader *pfile, int hosted)
516 {
517   cpp_init_special_builtins (pfile);
518 
519   if (!CPP_OPTION (pfile, traditional)
520       && (! CPP_OPTION (pfile, stdc_0_in_system_headers)
521 	  || CPP_OPTION (pfile, std)))
522     _cpp_define_builtin (pfile, "__STDC__ 1");
523 
524   if (CPP_OPTION (pfile, cplusplus))
525     {
526       if (CPP_OPTION (pfile, lang) == CLK_CXX2A
527 	  || CPP_OPTION (pfile, lang) == CLK_GNUCXX2A)
528 	_cpp_define_builtin (pfile, "__cplusplus 201709L");
529       else if (CPP_OPTION (pfile, lang) == CLK_CXX17
530 	  || CPP_OPTION (pfile, lang) == CLK_GNUCXX17)
531 	_cpp_define_builtin (pfile, "__cplusplus 201703L");
532       else if (CPP_OPTION (pfile, lang) == CLK_CXX14
533 	  || CPP_OPTION (pfile, lang) == CLK_GNUCXX14)
534 	_cpp_define_builtin (pfile, "__cplusplus 201402L");
535       else if (CPP_OPTION (pfile, lang) == CLK_CXX11
536 	       || CPP_OPTION (pfile, lang) == CLK_GNUCXX11)
537 	_cpp_define_builtin (pfile, "__cplusplus 201103L");
538       else
539 	_cpp_define_builtin (pfile, "__cplusplus 199711L");
540     }
541   else if (CPP_OPTION (pfile, lang) == CLK_ASM)
542     _cpp_define_builtin (pfile, "__ASSEMBLER__ 1");
543   else if (CPP_OPTION (pfile, lang) == CLK_STDC94)
544     _cpp_define_builtin (pfile, "__STDC_VERSION__ 199409L");
545   else if (CPP_OPTION (pfile, lang) == CLK_STDC17
546 	   || CPP_OPTION (pfile, lang) == CLK_GNUC17)
547     _cpp_define_builtin (pfile, "__STDC_VERSION__ 201710L");
548   else if (CPP_OPTION (pfile, lang) == CLK_STDC11
549 	   || CPP_OPTION (pfile, lang) == CLK_GNUC11)
550     _cpp_define_builtin (pfile, "__STDC_VERSION__ 201112L");
551   else if (CPP_OPTION (pfile, c99))
552     _cpp_define_builtin (pfile, "__STDC_VERSION__ 199901L");
553 
554   if (CPP_OPTION (pfile, uliterals)
555       && !(CPP_OPTION (pfile, cplusplus)
556 	   && (CPP_OPTION (pfile, lang) == CLK_GNUCXX
557 	    || CPP_OPTION (pfile, lang) == CLK_CXX98)))
558     {
559       _cpp_define_builtin (pfile, "__STDC_UTF_16__ 1");
560       _cpp_define_builtin (pfile, "__STDC_UTF_32__ 1");
561     }
562 
563   if (hosted)
564     _cpp_define_builtin (pfile, "__STDC_HOSTED__ 1");
565   else
566     _cpp_define_builtin (pfile, "__STDC_HOSTED__ 0");
567 
568   if (CPP_OPTION (pfile, objc))
569     _cpp_define_builtin (pfile, "__OBJC__ 1");
570 }
571 
/* Check the assumptions cpplib makes about its own arithmetic and
   about the target type precisions.  The values checked depend on
   command-line options, so this runs from cpp_post_options.  Every
   violated assumption is reported at the CPP_DL_ICE level.  Without
   CHECKING_P a call expands to nothing.  */
#if CHECKING_P
static void
sanity_checks (cpp_reader *pfile)
{
  const size_t max_precision = 2 * CHAR_BIT * sizeof (cpp_num_part);
  cppchar_t probe = 0;

  /* Stepping below zero leaves a value of at least 1 only in an
     unsigned type.  */
  probe--;
  if (probe < 1)
    cpp_error (pfile, CPP_DL_ICE, "cppchar_t must be an unsigned type");

  if (CPP_OPTION (pfile, precision) > max_precision)
    cpp_error (pfile, CPP_DL_ICE,
               "preprocessor arithmetic has maximum precision of %lu bits;"
               " target requires %lu bits",
               (unsigned long) max_precision,
               (unsigned long) CPP_OPTION (pfile, precision));

  if (CPP_OPTION (pfile, precision) < CPP_OPTION (pfile, int_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP arithmetic must be at least as precise as a target int");

  if (CPP_OPTION (pfile, char_precision) < 8)
    cpp_error (pfile, CPP_DL_ICE, "target char is less than 8 bits wide");

  if (CPP_OPTION (pfile, wchar_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target wchar_t is narrower than target char");

  if (CPP_OPTION (pfile, int_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target int is narrower than target char");

  /* eval_token() assumes this; it could be fixed if necessary.  */
  if (sizeof (cppchar_t) > sizeof (cpp_num_part))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP half-integer narrower than CPP character");

  if (CPP_OPTION (pfile, wchar_precision) > BITS_PER_CPPCHAR_T)
    cpp_error (pfile, CPP_DL_ICE,
               "CPP on this host cannot handle wide character constants over"
               " %lu bits, but the target requires %lu bits",
               (unsigned long) BITS_PER_CPPCHAR_T,
               (unsigned long) CPP_OPTION (pfile, wchar_precision));
}
#else
# define sanity_checks(PFILE)
#endif
624 
625 /* This is called after options have been parsed, and partially
626    processed.  */
627 void
cpp_post_options(cpp_reader * pfile)628 cpp_post_options (cpp_reader *pfile)
629 {
630   int flags;
631 
632   sanity_checks (pfile);
633 
634   post_options (pfile);
635 
636   /* Mark named operators before handling command line macros.  */
637   flags = 0;
638   if (CPP_OPTION (pfile, cplusplus) && CPP_OPTION (pfile, operator_names))
639     flags |= NODE_OPERATOR;
640   if (CPP_OPTION (pfile, warn_cxx_operator_names))
641     flags |= NODE_DIAGNOSTIC | NODE_WARN_OPERATOR;
642   if (flags != 0)
643     mark_named_operators (pfile, flags);
644 }
645 
646 /* Setup for processing input from the file named FNAME, or stdin if
647    it is the empty string.  Return the original filename
648    on success (e.g. foo.i->foo.c), or NULL on failure.  */
649 const char *
cpp_read_main_file(cpp_reader * pfile,const char * fname)650 cpp_read_main_file (cpp_reader *pfile, const char *fname)
651 {
652   const source_location loc = 0;
653 
654   if (CPP_OPTION (pfile, deps.style) != DEPS_NONE)
655     {
656       if (!pfile->deps)
657 	pfile->deps = deps_init ();
658 
659       /* Set the default target (if there is none already).  */
660       deps_add_default_target (pfile->deps, fname);
661     }
662 
663   pfile->main_file
664     = _cpp_find_file (pfile, fname, &pfile->no_search_path, false, 0, false,
665 		      loc);
666   if (_cpp_find_failed (pfile->main_file))
667     return NULL;
668 
669   _cpp_stack_file (pfile, pfile->main_file, false, loc);
670 
671   /* For foo.i, read the original filename foo.c now, for the benefit
672      of the front ends.  */
673   if (CPP_OPTION (pfile, preprocessed))
674     {
675       read_original_filename (pfile);
676       fname =
677 	ORDINARY_MAP_FILE_NAME
678 	((LINEMAPS_LAST_ORDINARY_MAP (pfile->line_table)));
679     }
680   return fname;
681 }
682 
683 /* For preprocessed files, if the first tokens are of the form # NUM.
684    handle the directive so we know the original file name.  This will
685    generate file_change callbacks, which the front ends must handle
686    appropriately given their state of initialization.  */
687 static void
read_original_filename(cpp_reader * pfile)688 read_original_filename (cpp_reader *pfile)
689 {
690   const cpp_token *token, *token1;
691 
692   /* Lex ahead; if the first tokens are of the form # NUM, then
693      process the directive, otherwise back up.  */
694   token = _cpp_lex_direct (pfile);
695   if (token->type == CPP_HASH)
696     {
697       pfile->state.in_directive = 1;
698       token1 = _cpp_lex_direct (pfile);
699       _cpp_backup_tokens (pfile, 1);
700       pfile->state.in_directive = 0;
701 
702       /* If it's a #line directive, handle it.  */
703       if (token1->type == CPP_NUMBER
704 	  && _cpp_handle_directive (pfile, token->flags & PREV_WHITE))
705 	{
706 	  read_original_directory (pfile);
707 	  return;
708 	}
709     }
710 
711   /* Backup as if nothing happened.  */
712   _cpp_backup_tokens (pfile, 1);
713 }
714 
715 /* For preprocessed files, if the tokens following the first filename
716    line is of the form # <line> "/path/name//", handle the
717    directive so we know the original current directory.  */
718 static void
read_original_directory(cpp_reader * pfile)719 read_original_directory (cpp_reader *pfile)
720 {
721   const cpp_token *hash, *token;
722 
723   /* Lex ahead; if the first tokens are of the form # NUM, then
724      process the directive, otherwise back up.  */
725   hash = _cpp_lex_direct (pfile);
726   if (hash->type != CPP_HASH)
727     {
728       _cpp_backup_tokens (pfile, 1);
729       return;
730     }
731 
732   token = _cpp_lex_direct (pfile);
733 
734   if (token->type != CPP_NUMBER)
735     {
736       _cpp_backup_tokens (pfile, 2);
737       return;
738     }
739 
740   token = _cpp_lex_direct (pfile);
741 
742   if (token->type != CPP_STRING
743       || ! (token->val.str.len >= 5
744 	    && IS_DIR_SEPARATOR (token->val.str.text[token->val.str.len-2])
745 	    && IS_DIR_SEPARATOR (token->val.str.text[token->val.str.len-3])))
746     {
747       _cpp_backup_tokens (pfile, 3);
748       return;
749     }
750 
751   if (pfile->cb.dir_change)
752     {
753       char *debugdir = (char *) alloca (token->val.str.len - 3);
754 
755       memcpy (debugdir, (const char *) token->val.str.text + 1,
756 	      token->val.str.len - 4);
757       debugdir[token->val.str.len - 4] = '\0';
758 
759       pfile->cb.dir_change (pfile, debugdir);
760     }
761 }
762 
763 /* This is called at the end of preprocessing.  It pops the last
764    buffer and writes dependency output.
765 
766    Maybe it should also reset state, such that you could call
767    cpp_start_read with a new filename to restart processing.  */
768 void
cpp_finish(cpp_reader * pfile,FILE * deps_stream)769 cpp_finish (cpp_reader *pfile, FILE *deps_stream)
770 {
771   /* Warn about unused macros before popping the final buffer.  */
772   if (CPP_OPTION (pfile, warn_unused_macros))
773     cpp_forall_identifiers (pfile, _cpp_warn_if_unused_macro, NULL);
774 
775   /* lex.c leaves the final buffer on the stack.  This it so that
776      it returns an unending stream of CPP_EOFs to the client.  If we
777      popped the buffer, we'd dereference a NULL buffer pointer and
778      segfault.  It's nice to allow the client to do worry-free excess
779      cpp_get_token calls.  */
780   while (pfile->buffer)
781     _cpp_pop_buffer (pfile);
782 
783   if (CPP_OPTION (pfile, deps.style) != DEPS_NONE
784       && deps_stream)
785     {
786       deps_write (pfile->deps, deps_stream, 72);
787 
788       if (CPP_OPTION (pfile, deps.phony_targets))
789 	deps_phony_targets (pfile->deps, deps_stream);
790     }
791 
792   /* Report on headers that could use multiple include guards.  */
793   if (CPP_OPTION (pfile, print_include_names))
794     _cpp_report_missing_guards (pfile);
795 }
796 
797 static void
post_options(cpp_reader * pfile)798 post_options (cpp_reader *pfile)
799 {
800   /* -Wtraditional is not useful in C++ mode.  */
801   if (CPP_OPTION (pfile, cplusplus))
802     CPP_OPTION (pfile, cpp_warn_traditional) = 0;
803 
804   /* Permanently disable macro expansion if we are rescanning
805      preprocessed text.  Read preprocesed source in ISO mode.  */
806   if (CPP_OPTION (pfile, preprocessed))
807     {
808       if (!CPP_OPTION (pfile, directives_only))
809 	pfile->state.prevent_expansion = 1;
810       CPP_OPTION (pfile, traditional) = 0;
811     }
812 
813   if (CPP_OPTION (pfile, warn_trigraphs) == 2)
814     CPP_OPTION (pfile, warn_trigraphs) = !CPP_OPTION (pfile, trigraphs);
815 
816   if (CPP_OPTION (pfile, traditional))
817     {
818       CPP_OPTION (pfile, trigraphs) = 0;
819       CPP_OPTION (pfile, warn_trigraphs) = 0;
820     }
821 }
822