1 /* input_scrub.c - Break up input buffers into whole numbers of lines. 2 Copyright 1987, 1990, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 3 2000 4 Free Software Foundation, Inc. 5 6 This file is part of GAS, the GNU Assembler. 7 8 GAS is free software; you can redistribute it and/or modify 9 it under the terms of the GNU General Public License as published by 10 the Free Software Foundation; either version 2, or (at your option) 11 any later version. 12 13 GAS is distributed in the hope that it will be useful, 14 but WITHOUT ANY WARRANTY; without even the implied warranty of 15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 16 GNU General Public License for more details. 17 18 You should have received a copy of the GNU General Public License 19 along with GAS; see the file COPYING. If not, write to the Free 20 Software Foundation, 59 Temple Place - Suite 330, Boston, MA 21 02111-1307, USA. */ 22 23 #include <errno.h> /* Need this to make errno declaration right */ 24 #include "as.h" 25 #include "input-file.h" 26 #include "sb.h" 27 #include "listing.h" 28 29 /* 30 * O/S independent module to supply buffers of sanitised source code 31 * to rest of assembler. We get sanitised input data of arbitrary length. 32 * We break these buffers on line boundaries, recombine pieces that 33 * were broken across buffers, and return a buffer of full lines to 34 * the caller. 35 * The last partial line begins the next buffer we build and return to caller. 36 * The buffer returned to caller is preceded by BEFORE_STRING and followed 37 * by AFTER_STRING, as sentinels. The last character before AFTER_STRING 38 * is a newline. 39 * Also looks after line numbers, for e.g. error messages. 40 */ 41 42 /* 43 * We don't care how filthy our buffers are, but our callers assume 44 * that the following sanitation has already been done. 45 * 46 * No comments, reduce a comment to a space. 47 * Reduce a tab to a space unless it is 1st char of line. 48 * All multiple tabs and spaces collapsed into 1 char. Tab only 49 * legal if 1st char of line. 50 * # line file statements converted to .line x;.file y; statements. 51 * Escaped newlines at end of line: remove them but add as many newlines 52 * to end of statement as you removed in the middle, to synch line numbers. 53 */ 54 55 #define BEFORE_STRING ("\n") 56 #define AFTER_STRING ("\0") /* memcpy of 0 chars might choke. */ 57 #define BEFORE_SIZE (1) 58 #define AFTER_SIZE (1) 59 60 static char *buffer_start; /*->1st char of full buffer area. */ 61 static char *partial_where; /*->after last full line in buffer. */ 62 static int partial_size; /* >=0. Number of chars in partial line in buffer. */ 63 64 /* Because we need AFTER_STRING just after last full line, it clobbers 65 1st part of partial line. So we preserve 1st part of partial line 66 here. */ 67 static char save_source[AFTER_SIZE]; 68 69 /* What is the largest size buffer that input_file_give_next_buffer() 70 could return to us? */ 71 static unsigned int buffer_length; 72 73 /* The index into an sb structure we are reading from. -1 if none. */ 74 static int sb_index = -1; 75 76 /* If we are reading from an sb structure, this is it. */ 77 static sb from_sb; 78 79 /* Should we do a conditional check on from_sb? */ 80 static int from_sb_is_expansion = 1; 81 82 /* The number of nested sb structures we have included. */ 83 int macro_nest; 84 85 /* We can have more than one source file open at once, though the info for all 86 but the latest one are saved off in a struct input_save. These files remain 87 open, so we are limited by the number of open files allowed by the 88 underlying OS. We may also sequentially read more than one source file in an 89 assembly. */ 90 91 /* We must track the physical file and line number for error messages. We also 92 track a "logical" file and line number corresponding to (C?) compiler 93 source line numbers. Whenever we open a file we must fill in 94 physical_input_file. So if it is NULL we have not opened any files yet. */ 95 96 static char *physical_input_file; 97 static char *logical_input_file; 98 99 typedef unsigned int line_numberT; /* 1-origin line number in a source file. */ 100 /* A line ends in '\n' or eof. */ 101 102 static line_numberT physical_input_line; 103 static int logical_input_line; 104 105 /* Struct used to save the state of the input handler during include files */ 106 struct input_save { 107 char * buffer_start; 108 char * partial_where; 109 int partial_size; 110 char save_source[AFTER_SIZE]; 111 unsigned int buffer_length; 112 char * physical_input_file; 113 char * logical_input_file; 114 line_numberT physical_input_line; 115 int logical_input_line; 116 int sb_index; 117 sb from_sb; 118 int from_sb_is_expansion; /* Should we do a conditional check? */ 119 struct input_save * next_saved_file; /* Chain of input_saves. */ 120 char * input_file_save; /* Saved state of input routines. */ 121 char * saved_position; /* Caller's saved position in buf. */ 122 }; 123 124 static struct input_save *input_scrub_push (char *saved_position); 125 static char *input_scrub_pop (struct input_save *arg); 126 static void as_1_char (unsigned int c, FILE * stream); 127 128 /* Saved information about the file that .include'd this one. When we hit EOF, 129 we automatically pop to that file. */ 130 131 static struct input_save *next_saved_file; 132 133 /* Push the state of input reading and scrubbing so that we can #include. 134 The return value is a 'void *' (fudged for old compilers) to a save 135 area, which can be restored by passing it to input_scrub_pop(). */ 136 137 static struct input_save * 138 input_scrub_push (char *saved_position) 139 { 140 register struct input_save *saved; 141 142 saved = (struct input_save *) xmalloc (sizeof *saved); 143 144 saved->saved_position = saved_position; 145 saved->buffer_start = buffer_start; 146 saved->partial_where = partial_where; 147 saved->partial_size = partial_size; 148 saved->buffer_length = buffer_length; 149 saved->physical_input_file = physical_input_file; 150 saved->logical_input_file = logical_input_file; 151 saved->physical_input_line = physical_input_line; 152 saved->logical_input_line = logical_input_line; 153 saved->sb_index = sb_index; 154 saved->from_sb = from_sb; 155 saved->from_sb_is_expansion = from_sb_is_expansion; 156 memcpy (saved->save_source, save_source, sizeof (save_source)); 157 saved->next_saved_file = next_saved_file; 158 saved->input_file_save = input_file_push (); 159 160 input_file_begin (); /* Reinitialize! */ 161 logical_input_line = -1; 162 logical_input_file = (char *) NULL; 163 buffer_length = input_file_buffer_size (); 164 sb_index = -1; 165 166 buffer_start = xmalloc ((BEFORE_SIZE + buffer_length + buffer_length + AFTER_SIZE)); 167 memcpy (buffer_start, BEFORE_STRING, (int) BEFORE_SIZE); 168 169 return saved; 170 } 171 172 static char * 173 input_scrub_pop (struct input_save *saved) 174 { 175 char *saved_position; 176 177 input_scrub_end (); /* Finish off old buffer */ 178 179 input_file_pop (saved->input_file_save); 180 saved_position = saved->saved_position; 181 buffer_start = saved->buffer_start; 182 buffer_length = saved->buffer_length; 183 physical_input_file = saved->physical_input_file; 184 logical_input_file = saved->logical_input_file; 185 physical_input_line = saved->physical_input_line; 186 logical_input_line = saved->logical_input_line; 187 sb_index = saved->sb_index; 188 from_sb = saved->from_sb; 189 from_sb_is_expansion = saved->from_sb_is_expansion; 190 partial_where = saved->partial_where; 191 partial_size = saved->partial_size; 192 next_saved_file = saved->next_saved_file; 193 memcpy (save_source, saved->save_source, sizeof (save_source)); 194 195 free (saved); 196 return saved_position; 197 } 198 199 void 200 input_scrub_begin (void) 201 { 202 know (strlen (BEFORE_STRING) == BEFORE_SIZE); 203 know (strlen (AFTER_STRING) == AFTER_SIZE 204 || (AFTER_STRING[0] == '\0' && AFTER_SIZE == 1)); 205 206 input_file_begin (); 207 208 buffer_length = input_file_buffer_size (); 209 210 buffer_start = xmalloc ((BEFORE_SIZE + buffer_length + buffer_length + AFTER_SIZE)); 211 memcpy (buffer_start, BEFORE_STRING, (int) BEFORE_SIZE); 212 213 /* Line number things. */ 214 logical_input_line = -1; 215 logical_input_file = (char *) NULL; 216 physical_input_file = NULL; /* No file read yet. */ 217 next_saved_file = NULL; /* At EOF, don't pop to any other file */ 218 do_scrub_begin (flag_m68k_mri); 219 } 220 221 void 222 input_scrub_end (void) 223 { 224 if (buffer_start) 225 { 226 free (buffer_start); 227 buffer_start = 0; 228 input_file_end (); 229 } 230 } 231 232 /* Start reading input from a new file. 233 Return start of caller's part of buffer. */ 234 235 char * 236 input_scrub_new_file (char *filename) 237 { 238 input_file_open (filename, !flag_no_comments); 239 physical_input_file = filename[0] ? filename : _("{standard input}"); 240 physical_input_line = 0; 241 242 partial_size = 0; 243 return (buffer_start + BEFORE_SIZE); 244 } 245 246 /* Include a file from the current file. Save our state, cause it to 247 be restored on EOF, and begin handling a new file. Same result as 248 input_scrub_new_file. */ 249 250 char * 251 input_scrub_include_file (char *filename, char *position) 252 { 253 next_saved_file = input_scrub_push (position); 254 return input_scrub_new_file (filename); 255 } 256 257 /* Start getting input from an sb structure. This is used when 258 expanding a macro. */ 259 260 void 261 input_scrub_include_sb (sb *from, char *position, int is_expansion) 262 { 263 if (macro_nest > max_macro_nest) 264 as_fatal (_("macros nested too deeply")); 265 ++macro_nest; 266 267 #ifdef md_macro_start 268 if (is_expansion) 269 { 270 md_macro_start (); 271 } 272 #endif 273 274 next_saved_file = input_scrub_push (position); 275 276 sb_new (&from_sb); 277 from_sb_is_expansion = is_expansion; 278 if (from->len >= 1 && from->ptr[0] != '\n') 279 { 280 /* Add the sentinel required by read.c. */ 281 sb_add_char (&from_sb, '\n'); 282 } 283 sb_add_sb (&from_sb, from); 284 sb_index = 1; 285 286 /* These variables are reset by input_scrub_push. Restore them 287 since we are, after all, still at the same point in the file. */ 288 logical_input_line = next_saved_file->logical_input_line; 289 logical_input_file = next_saved_file->logical_input_file; 290 } 291 292 void 293 input_scrub_close (void) 294 { 295 input_file_close (); 296 } 297 298 char * 299 input_scrub_next_buffer (char **bufp) 300 { 301 register char *limit; /*->just after last char of buffer. */ 302 303 if (sb_index >= 0) 304 { 305 if (sb_index >= from_sb.len) 306 { 307 sb_kill (&from_sb); 308 if (from_sb_is_expansion 309 ) 310 { 311 cond_finish_check (macro_nest); 312 #ifdef md_macro_end 313 /* Allow the target to clean up per-macro expansion 314 data. */ 315 md_macro_end (); 316 #endif 317 } 318 --macro_nest; 319 partial_where = NULL; 320 if (next_saved_file != NULL) 321 *bufp = input_scrub_pop (next_saved_file); 322 return partial_where; 323 } 324 325 partial_where = from_sb.ptr + from_sb.len; 326 partial_size = 0; 327 *bufp = from_sb.ptr + sb_index; 328 sb_index = from_sb.len; 329 return partial_where; 330 } 331 332 *bufp = buffer_start + BEFORE_SIZE; 333 334 if (partial_size) 335 { 336 memmove (buffer_start + BEFORE_SIZE, partial_where, 337 (unsigned int) partial_size); 338 memcpy (buffer_start + BEFORE_SIZE, save_source, AFTER_SIZE); 339 } 340 limit = input_file_give_next_buffer (buffer_start 341 + BEFORE_SIZE 342 + partial_size); 343 if (limit) 344 { 345 register char *p; /* Find last newline. */ 346 347 for (p = limit - 1; *p != '\n'; --p) 348 ; 349 ++p; 350 351 while (p <= buffer_start + BEFORE_SIZE) 352 { 353 int limoff; 354 355 limoff = limit - buffer_start; 356 buffer_length += input_file_buffer_size (); 357 buffer_start = xrealloc (buffer_start, 358 (BEFORE_SIZE 359 + 2 * buffer_length 360 + AFTER_SIZE)); 361 *bufp = buffer_start + BEFORE_SIZE; 362 limit = input_file_give_next_buffer (buffer_start + limoff); 363 364 if (limit == NULL) 365 { 366 as_warn (_("partial line at end of file ignored")); 367 partial_where = NULL; 368 if (next_saved_file) 369 *bufp = input_scrub_pop (next_saved_file); 370 return NULL; 371 } 372 373 for (p = limit - 1; *p != '\n'; --p) 374 ; 375 ++p; 376 } 377 378 partial_where = p; 379 partial_size = limit - p; 380 memcpy (save_source, partial_where, (int) AFTER_SIZE); 381 memcpy (partial_where, AFTER_STRING, (int) AFTER_SIZE); 382 } 383 else 384 { 385 partial_where = 0; 386 if (partial_size > 0) 387 { 388 as_warn (_("partial line at end of file ignored")); 389 } 390 391 /* Tell the listing we've finished the file. */ 392 LISTING_EOF (); 393 394 /* If we should pop to another file at EOF, do it. */ 395 if (next_saved_file) 396 { 397 *bufp = input_scrub_pop (next_saved_file); /* Pop state */ 398 /* partial_where is now correct to return, since we popped it. */ 399 } 400 } 401 return (partial_where); 402 } 403 404 /* The remaining part of this file deals with line numbers, error 405 messages and so on. Return TRUE if we opened any file. */ 406 407 int 408 seen_at_least_1_file (void) 409 { 410 return (physical_input_file != NULL); 411 } 412 413 void 414 bump_line_counters (void) 415 { 416 if (sb_index < 0) 417 { 418 ++physical_input_line; 419 if (logical_input_line >= 0) 420 ++logical_input_line; 421 } 422 } 423 424 /* Tells us what the new logical line number and file are. 425 If the line_number is -1, we don't change the current logical line 426 number. If it is -2, we decrement the logical line number (this is 427 to support the .appfile pseudo-op inserted into the stream by 428 do_scrub_chars). 429 If the fname is NULL, we don't change the current logical file name. 430 Returns nonzero if the filename actually changes. */ 431 432 int 433 new_logical_line (char *fname, /* DON'T destroy it! We point to it! */ 434 int line_number) 435 { 436 if (line_number >= 0) 437 logical_input_line = line_number; 438 else if (line_number == -2 && logical_input_line > 0) 439 --logical_input_line; 440 441 if (fname 442 && (logical_input_file == NULL 443 || strcmp (logical_input_file, fname))) 444 { 445 logical_input_file = fname; 446 return 1; 447 } 448 else 449 return 0; 450 } 451 452 /* Return the current file name and line number. 453 namep should be char * const *, but there are compilers which screw 454 up declarations like that, and it's easier to avoid it. */ 455 456 void 457 as_where (char **namep, unsigned int *linep) 458 { 459 if (logical_input_file != NULL 460 && (linep == NULL || logical_input_line >= 0)) 461 { 462 *namep = logical_input_file; 463 if (linep != NULL) 464 *linep = logical_input_line; 465 } 466 else if (physical_input_file != NULL) 467 { 468 *namep = physical_input_file; 469 if (linep != NULL) 470 *linep = physical_input_line; 471 } 472 else 473 { 474 *namep = 0; 475 if (linep != NULL) 476 *linep = 0; 477 } 478 } 479 480 /* Output to given stream how much of line we have scanned so far. 481 Assumes we have scanned up to and including input_line_pointer. 482 No free '\n' at end of line. */ 483 484 void 485 as_howmuch (FILE *stream /* Opened for write please. */) 486 { 487 register char *p; /* Scan input line. */ 488 489 for (p = input_line_pointer - 1; *p != '\n'; --p) 490 { 491 } 492 ++p; /* p->1st char of line. */ 493 for (; p <= input_line_pointer; p++) 494 { 495 /* Assume ASCII. EBCDIC & other micro-computer char sets ignored. */ 496 as_1_char ((unsigned char) *p, stream); 497 } 498 } 499 500 static void 501 as_1_char (unsigned int c, FILE *stream) 502 { 503 if (c > 127) 504 { 505 (void) putc ('%', stream); 506 c -= 128; 507 } 508 if (c < 32) 509 { 510 (void) putc ('^', stream); 511 c += '@'; 512 } 513 (void) putc (c, stream); 514 } 515