Coverage Report

Created: 2025-07-08 11:15

/src/binutils-gdb/gas/input-scrub.c
Line
Count
Source (jump to first uncovered line)
1
/* input_scrub.c - Break up input buffers into whole numbers of lines.
2
   Copyright (C) 1987-2025 Free Software Foundation, Inc.
3
4
   This file is part of GAS, the GNU Assembler.
5
6
   GAS is free software; you can redistribute it and/or modify
7
   it under the terms of the GNU General Public License as published by
8
   the Free Software Foundation; either version 3, or (at your option)
9
   any later version.
10
11
   GAS is distributed in the hope that it will be useful,
12
   but WITHOUT ANY WARRANTY; without even the implied warranty of
13
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14
   GNU General Public License for more details.
15
16
   You should have received a copy of the GNU General Public License
17
   along with GAS; see the file COPYING.  If not, write to the Free
18
   Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19
   02110-1301, USA.  */
20
21
#include "as.h"
22
#include "filenames.h"
23
#include "input-file.h"
24
#include "sb.h"
25
#include "listing.h"
26
27
/*
28
 * O/S independent module to supply buffers of sanitised source code
29
 * to rest of assembler.  We get sanitised input data of arbitrary length.
30
 * We break these buffers on line boundaries, recombine pieces that
31
 * were broken across buffers, and return a buffer of full lines to
32
 * the caller.
33
 * The last partial line begins the next buffer we build and return to caller.
34
 * The buffer returned to caller is preceded by BEFORE_STRING and followed
35
 * by AFTER_STRING, as sentinels. The last character before AFTER_STRING
36
 * is a newline.
37
 * Also looks after line numbers, for e.g. error messages.
38
 */
39
40
/*
41
 * We don't care how filthy our buffers are, but our callers assume
42
 * that the following sanitation has already been done.
43
 *
44
 * No comments, reduce a comment to a space.
45
 * Reduce a tab to a space unless it is 1st char of line.
46
 * All multiple tabs and spaces collapsed into 1 char. Tab only
47
 *   legal if 1st char of line.
48
 * # line file statements converted to .line x;.file y; statements.
49
 * Escaped newlines at end of line: remove them but add as many newlines
50
 *   to end of statement as you removed in the middle, to synch line numbers.
51
 */
52

53
0
#define BEFORE_STRING ("\n")
54
0
#define AFTER_STRING ("\0")  /* memcpy of 0 chars might choke.  */
55
0
#define BEFORE_SIZE (1)
56
0
#define AFTER_SIZE  (1)
57
58
#ifndef TC_EOL_IN_INSN
59
0
#define TC_EOL_IN_INSN(P) 0
60
#endif
61
62
static char *buffer_start;  /*->1st char of full buffer area.  */
63
static char *partial_where; /*->after last full line in buffer.  */
64
static size_t partial_size; /* >=0. Number of chars in partial line in buffer.  */
65
66
/* Because we need AFTER_STRING just after last full line, it clobbers
67
   1st part of partial line. So we preserve 1st part of partial line
68
   here.  */
69
static char save_source[AFTER_SIZE];
70
71
/* The size of the input buffer we concatenate
72
   input_file_give_next_buffer chunks into.  Excludes the BEFORE and
73
   AFTER counts.  */
74
static size_t buffer_length;
75
76
/* The index into an sb structure we are reading from.  -1 if none.  */
77
static size_t sb_index = -1;
78
79
/* If we are reading from an sb structure, this is it.  */
80
static sb from_sb;
81
82
/* Should we do a conditional check on from_sb? */
83
static enum expansion from_sb_expansion = expanding_none;
84
85
/* The number of nested sb structures we have included.  */
86
int macro_nest;
87
88
/* We can have more than one source file open at once, though the info for all
89
   but the latest one are saved off in a struct input_save.  These files remain
90
   open, so we are limited by the number of open files allowed by the
91
   underlying OS. We may also sequentially read more than one source file in an
92
   assembly.  */
93
94
/* We must track the physical file and line number for error messages. We also
95
   track a "logical" file and line number corresponding to (C?)  compiler
96
   source line numbers.  Whenever we open a file we must fill in
97
   physical_input_file. So if it is NULL we have not opened any files yet.  */
98
99
static const char *physical_input_file;
100
static const char *logical_input_file;
101
102
/* 1-origin line number in a source file.  */
103
/* A line ends in '\n' or eof.  */
104
static unsigned int physical_input_line;
105
static unsigned int logical_input_line;
106
107
/* Indicator whether the origin of an update was a .linefile directive. */
108
static bool is_linefile;
109
110
/* Struct used to save the state of the input handler during include files */
111
struct input_save {
112
  char *              buffer_start;
113
  char *              partial_where;
114
  size_t              partial_size;
115
  char                save_source[AFTER_SIZE];
116
  size_t              buffer_length;
117
  const char *        physical_input_file;
118
  const char *        logical_input_file;
119
  unsigned int        physical_input_line;
120
  unsigned int        logical_input_line;
121
  bool                is_linefile;
122
  size_t              sb_index;
123
  sb                  from_sb;
124
  enum expansion      from_sb_expansion; /* Should we do a conditional check?  */
125
  struct input_save * next_saved_file;  /* Chain of input_saves.  */
126
  char *              input_file_save;  /* Saved state of input routines.  */
127
  char *              saved_position; /* Caller's saved position in buf.  */
128
};
129
130
static struct input_save *input_scrub_push (char *saved_position);
131
static char *input_scrub_pop (struct input_save *arg);
132
133
/* Saved information about the file that .include'd this one.  When we hit EOF,
134
   we automatically pop to that file.  */
135
136
static struct input_save *next_saved_file;
137
138
/* Initialize input buffering.  */
139
140
static void
141
input_scrub_reinit (void)
142
0
{
143
0
  input_file_begin ();    /* Reinitialize! */
144
0
  logical_input_line = -1u;
145
0
  logical_input_file = NULL;
146
0
  sb_index = -1;
147
148
0
  buffer_length = input_file_buffer_size () * 2;
149
0
  buffer_start = XNEWVEC (char, BEFORE_SIZE + AFTER_SIZE + 1 + buffer_length);
150
0
  memcpy (buffer_start, BEFORE_STRING, (int) BEFORE_SIZE);
151
0
}
152
153
/* Finish off old buffers.  */
154
155
static void
156
input_scrub_free (void)
157
0
{
158
0
  if (sb_index != (size_t) -1)
159
0
    {
160
0
      sb_kill (&from_sb);
161
0
      sb_index = -1;
162
0
    }
163
0
  free (buffer_start);
164
0
  buffer_start = NULL;
165
0
  input_file_end ();
166
0
}
167
168
/* Push the state of input reading and scrubbing so that we can #include.
169
   The return value is a 'void *' (fudged for old compilers) to a save
170
   area, which can be restored by passing it to input_scrub_pop().  */
171
172
static struct input_save *
173
input_scrub_push (char *saved_position)
174
0
{
175
0
  struct input_save *saved;
176
177
0
  saved = XNEW (struct input_save);
178
179
0
  saved->saved_position = saved_position;
180
0
  saved->buffer_start = buffer_start;
181
0
  saved->partial_where = partial_where;
182
0
  saved->partial_size = partial_size;
183
0
  saved->buffer_length = buffer_length;
184
0
  saved->physical_input_file = physical_input_file;
185
0
  saved->logical_input_file = logical_input_file;
186
0
  saved->physical_input_line = physical_input_line;
187
0
  saved->logical_input_line = logical_input_line;
188
0
  saved->is_linefile = is_linefile;
189
0
  saved->sb_index = sb_index;
190
0
  saved->from_sb = from_sb;
191
0
  saved->from_sb_expansion = from_sb_expansion;
192
0
  memcpy (saved->save_source, save_source, sizeof (save_source));
193
0
  saved->next_saved_file = next_saved_file;
194
0
  saved->input_file_save = input_file_push ();
195
196
0
  input_scrub_reinit ();
197
198
0
  return saved;
199
0
}
200
201
static char *
202
input_scrub_pop (struct input_save *saved)
203
0
{
204
0
  char *saved_position;
205
206
0
  input_scrub_free ();
207
208
0
  input_file_pop (saved->input_file_save);
209
0
  saved_position = saved->saved_position;
210
0
  buffer_start = saved->buffer_start;
211
0
  buffer_length = saved->buffer_length;
212
213
  /* When expanding an #APP / #NO_APP block, original lines are re-
214
     processed, so whatever they did to physical file/line needs
215
     retaining.  If logical file/line weren't changed, the logical
216
     line number will want bumping by a corresponding value.  */
217
0
  if (from_sb_expansion != expanding_app)
218
0
    {
219
0
      if (logical_input_file == 0 && logical_input_line == -1u
220
0
    && saved->logical_input_line != -1u)
221
0
  saved->logical_input_line
222
0
    += physical_input_line - saved->physical_input_line;
223
0
      physical_input_file = saved->physical_input_file;
224
0
      physical_input_line = saved->physical_input_line;
225
0
    }
226
0
  logical_input_file = saved->logical_input_file;
227
0
  logical_input_line = saved->logical_input_line;
228
229
0
  is_linefile = saved->is_linefile;
230
0
  sb_index = saved->sb_index;
231
0
  from_sb = saved->from_sb;
232
0
  from_sb_expansion = saved->from_sb_expansion;
233
0
  partial_where = saved->partial_where;
234
0
  partial_size = saved->partial_size;
235
0
  next_saved_file = saved->next_saved_file;
236
0
  memcpy (save_source, saved->save_source, sizeof (save_source));
237
238
0
  free (saved);
239
0
  return saved_position;
240
0
}
241

242
void
243
input_scrub_begin (void)
244
0
{
245
0
  know (strlen (BEFORE_STRING) == BEFORE_SIZE);
246
0
  know (strlen (AFTER_STRING) == AFTER_SIZE
247
0
  || (AFTER_STRING[0] == '\0' && AFTER_SIZE == 1));
248
249
0
  physical_input_file = NULL; /* No file read yet.  */
250
0
  next_saved_file = NULL; /* At EOF, don't pop to any other file */
251
0
  macro_nest = 0;
252
0
  input_scrub_reinit ();
253
0
  do_scrub_begin (flag_m68k_mri);
254
0
}
255
256
void
257
input_scrub_end (void)
258
0
{
259
0
  while (next_saved_file != NULL)
260
0
    input_scrub_pop (next_saved_file);
261
0
  input_scrub_free ();
262
0
}
263
264
/* Start reading input from a new file.
265
   Return start of caller's part of buffer.  */
266
267
char *
268
input_scrub_new_file (const char *filename)
269
0
{
270
0
  input_file_open (filename, !flag_no_comments);
271
0
  physical_input_file = filename[0] ? filename : _("{standard input}");
272
0
  physical_input_line = 0;
273
274
0
  partial_size = 0;
275
0
  return (buffer_start + BEFORE_SIZE);
276
0
}
277
278
/* Include a file from the current file.  Save our state, cause it to
279
   be restored on EOF, and begin handling a new file.  Same result as
280
   input_scrub_new_file.  */
281
282
char *
283
input_scrub_include_file (const char *filename, char *position)
284
0
{
285
0
  next_saved_file = input_scrub_push (position);
286
0
  from_sb_expansion = expanding_none;
287
0
  return input_scrub_new_file (filename);
288
0
}
289
290
/* Start getting input from an sb structure.  This is used when
291
   expanding a macro.  */
292
293
void
294
input_scrub_include_sb (sb *from, char *position, enum expansion expansion)
295
0
{
296
0
  int newline;
297
298
0
  if (expansion != expanding_app)
299
0
    {
300
0
      if (macro_nest > max_macro_nest)
301
0
  as_fatal (_("macros nested too deeply"));
302
0
      ++macro_nest;
303
0
    }
304
305
#ifdef md_macro_start
306
  if (expansion == expanding_macro)
307
    {
308
      md_macro_start ();
309
    }
310
#endif
311
312
0
  next_saved_file = input_scrub_push (position);
313
314
  /* Allocate sufficient space: from->len plus optional newline
315
     plus two ".linefile " directives, plus a little more for other
316
     expansion.  */
317
0
  newline = from->len >= 1 && from->ptr[0] != '\n';
318
0
  sb_build (&from_sb, from->len + newline + 2 * sizeof (".linefile") + 30);
319
0
  from_sb_expansion = expansion;
320
0
  if (newline)
321
0
    {
322
      /* Add the sentinel required by read.c.  */
323
0
      sb_add_char (&from_sb, '\n');
324
0
    }
325
0
  sb_scrub_and_add_sb (&from_sb, from);
326
327
  /* Make sure the parser looks at defined contents when it scans for
328
     e.g. end-of-line at the end of a macro.  */
329
0
  sb_terminate (&from_sb);
330
331
0
  sb_index = 1;
332
333
  /* These variables are reset by input_scrub_push.  Restore them
334
     since we are, after all, still at the same point in the file.  */
335
0
  logical_input_line = next_saved_file->logical_input_line;
336
0
  logical_input_file = next_saved_file->logical_input_file;
337
0
}
338
339
void
340
input_scrub_close (void)
341
0
{
342
0
  input_file_close ();
343
0
  physical_input_line = 0;
344
0
  logical_input_line = -1u;
345
0
}
346
347
char *
348
input_scrub_next_buffer (char **bufp)
349
0
{
350
0
  char *limit;    /*->just after last char of buffer.  */
351
352
0
  if (sb_index != (size_t) -1)
353
0
    {
354
0
      if (sb_index >= from_sb.len)
355
0
  {
356
0
    if (from_sb_expansion == expanding_macro)
357
0
      {
358
0
        cond_finish_check (macro_nest);
359
#ifdef md_macro_end
360
        /* Allow the target to clean up per-macro expansion
361
           data.  */
362
        md_macro_end ();
363
#endif
364
0
      }
365
0
    if (from_sb_expansion != expanding_app)
366
0
      --macro_nest;
367
0
    partial_where = NULL;
368
0
    partial_size = 0;
369
0
    if (next_saved_file != NULL)
370
0
      *bufp = input_scrub_pop (next_saved_file);
371
0
    return partial_where;
372
0
  }
373
374
0
      partial_where = from_sb.ptr + from_sb.len;
375
0
      partial_size = 0;
376
0
      *bufp = from_sb.ptr + sb_index;
377
0
      sb_index = from_sb.len;
378
0
      return partial_where;
379
0
    }
380
381
0
  if (partial_size)
382
0
    {
383
0
      memmove (buffer_start + BEFORE_SIZE, partial_where, partial_size);
384
0
      memcpy (buffer_start + BEFORE_SIZE, save_source, AFTER_SIZE);
385
0
    }
386
387
0
  while (1)
388
0
    {
389
0
      char *p;
390
0
      char *start = buffer_start + BEFORE_SIZE + partial_size;
391
392
0
      *bufp = buffer_start + BEFORE_SIZE;
393
0
      limit = input_file_give_next_buffer (start);
394
0
      if (!limit)
395
0
  {
396
0
    if (!partial_size)
397
      /* End of this file.  */
398
0
      break;
399
400
0
    as_warn (_("end of file not at end of a line; newline inserted"));
401
0
    p = buffer_start + BEFORE_SIZE + partial_size;
402
0
    *p++ = '\n';
403
0
    limit = p;
404
0
  }
405
0
      else
406
0
  {
407
    /* Terminate the buffer to avoid confusing TC_EOL_IN_INSN.  */
408
0
    *limit = '\0';
409
410
    /* Find last newline.  */
411
0
    for (p = limit - 1; *p != '\n' || TC_EOL_IN_INSN (p); --p)
412
0
      if (p < start)
413
0
        goto read_more;
414
0
    ++p;
415
0
  }
416
417
      /* We found a newline in the newly read chars.  */
418
0
      partial_where = p;
419
0
      partial_size = limit - p;
420
421
      /* Save the fragment after that last newline.  */
422
0
      memcpy (save_source, partial_where, (int) AFTER_SIZE);
423
0
      memcpy (partial_where, AFTER_STRING, (int) AFTER_SIZE);
424
0
      return partial_where;
425
426
0
    read_more:
427
      /* Didn't find a newline.  Read more text.  */
428
0
      partial_size = limit - (buffer_start + BEFORE_SIZE);
429
0
      if (buffer_length - input_file_buffer_size () < partial_size)
430
0
  {
431
    /* Increase the buffer when it doesn't have room for the
432
       next block of input.  */
433
0
    buffer_length *= 2;
434
0
    buffer_start = XRESIZEVEC (char, buffer_start,
435
0
             (buffer_length
436
0
              + BEFORE_SIZE + AFTER_SIZE + 1));
437
0
  }
438
0
    }
439
440
  /* Tell the listing we've finished the file.  */
441
0
  LISTING_EOF ();
442
443
  /* If we should pop to another file at EOF, do it.  */
444
0
  partial_where = NULL;
445
0
  if (next_saved_file)
446
0
    *bufp = input_scrub_pop (next_saved_file);
447
448
0
  return partial_where;
449
0
}
450

451
/* The remaining part of this file deals with line numbers, error
452
   messages and so on.  Return TRUE if we opened any file.  */
453
454
int
455
seen_at_least_1_file (void)
456
0
{
457
0
  return (physical_input_file != NULL);
458
0
}
459
460
void
461
bump_line_counters (void)
462
0
{
463
0
  if (sb_index == (size_t) -1 || from_sb_expansion == expanding_app)
464
0
    ++physical_input_line;
465
466
0
  if (logical_input_line != -1u)
467
0
    ++logical_input_line;
468
0
}
469

470
/* Tells us what the new logical line number and file are.
471
   If the line_number is -1, we don't change the current logical line
472
   number.
473
   If fname is NULL, we don't change the current logical file name, unless
474
   bit 3 of flags is set.
475
   Returns nonzero if the filename actually changes.  */
476
477
void
478
new_logical_line_flags (const char *fname, /* DON'T destroy it!  We point to it!  */
479
      int line_number,
480
      int flags)
481
0
{
482
0
  switch (flags)
483
0
    {
484
0
    case 0:
485
0
      break;
486
0
    case 1:
487
0
      if (line_number != -1)
488
0
  abort ();
489
0
      break;
490
0
    case 1 << 1:
491
0
    case 1 << 2:
492
      /* FIXME: we could check that include nesting is correct.  */
493
0
      break;
494
0
    case 1 << 3:
495
0
      if (line_number < 0 || fname != NULL)
496
0
  abort ();
497
0
      if (next_saved_file == NULL)
498
0
  fname = physical_input_file;
499
0
      else if (next_saved_file->logical_input_file)
500
0
  fname = next_saved_file->logical_input_file;
501
0
      else
502
0
  fname = next_saved_file->physical_input_file;
503
0
      break;
504
0
    default:
505
0
      abort ();
506
0
    }
507
508
0
  is_linefile = flags != 1 && (flags != 0 || fname);
509
510
0
  if (line_number >= 0)
511
0
    logical_input_line = line_number;
512
0
  else if (line_number == -1 && fname && !*fname && (flags & (1 << 2)))
513
0
    {
514
0
      logical_input_file = physical_input_file;
515
0
      logical_input_line = physical_input_line;
516
0
      fname = NULL;
517
0
    }
518
519
0
  if (fname
520
0
      && (logical_input_file == NULL
521
0
    || filename_cmp (logical_input_file, fname)))
522
0
    logical_input_file = fname;
523
0
}
524
525
void
526
new_logical_line (const char *fname, int line_number)
527
0
{
528
0
  new_logical_line_flags (fname, line_number, 0);
529
0
}
530
531
void
532
as_report_context (void)
533
0
{
534
0
  const struct input_save *saved = next_saved_file;
535
0
  enum expansion expansion = from_sb_expansion;
536
0
  int indent = 1;
537
538
0
  if (!macro_nest)
539
0
    return;
540
541
0
  do
542
0
    {
543
0
      if (expansion != expanding_macro)
544
0
  /* Nothing.  */;
545
0
      else if (saved->logical_input_file != NULL
546
0
         && saved->logical_input_line != -1u)
547
0
  as_info_where (saved->logical_input_file, saved->logical_input_line,
548
0
           indent, _("macro invoked from here"));
549
0
      else
550
0
  as_info_where (saved->physical_input_file, saved->physical_input_line,
551
0
           indent, _("macro invoked from here"));
552
553
0
      expansion = saved->from_sb_expansion;
554
0
      ++indent;
555
0
    }
556
0
  while ((saved = saved->next_saved_file) != NULL);
557
0
}
558

559
/* Return the current physical input file name and line number, if known  */
560
561
const char *
562
as_where_physical (unsigned int *linep)
563
0
{
564
0
  if (physical_input_file != NULL)
565
0
    {
566
0
      if (linep != NULL)
567
0
  *linep = physical_input_line;
568
0
      return physical_input_file;
569
0
    }
570
571
0
  if (linep != NULL)
572
0
    *linep = 0;
573
0
  return NULL;
574
0
}
575
576
/* Return the file name and line number at the top most macro
577
   invocation, unless .file / .line were used inside a macro.  */
578
579
const char *
580
as_where (unsigned int *linep)
581
0
{
582
0
  const char *file = as_where_top (linep);
583
584
0
  if (macro_nest && is_linefile)
585
0
    {
586
0
      const struct input_save *saved = next_saved_file;
587
0
      enum expansion expansion = from_sb_expansion;
588
589
0
      do
590
0
  {
591
0
    if (expansion != expanding_macro)
592
0
      /* Nothing.  */;
593
0
    else if (saved->logical_input_file != NULL
594
0
       && (linep == NULL || saved->logical_input_line != -1u))
595
0
      {
596
0
        if (linep != NULL)
597
0
    *linep = saved->logical_input_line;
598
0
        file = saved->logical_input_file;
599
0
      }
600
0
    else if (saved->physical_input_file != NULL)
601
0
      {
602
0
        if (linep != NULL)
603
0
    *linep = saved->physical_input_line;
604
0
        file = saved->physical_input_file;
605
0
      }
606
607
0
    expansion = saved->from_sb_expansion;
608
0
  }
609
0
      while ((saved = saved->next_saved_file) != NULL);
610
0
    }
611
612
0
  return file;
613
0
}
614
615
/* Return the current file name and line number.  */
616
617
const char *
618
as_where_top (unsigned int *linep)
619
0
{
620
0
  if (logical_input_file != NULL
621
0
      && (linep == NULL || logical_input_line != -1u))
622
0
    {
623
0
      if (linep != NULL)
624
0
  *linep = logical_input_line;
625
0
      return logical_input_file;
626
0
    }
627
628
0
  return as_where_physical (linep);
629
0
}