]> git.ipfire.org Git - thirdparty/gcc.git/blame - gcc/fortran/scanner.c
tm.texi (MALLOC_ABI_ALIGNMENT): New macro.
[thirdparty/gcc.git] / gcc / fortran / scanner.c
CommitLineData
6de9cd9a 1/* Character scanner.
835aac92 2 Copyright (C) 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008
ec378180 3 Free Software Foundation, Inc.
6de9cd9a
DN
4 Contributed by Andy Vaught
5
9fc4d79b 6This file is part of GCC.
6de9cd9a 7
9fc4d79b
TS
8GCC is free software; you can redistribute it and/or modify it under
9the terms of the GNU General Public License as published by the Free
d234d788 10Software Foundation; either version 3, or (at your option) any later
9fc4d79b 11version.
6de9cd9a 12
9fc4d79b
TS
13GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14WARRANTY; without even the implied warranty of MERCHANTABILITY or
15FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16for more details.
6de9cd9a
DN
17
18You should have received a copy of the GNU General Public License
d234d788
NC
19along with GCC; see the file COPYING3. If not see
20<http://www.gnu.org/licenses/>. */
6de9cd9a
DN
21
22/* Set of subroutines to (ultimately) return the next character to the
23 various matching subroutines. This file's job is to read files and
24 build up lines that are parsed by the parser. This means that we
25 handle continuation lines and "include" lines.
26
27 The first thing the scanner does is to load an entire file into
28 memory. We load the entire file into memory for a couple reasons.
29 The first is that we want to be able to deal with nonseekable input
30 (pipes, stdin) and there is a lot of backing up involved during
31 parsing.
32
33 The second is that we want to be able to print the locus of errors,
34 and an error on line 999999 could conflict with something on line
35 one. Given nonseekable input, we've got to store the whole thing.
36
37 One thing that helps are the column truncation limits that give us
38 an upper bound on the size of individual lines. We don't store the
39 truncated stuff.
40
41 From the scanner's viewpoint, the higher level subroutines ask for
42 new characters and do a lot of jumping backwards. */
43
44#include "config.h"
d22e4895 45#include "system.h"
6de9cd9a 46#include "gfortran.h"
2d7c7df6 47#include "toplev.h"
9e8a6720
FXC
48#include "debug.h"
49#include "flags.h"
670637ee 50#include "cpp.h"
6de9cd9a
DN
51
52/* Structure for holding module and include file search path. */
typedef struct gfc_directorylist
{
  /* Directory name; add_path_to_list stores it with a trailing '/'.  */
  char *path;

  /* When false, open_included_file skips this entry for module lookups.  */
  bool use_for_modules;

  /* Following entry in the list, or NULL for the last one.  */
  struct gfc_directorylist *next;
} gfc_directorylist;
60
61/* List of include file search directories. */
31198773 62static gfc_directorylist *include_dirs, *intrinsic_modules_dirs;
6de9cd9a 63
d4fa05b9 64static gfc_file *file_head, *current_file;
6de9cd9a 65
6c7a4dfd 66static int continue_flag, end_flag, openmp_flag;
5a06474c 67static int continue_count, continue_line;
6c7a4dfd 68static locus openmp_locus;
6de9cd9a 69
d4fa05b9
TS
70gfc_source_form gfc_current_form;
71static gfc_linebuf *line_head, *line_tail;
72
63645982 73locus gfc_current_locus;
e0bcf78c 74const char *gfc_source_file;
2d7c7df6 75static FILE *gfc_src_file;
8fc541d3 76static gfc_char_t *gfc_src_preprocessor_lines[2];
2d7c7df6 77
5a06474c 78extern int pedantic;
6de9cd9a 79
1b271c9b
JJ
80static struct gfc_file_change
81{
82 const char *filename;
83 gfc_linebuf *lb;
84 int line;
85} *file_changes;
86size_t file_changes_cur, file_changes_count;
87size_t file_changes_allocated;
88
8fc541d3
FXC
89
90/* Functions dealing with our wide characters (gfc_char_t) and
91 sequences of such characters. */
92
93int
94gfc_wide_fits_in_byte (gfc_char_t c)
95{
96 return (c <= UCHAR_MAX);
97}
98
99static inline int
100wide_is_ascii (gfc_char_t c)
101{
102 return (gfc_wide_fits_in_byte (c) && ((unsigned char) c & ~0x7f) == 0);
103}
104
105int
106gfc_wide_is_printable (gfc_char_t c)
107{
108 return (gfc_wide_fits_in_byte (c) && ISPRINT ((unsigned char) c));
109}
110
111gfc_char_t
112gfc_wide_tolower (gfc_char_t c)
113{
114 return (wide_is_ascii (c) ? (gfc_char_t) TOLOWER((unsigned char) c) : c);
115}
116
00660189
FXC
117gfc_char_t
118gfc_wide_toupper (gfc_char_t c)
119{
120 return (wide_is_ascii (c) ? (gfc_char_t) TOUPPER((unsigned char) c) : c);
121}
122
8fc541d3
FXC
123int
124gfc_wide_is_digit (gfc_char_t c)
125{
126 return (c >= '0' && c <= '9');
127}
128
129static inline int
130wide_atoi (gfc_char_t *c)
131{
132#define MAX_DIGITS 20
133 char buf[MAX_DIGITS+1];
134 int i = 0;
135
136 while (gfc_wide_is_digit(*c) && i < MAX_DIGITS)
137 buf[i++] = *c++;
138 buf[i] = '\0';
139 return atoi (buf);
140}
141
142size_t
143gfc_wide_strlen (const gfc_char_t *str)
144{
145 size_t i;
146
147 for (i = 0; str[i]; i++)
148 ;
149
150 return i;
151}
152
00660189
FXC
153gfc_char_t *
154gfc_wide_memset (gfc_char_t *b, gfc_char_t c, size_t len)
155{
156 size_t i;
157
158 for (i = 0; i < len; i++)
159 b[i] = c;
160
161 return b;
162}
163
8fc541d3
FXC
164static gfc_char_t *
165wide_strcpy (gfc_char_t *dest, const gfc_char_t *src)
166{
167 gfc_char_t *d;
168
169 for (d = dest; (*d = *src) != '\0'; ++src, ++d)
170 ;
171
172 return dest;
173}
174
175static gfc_char_t *
00660189 176wide_strchr (const gfc_char_t *s, gfc_char_t c)
8fc541d3
FXC
177{
178 do {
179 if (*s == c)
180 {
00660189 181 return CONST_CAST(gfc_char_t *, s);
8fc541d3
FXC
182 }
183 } while (*s++);
184 return 0;
185}
186
00660189
FXC
187char *
188gfc_widechar_to_char (const gfc_char_t *s, int length)
189{
190 size_t len, i;
191 char *res;
192
193 if (s == NULL)
194 return NULL;
195
196 /* Passing a negative length is used to indicate that length should be
197 calculated using gfc_wide_strlen(). */
198 len = (length >= 0 ? (size_t) length : gfc_wide_strlen (s));
ece3f663 199 res = XNEWVEC (char, len + 1);
00660189
FXC
200
201 for (i = 0; i < len; i++)
202 {
203 gcc_assert (gfc_wide_fits_in_byte (s[i]));
204 res[i] = (unsigned char) s[i];
205 }
206
207 res[len] = '\0';
208 return res;
209}
210
211gfc_char_t *
212gfc_char_to_widechar (const char *s)
8fc541d3 213{
00660189
FXC
214 size_t len, i;
215 gfc_char_t *res;
216
217 if (s == NULL)
218 return NULL;
219
220 len = strlen (s);
221 res = gfc_get_wide_string (len + 1);
8fc541d3
FXC
222
223 for (i = 0; i < len; i++)
00660189 224 res[i] = (unsigned char) s[i];
8fc541d3
FXC
225
226 res[len] = '\0';
227 return res;
228}
229
230static int
231wide_strncmp (const gfc_char_t *s1, const char *s2, size_t n)
232{
233 gfc_char_t c1, c2;
234
235 while (n-- > 0)
236 {
237 c1 = *s1++;
238 c2 = *s2++;
239 if (c1 != c2)
240 return (c1 > c2 ? 1 : -1);
241 if (c1 == '\0')
242 return 0;
243 }
244 return 0;
245}
246
00660189
FXC
247int
248gfc_wide_strncasecmp (const gfc_char_t *s1, const char *s2, size_t n)
8fc541d3
FXC
249{
250 gfc_char_t c1, c2;
251
252 while (n-- > 0)
253 {
254 c1 = gfc_wide_tolower (*s1++);
255 c2 = TOLOWER (*s2++);
256 if (c1 != c2)
257 return (c1 > c2 ? 1 : -1);
258 if (c1 == '\0')
259 return 0;
260 }
261 return 0;
262}
263
264
6de9cd9a
DN
265/* Main scanner initialization. */
266
267void
268gfc_scanner_init_1 (void)
269{
d4fa05b9
TS
270 file_head = NULL;
271 line_head = NULL;
272 line_tail = NULL;
6de9cd9a 273
5a06474c
JD
274 continue_count = 0;
275 continue_line = 0;
276
6de9cd9a
DN
277 end_flag = 0;
278}
279
280
281/* Main scanner destructor. */
282
283void
284gfc_scanner_done_1 (void)
285{
d4fa05b9
TS
286 gfc_linebuf *lb;
287 gfc_file *f;
6de9cd9a 288
d4fa05b9 289 while(line_head != NULL)
6de9cd9a 290 {
d4fa05b9
TS
291 lb = line_head->next;
292 gfc_free(line_head);
293 line_head = lb;
6de9cd9a 294 }
d4fa05b9
TS
295
296 while(file_head != NULL)
6de9cd9a 297 {
d4fa05b9
TS
298 f = file_head->next;
299 gfc_free(file_head->filename);
300 gfc_free(file_head);
301 file_head = f;
6de9cd9a
DN
302 }
303}
304
305
306/* Adds path to the list pointed to by list. */
307
31198773
FXC
308static void
309add_path_to_list (gfc_directorylist **list, const char *path,
310 bool use_for_modules)
6de9cd9a
DN
311{
312 gfc_directorylist *dir;
313 const char *p;
314
315 p = path;
31198773 316 while (*p == ' ' || *p == '\t') /* someone might do "-I include" */
6de9cd9a
DN
317 if (*p++ == '\0')
318 return;
319
31198773 320 dir = *list;
6de9cd9a 321 if (!dir)
ece3f663 322 dir = *list = XCNEW (gfc_directorylist);
6de9cd9a
DN
323 else
324 {
325 while (dir->next)
326 dir = dir->next;
327
ece3f663 328 dir->next = XCNEW (gfc_directorylist);
6de9cd9a
DN
329 dir = dir->next;
330 }
331
332 dir->next = NULL;
31198773 333 dir->use_for_modules = use_for_modules;
ece3f663 334 dir->path = XCNEWVEC (char, strlen (p) + 2);
6de9cd9a
DN
335 strcpy (dir->path, p);
336 strcat (dir->path, "/"); /* make '/' last character */
337}
338
339
31198773
FXC
340void
341gfc_add_include_path (const char *path, bool use_for_modules)
342{
343 add_path_to_list (&include_dirs, path, use_for_modules);
670637ee 344 gfc_cpp_add_include_path (xstrdup(path), true);
31198773
FXC
345}
346
347
348void
349gfc_add_intrinsic_modules_path (const char *path)
350{
351 add_path_to_list (&intrinsic_modules_dirs, path, true);
352}
353
354
6de9cd9a
DN
355/* Release resources allocated for options. */
356
357void
358gfc_release_include_path (void)
359{
360 gfc_directorylist *p;
361
6de9cd9a
DN
362 while (include_dirs != NULL)
363 {
364 p = include_dirs;
365 include_dirs = include_dirs->next;
366 gfc_free (p->path);
367 gfc_free (p);
368 }
31198773 369
31198773
FXC
370 while (intrinsic_modules_dirs != NULL)
371 {
372 p = intrinsic_modules_dirs;
373 intrinsic_modules_dirs = intrinsic_modules_dirs->next;
374 gfc_free (p->path);
375 gfc_free (p);
376 }
1bc23383
FXC
377
378 gfc_free (gfc_option.module_dir);
6de9cd9a
DN
379}
380
6de9cd9a 381
31198773
FXC
382static FILE *
383open_included_file (const char *name, gfc_directorylist *list, bool module)
6de9cd9a 384{
200cfbe7 385 char *fullname;
6de9cd9a
DN
386 gfc_directorylist *p;
387 FILE *f;
388
31198773 389 for (p = list; p; p = p->next)
b424a572 390 {
31198773
FXC
391 if (module && !p->use_for_modules)
392 continue;
6de9cd9a 393
200cfbe7 394 fullname = (char *) alloca(strlen (p->path) + strlen (name) + 1);
6de9cd9a
DN
395 strcpy (fullname, p->path);
396 strcat (fullname, name);
397
398 f = gfc_open_file (fullname);
399 if (f != NULL)
400 return f;
401 }
402
403 return NULL;
404}
405
31198773
FXC
406
407/* Opens file for reading, searching through the include directories
408 given if necessary. If the include_cwd argument is true, we try
409 to open the file in the current directory first. */
410
411FILE *
412gfc_open_included_file (const char *name, bool include_cwd, bool module)
413{
414 FILE *f;
415
e01f74e0
TB
416 if (IS_ABSOLUTE_PATH (name))
417 return gfc_open_file (name);
418
31198773
FXC
419 if (include_cwd)
420 {
421 f = gfc_open_file (name);
422 if (f != NULL)
423 return f;
424 }
425
426 return open_included_file (name, include_dirs, module);
427}
428
429FILE *
430gfc_open_intrinsic_module (const char *name)
431{
e01f74e0
TB
432 if (IS_ABSOLUTE_PATH (name))
433 return gfc_open_file (name);
434
31198773
FXC
435 return open_included_file (name, intrinsic_modules_dirs, true);
436}
437
edf1eac2 438
6de9cd9a
DN
439/* Test to see if we're at the end of the main source file. */
440
441int
442gfc_at_end (void)
443{
6de9cd9a
DN
444 return end_flag;
445}
446
447
448/* Test to see if we're at the end of the current file. */
449
450int
451gfc_at_eof (void)
452{
6de9cd9a
DN
453 if (gfc_at_end ())
454 return 1;
455
d4fa05b9 456 if (line_head == NULL)
6de9cd9a
DN
457 return 1; /* Null file */
458
63645982 459 if (gfc_current_locus.lb == NULL)
6de9cd9a
DN
460 return 1;
461
462 return 0;
463}
464
465
466/* Test to see if we're at the beginning of a new line. */
467
468int
469gfc_at_bol (void)
470{
6de9cd9a
DN
471 if (gfc_at_eof ())
472 return 1;
473
63645982 474 return (gfc_current_locus.nextc == gfc_current_locus.lb->line);
6de9cd9a
DN
475}
476
477
478/* Test to see if we're at the end of a line. */
479
480int
481gfc_at_eol (void)
482{
6de9cd9a
DN
483 if (gfc_at_eof ())
484 return 1;
485
63645982 486 return (*gfc_current_locus.nextc == '\0');
6de9cd9a
DN
487}
488
60332588 489static void
1b271c9b 490add_file_change (const char *filename, int line)
60332588 491{
1b271c9b
JJ
492 if (file_changes_count == file_changes_allocated)
493 {
494 if (file_changes_allocated)
495 file_changes_allocated *= 2;
496 else
497 file_changes_allocated = 16;
ece3f663
KG
498 file_changes = XRESIZEVEC (struct gfc_file_change, file_changes,
499 file_changes_allocated);
1b271c9b
JJ
500 }
501 file_changes[file_changes_count].filename = filename;
502 file_changes[file_changes_count].lb = NULL;
503 file_changes[file_changes_count++].line = line;
504}
60332588 505
1b271c9b
JJ
506static void
507report_file_change (gfc_linebuf *lb)
508{
509 size_t c = file_changes_cur;
510 while (c < file_changes_count
511 && file_changes[c].lb == lb)
512 {
513 if (file_changes[c].filename)
514 (*debug_hooks->start_source_file) (file_changes[c].line,
515 file_changes[c].filename);
516 else
517 (*debug_hooks->end_source_file) (file_changes[c].line);
518 ++c;
519 }
520 file_changes_cur = c;
60332588
JJ
521}
522
523void
524gfc_start_source_files (void)
525{
526 /* If the debugger wants the name of the main source file,
527 we give it. */
528 if (debug_hooks->start_end_main_source_file)
529 (*debug_hooks->start_source_file) (0, gfc_source_file);
530
1b271c9b
JJ
531 file_changes_cur = 0;
532 report_file_change (gfc_current_locus.lb);
60332588
JJ
533}
534
535void
536gfc_end_source_files (void)
537{
1b271c9b 538 report_file_change (NULL);
60332588
JJ
539
540 if (debug_hooks->start_end_main_source_file)
541 (*debug_hooks->end_source_file) (0);
542}
6de9cd9a
DN
543
544/* Advance the current line pointer to the next line. */
545
546void
547gfc_advance_line (void)
548{
6de9cd9a 549 if (gfc_at_end ())
4a58b9ad 550 return;
6de9cd9a 551
63645982 552 if (gfc_current_locus.lb == NULL)
6de9cd9a 553 {
d4fa05b9
TS
554 end_flag = 1;
555 return;
556 }
6de9cd9a 557
9e8a6720 558 if (gfc_current_locus.lb->next
60332588 559 && !gfc_current_locus.lb->next->dbg_emitted)
9e8a6720 560 {
1b271c9b 561 report_file_change (gfc_current_locus.lb->next);
60332588 562 gfc_current_locus.lb->next->dbg_emitted = true;
9e8a6720
FXC
563 }
564
63645982 565 gfc_current_locus.lb = gfc_current_locus.lb->next;
6de9cd9a 566
edf1eac2 567 if (gfc_current_locus.lb != NULL)
63645982 568 gfc_current_locus.nextc = gfc_current_locus.lb->line;
d4fa05b9
TS
569 else
570 {
63645982 571 gfc_current_locus.nextc = NULL;
d4fa05b9
TS
572 end_flag = 1;
573 }
6de9cd9a
DN
574}
575
576
577/* Get the next character from the input, advancing gfc_current_file's
578 locus. When we hit the end of the line or the end of the file, we
579 start returning a '\n' in order to complete the current statement.
580 No Fortran line conventions are implemented here.
581
582 Requiring explicit advances to the next line prevents the parse
583 pointer from being on the wrong line if the current statement ends
584 prematurely. */
585
8fc541d3 586static gfc_char_t
6de9cd9a
DN
587next_char (void)
588{
8fc541d3 589 gfc_char_t c;
d4fa05b9 590
63645982 591 if (gfc_current_locus.nextc == NULL)
6de9cd9a
DN
592 return '\n';
593
8fc541d3 594 c = *gfc_current_locus.nextc++;
6de9cd9a
DN
595 if (c == '\0')
596 {
63645982 597 gfc_current_locus.nextc--; /* Remain on this line. */
6de9cd9a
DN
598 c = '\n';
599 }
600
601 return c;
602}
603
edf1eac2 604
6de9cd9a
DN
605/* Skip a comment. When we come here the parse pointer is positioned
606 immediately after the comment character. If we ever implement
607 compiler directives within comments, here is where we parse the
608 directive. */
609
static void
skip_comment_line (void)
{
  /* Eat the rest of the line, then step onto the next one.  */
  while (next_char () != '\n')
    ;

  gfc_advance_line ();
}
623
624
9e8a6720
FXC
625int
626gfc_define_undef_line (void)
627{
8fc541d3
FXC
628 char *tmp;
629
9e8a6720 630 /* All lines beginning with '#' are either #define or #undef. */
8fc541d3 631 if (debug_info_level != DINFO_LEVEL_VERBOSE || gfc_peek_ascii_char () != '#')
9e8a6720
FXC
632 return 0;
633
8fc541d3
FXC
634 if (wide_strncmp (gfc_current_locus.nextc, "#define ", 8) == 0)
635 {
00660189 636 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[8], -1);
8fc541d3
FXC
637 (*debug_hooks->define) (gfc_linebuf_linenum (gfc_current_locus.lb),
638 tmp);
639 gfc_free (tmp);
640 }
9e8a6720 641
8fc541d3
FXC
642 if (wide_strncmp (gfc_current_locus.nextc, "#undef ", 7) == 0)
643 {
00660189 644 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[7], -1);
8fc541d3
FXC
645 (*debug_hooks->undef) (gfc_linebuf_linenum (gfc_current_locus.lb),
646 tmp);
647 gfc_free (tmp);
648 }
9e8a6720
FXC
649
650 /* Skip the rest of the line. */
651 skip_comment_line ();
652
653 return 1;
654}
655
656
6de9cd9a 657/* Comment lines are null lines, lines containing only blanks or lines
0d3abf6f
JJ
658 on which the first nonblank character is a '!'.
659 Return true if !$ openmp conditional compilation sentinel was
660 seen. */
6de9cd9a 661
0d3abf6f 662static bool
6de9cd9a
DN
663skip_free_comments (void)
664{
665 locus start;
8fc541d3 666 gfc_char_t c;
6c7a4dfd 667 int at_bol;
6de9cd9a
DN
668
669 for (;;)
670 {
6c7a4dfd 671 at_bol = gfc_at_bol ();
63645982 672 start = gfc_current_locus;
6de9cd9a
DN
673 if (gfc_at_eof ())
674 break;
675
676 do
6c7a4dfd 677 c = next_char ();
6de9cd9a
DN
678 while (gfc_is_whitespace (c));
679
680 if (c == '\n')
681 {
682 gfc_advance_line ();
683 continue;
684 }
685
686 if (c == '!')
687 {
6c7a4dfd
JJ
688 /* If -fopenmp, we need to handle here 2 things:
689 1) don't treat !$omp as comments, but directives
690 2) handle OpenMP conditional compilation, where
691 !$ should be treated as 2 spaces (for initial lines
692 only if followed by space). */
693 if (gfc_option.flag_openmp && at_bol)
694 {
695 locus old_loc = gfc_current_locus;
696 if (next_char () == '$')
697 {
698 c = next_char ();
699 if (c == 'o' || c == 'O')
700 {
701 if (((c = next_char ()) == 'm' || c == 'M')
9fa6cfec 702 && ((c = next_char ()) == 'p' || c == 'P'))
6c7a4dfd 703 {
a68ab351
JJ
704 if ((c = next_char ()) == ' ' || c == '\t'
705 || continue_flag)
6c7a4dfd 706 {
9fa6cfec
TB
707 while (gfc_is_whitespace (c))
708 c = next_char ();
709 if (c != '\n' && c != '!')
710 {
711 openmp_flag = 1;
712 openmp_locus = old_loc;
713 gfc_current_locus = start;
714 return false;
715 }
6c7a4dfd 716 }
9fa6cfec
TB
717 else
718 gfc_warning_now ("!$OMP at %C starts a commented "
719 "line as it neither is followed "
720 "by a space nor is a "
721 "continuation line");
6c7a4dfd
JJ
722 }
723 gfc_current_locus = old_loc;
724 next_char ();
725 c = next_char ();
726 }
a68ab351 727 if (continue_flag || c == ' ' || c == '\t')
6c7a4dfd
JJ
728 {
729 gfc_current_locus = old_loc;
730 next_char ();
b30c6a0d 731 openmp_flag = 0;
0d3abf6f 732 return true;
6c7a4dfd
JJ
733 }
734 }
735 gfc_current_locus = old_loc;
736 }
6de9cd9a
DN
737 skip_comment_line ();
738 continue;
739 }
740
741 break;
742 }
743
6c7a4dfd
JJ
744 if (openmp_flag && at_bol)
745 openmp_flag = 0;
63645982 746 gfc_current_locus = start;
0d3abf6f 747 return false;
6de9cd9a
DN
748}
749
750
751/* Skip comment lines in fixed source mode. We have the same rules as
752 in skip_free_comment(), except that we can have a 'c', 'C' or '*'
e0bcf78c
TS
753 in column 1, and a '!' cannot be in column 6. Also, we deal with
754 lines with 'd' or 'D' in column 1, if the user requested this. */
6de9cd9a
DN
755
756static void
757skip_fixed_comments (void)
758{
759 locus start;
760 int col;
8fc541d3 761 gfc_char_t c;
6de9cd9a 762
6c7a4dfd
JJ
763 if (! gfc_at_bol ())
764 {
765 start = gfc_current_locus;
766 if (! gfc_at_eof ())
767 {
768 do
769 c = next_char ();
770 while (gfc_is_whitespace (c));
771
772 if (c == '\n')
773 gfc_advance_line ();
774 else if (c == '!')
775 skip_comment_line ();
776 }
777
778 if (! gfc_at_bol ())
779 {
780 gfc_current_locus = start;
781 return;
782 }
783 }
784
6de9cd9a
DN
785 for (;;)
786 {
63645982 787 start = gfc_current_locus;
6de9cd9a
DN
788 if (gfc_at_eof ())
789 break;
790
791 c = next_char ();
792 if (c == '\n')
793 {
794 gfc_advance_line ();
795 continue;
796 }
797
798 if (c == '!' || c == 'c' || c == 'C' || c == '*')
799 {
6c7a4dfd
JJ
800 /* If -fopenmp, we need to handle here 2 things:
801 1) don't treat !$omp|c$omp|*$omp as comments, but directives
802 2) handle OpenMP conditional compilation, where
803 !$|c$|*$ should be treated as 2 spaces if the characters
804 in columns 3 to 6 are valid fixed form label columns
805 characters. */
f449022d
JD
806 if (gfc_current_locus.lb != NULL
807 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
808 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
809
6c7a4dfd
JJ
810 if (gfc_option.flag_openmp)
811 {
812 if (next_char () == '$')
813 {
814 c = next_char ();
815 if (c == 'o' || c == 'O')
816 {
817 if (((c = next_char ()) == 'm' || c == 'M')
818 && ((c = next_char ()) == 'p' || c == 'P'))
819 {
820 c = next_char ();
821 if (c != '\n'
822 && ((openmp_flag && continue_flag)
a68ab351 823 || c == ' ' || c == '\t' || c == '0'))
6c7a4dfd 824 {
a68ab351 825 do
6c7a4dfd 826 c = next_char ();
a68ab351 827 while (gfc_is_whitespace (c));
6c7a4dfd
JJ
828 if (c != '\n' && c != '!')
829 {
830 /* Canonicalize to *$omp. */
831 *start.nextc = '*';
832 openmp_flag = 1;
833 gfc_current_locus = start;
834 return;
835 }
836 }
837 }
838 }
839 else
840 {
841 int digit_seen = 0;
842
843 for (col = 3; col < 6; col++, c = next_char ())
844 if (c == ' ')
845 continue;
a68ab351
JJ
846 else if (c == '\t')
847 {
848 col = 6;
849 break;
850 }
6c7a4dfd
JJ
851 else if (c < '0' || c > '9')
852 break;
853 else
854 digit_seen = 1;
855
856 if (col == 6 && c != '\n'
857 && ((continue_flag && !digit_seen)
a68ab351 858 || c == ' ' || c == '\t' || c == '0'))
6c7a4dfd
JJ
859 {
860 gfc_current_locus = start;
861 start.nextc[0] = ' ';
862 start.nextc[1] = ' ';
863 continue;
864 }
865 }
866 }
867 gfc_current_locus = start;
868 }
6de9cd9a
DN
869 skip_comment_line ();
870 continue;
871 }
872
e0bcf78c
TS
873 if (gfc_option.flag_d_lines != -1 && (c == 'd' || c == 'D'))
874 {
875 if (gfc_option.flag_d_lines == 0)
876 {
877 skip_comment_line ();
878 continue;
879 }
880 else
881 *start.nextc = c = ' ';
882 }
883
6de9cd9a 884 col = 1;
e0bcf78c
TS
885
886 while (gfc_is_whitespace (c))
6de9cd9a
DN
887 {
888 c = next_char ();
889 col++;
890 }
6de9cd9a
DN
891
892 if (c == '\n')
893 {
894 gfc_advance_line ();
895 continue;
896 }
897
898 if (col != 6 && c == '!')
899 {
f449022d
JD
900 if (gfc_current_locus.lb != NULL
901 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
902 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
6de9cd9a
DN
903 skip_comment_line ();
904 continue;
905 }
906
907 break;
908 }
909
6c7a4dfd 910 openmp_flag = 0;
63645982 911 gfc_current_locus = start;
6de9cd9a
DN
912}
913
914
6c7a4dfd 915/* Skips the current line if it is a comment. */
6de9cd9a
DN
916
917void
918gfc_skip_comments (void)
919{
6c7a4dfd 920 if (gfc_current_form == FORM_FREE)
6de9cd9a
DN
921 skip_free_comments ();
922 else
923 skip_fixed_comments ();
924}
925
926
927/* Get the next character from the input, taking continuation lines
928 and end-of-line comments into account. This implies that comment
929 lines between continued lines must be eaten here. For higher-level
930 subroutines, this flattens continued lines into a single logical
931 line. The in_string flag denotes whether we're inside a character
932 context or not. */
933
8fc541d3 934gfc_char_t
6de9cd9a
DN
935gfc_next_char_literal (int in_string)
936{
937 locus old_loc;
8fc541d3
FXC
938 int i, prev_openmp_flag;
939 gfc_char_t c;
6de9cd9a
DN
940
941 continue_flag = 0;
942
943restart:
944 c = next_char ();
945 if (gfc_at_end ())
5a06474c
JD
946 {
947 continue_count = 0;
948 return c;
949 }
6de9cd9a 950
d4fa05b9 951 if (gfc_current_form == FORM_FREE)
6de9cd9a 952 {
0d3abf6f
JJ
953 bool openmp_cond_flag;
954
6de9cd9a
DN
955 if (!in_string && c == '!')
956 {
6c7a4dfd
JJ
957 if (openmp_flag
958 && memcmp (&gfc_current_locus, &openmp_locus,
959 sizeof (gfc_current_locus)) == 0)
960 goto done;
961
6de9cd9a
DN
962 /* This line can't be continued */
963 do
964 {
965 c = next_char ();
966 }
967 while (c != '\n');
968
a34938be
RG
969 /* Avoid truncation warnings for comment ending lines. */
970 gfc_current_locus.lb->truncated = 0;
971
6de9cd9a
DN
972 goto done;
973 }
974
975 if (c != '&')
976 goto done;
977
978 /* If the next nonblank character is a ! or \n, we've got a
6c7a4dfd 979 continuation line. */
63645982 980 old_loc = gfc_current_locus;
6de9cd9a
DN
981
982 c = next_char ();
983 while (gfc_is_whitespace (c))
984 c = next_char ();
985
986 /* Character constants to be continued cannot have commentary
6c7a4dfd 987 after the '&'. */
6de9cd9a
DN
988
989 if (in_string && c != '\n')
990 {
63645982 991 gfc_current_locus = old_loc;
6de9cd9a
DN
992 c = '&';
993 goto done;
994 }
995
996 if (c != '!' && c != '\n')
997 {
63645982 998 gfc_current_locus = old_loc;
6de9cd9a
DN
999 c = '&';
1000 goto done;
1001 }
1002
6c7a4dfd 1003 prev_openmp_flag = openmp_flag;
6de9cd9a
DN
1004 continue_flag = 1;
1005 if (c == '!')
1006 skip_comment_line ();
1007 else
1008 gfc_advance_line ();
0267ffdc
JD
1009
1010 if (gfc_at_eof())
1011 goto not_continuation;
6de9cd9a 1012
5a06474c
JD
1013 /* We've got a continuation line. If we are on the very next line after
1014 the last continuation, increment the continuation line count and
1015 check whether the limit has been exceeded. */
5ffeb913 1016 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
5a06474c
JD
1017 {
1018 if (++continue_count == gfc_option.max_continue_free)
1019 {
edf1eac2
SK
1020 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1021 gfc_warning ("Limit of %d continuations exceeded in "
1022 "statement at %C", gfc_option.max_continue_free);
5a06474c
JD
1023 }
1024 }
5a06474c
JD
1025
1026 /* Now find where it continues. First eat any comment lines. */
0d3abf6f 1027 openmp_cond_flag = skip_free_comments ();
6de9cd9a 1028
f449022d
JD
1029 if (gfc_current_locus.lb != NULL
1030 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1031 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
1032
6c7a4dfd
JJ
1033 if (prev_openmp_flag != openmp_flag)
1034 {
1035 gfc_current_locus = old_loc;
1036 openmp_flag = prev_openmp_flag;
1037 c = '&';
1038 goto done;
1039 }
1040
6de9cd9a 1041 /* Now that we have a non-comment line, probe ahead for the
6c7a4dfd
JJ
1042 first non-whitespace character. If it is another '&', then
1043 reading starts at the next character, otherwise we must back
1044 up to where the whitespace started and resume from there. */
6de9cd9a 1045
63645982 1046 old_loc = gfc_current_locus;
6de9cd9a
DN
1047
1048 c = next_char ();
1049 while (gfc_is_whitespace (c))
1050 c = next_char ();
1051
6c7a4dfd
JJ
1052 if (openmp_flag)
1053 {
1054 for (i = 0; i < 5; i++, c = next_char ())
1055 {
8fc541d3 1056 gcc_assert (gfc_wide_tolower (c) == (unsigned char) "!$omp"[i]);
6c7a4dfd
JJ
1057 if (i == 4)
1058 old_loc = gfc_current_locus;
1059 }
1060 while (gfc_is_whitespace (c))
1061 c = next_char ();
1062 }
1063
6de9cd9a 1064 if (c != '&')
3fbab549 1065 {
5a06474c
JD
1066 if (in_string)
1067 {
1068 if (gfc_option.warn_ampersand)
edf1eac2
SK
1069 gfc_warning_now ("Missing '&' in continued character "
1070 "constant at %C");
5a06474c
JD
1071 gfc_current_locus.nextc--;
1072 }
0d3abf6f
JJ
1073 /* Both !$omp and !$ -fopenmp continuation lines have & on the
1074 continuation line only optionally. */
1075 else if (openmp_flag || openmp_cond_flag)
1076 gfc_current_locus.nextc--;
5a06474c
JD
1077 else
1078 {
1079 c = ' ';
1080 gfc_current_locus = old_loc;
1081 goto done;
1082 }
3fbab549 1083 }
6de9cd9a
DN
1084 }
1085 else
1086 {
1087 /* Fixed form continuation. */
1088 if (!in_string && c == '!')
1089 {
1090 /* Skip comment at end of line. */
1091 do
1092 {
1093 c = next_char ();
1094 }
1095 while (c != '\n');
a34938be
RG
1096
1097 /* Avoid truncation warnings for comment ending lines. */
1098 gfc_current_locus.lb->truncated = 0;
6de9cd9a
DN
1099 }
1100
1101 if (c != '\n')
1102 goto done;
1103
6c7a4dfd 1104 prev_openmp_flag = openmp_flag;
6de9cd9a 1105 continue_flag = 1;
63645982 1106 old_loc = gfc_current_locus;
6de9cd9a
DN
1107
1108 gfc_advance_line ();
0d3abf6f 1109 skip_fixed_comments ();
6de9cd9a
DN
1110
1111 /* See if this line is a continuation line. */
6c7a4dfd 1112 if (openmp_flag != prev_openmp_flag)
6de9cd9a 1113 {
6c7a4dfd
JJ
1114 openmp_flag = prev_openmp_flag;
1115 goto not_continuation;
6de9cd9a
DN
1116 }
1117
6c7a4dfd
JJ
1118 if (!openmp_flag)
1119 for (i = 0; i < 5; i++)
1120 {
1121 c = next_char ();
1122 if (c != ' ')
1123 goto not_continuation;
1124 }
1125 else
1126 for (i = 0; i < 5; i++)
1127 {
1128 c = next_char ();
8fc541d3 1129 if (gfc_wide_tolower (c) != (unsigned char) "*$omp"[i])
6c7a4dfd
JJ
1130 goto not_continuation;
1131 }
1132
6de9cd9a 1133 c = next_char ();
6c7a4dfd 1134 if (c == '0' || c == ' ' || c == '\n')
6de9cd9a 1135 goto not_continuation;
5a06474c
JD
1136
1137 /* We've got a continuation line. If we are on the very next line after
1138 the last continuation, increment the continuation line count and
1139 check whether the limit has been exceeded. */
5ffeb913 1140 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
5a06474c
JD
1141 {
1142 if (++continue_count == gfc_option.max_continue_fixed)
1143 {
edf1eac2
SK
1144 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1145 gfc_warning ("Limit of %d continuations exceeded in "
1146 "statement at %C",
1147 gfc_option.max_continue_fixed);
5a06474c
JD
1148 }
1149 }
1150
f449022d
JD
1151 if (gfc_current_locus.lb != NULL
1152 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
5ffeb913 1153 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
6de9cd9a
DN
1154 }
1155
1156 /* Ready to read first character of continuation line, which might
1157 be another continuation line! */
1158 goto restart;
1159
1160not_continuation:
1161 c = '\n';
63645982 1162 gfc_current_locus = old_loc;
6de9cd9a
DN
1163
1164done:
5a06474c
JD
1165 if (c == '\n')
1166 continue_count = 0;
6de9cd9a
DN
1167 continue_flag = 0;
1168 return c;
1169}
1170
1171
1172/* Get the next character of input, folded to lowercase. In fixed
1173 form mode, we also ignore spaces. When matcher subroutines are
1174 parsing character literals, they have to call
1175 gfc_next_char_literal(). */
1176
8fc541d3 1177gfc_char_t
6de9cd9a
DN
1178gfc_next_char (void)
1179{
8fc541d3 1180 gfc_char_t c;
6de9cd9a
DN
1181
1182 do
1183 {
1184 c = gfc_next_char_literal (0);
1185 }
d4fa05b9 1186 while (gfc_current_form == FORM_FIXED && gfc_is_whitespace (c));
6de9cd9a 1187
8fc541d3 1188 return gfc_wide_tolower (c);
6de9cd9a
DN
1189}
1190
8fc541d3
FXC
1191char
1192gfc_next_ascii_char (void)
1193{
1194 gfc_char_t c = gfc_next_char ();
6de9cd9a 1195
8fc541d3
FXC
1196 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1197 : (unsigned char) UCHAR_MAX);
1198}
1199
1200
1201gfc_char_t
6de9cd9a
DN
1202gfc_peek_char (void)
1203{
1204 locus old_loc;
8fc541d3 1205 gfc_char_t c;
6de9cd9a 1206
63645982 1207 old_loc = gfc_current_locus;
6de9cd9a 1208 c = gfc_next_char ();
63645982 1209 gfc_current_locus = old_loc;
6de9cd9a
DN
1210
1211 return c;
1212}
1213
1214
8fc541d3
FXC
1215char
1216gfc_peek_ascii_char (void)
1217{
1218 gfc_char_t c = gfc_peek_char ();
1219
1220 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1221 : (unsigned char) UCHAR_MAX);
1222}
1223
1224
6de9cd9a
DN
1225/* Recover from an error. We try to get past the current statement
1226 and get lined up for the next. The next statement follows a '\n'
1227 or a ';'. We also assume that we are not within a character
1228 constant, and deal with finding a '\'' or '"'. */
1229
1230void
1231gfc_error_recovery (void)
1232{
8fc541d3 1233 gfc_char_t c, delim;
6de9cd9a
DN
1234
1235 if (gfc_at_eof ())
1236 return;
1237
1238 for (;;)
1239 {
1240 c = gfc_next_char ();
1241 if (c == '\n' || c == ';')
1242 break;
1243
1244 if (c != '\'' && c != '"')
1245 {
1246 if (gfc_at_eof ())
1247 break;
1248 continue;
1249 }
1250 delim = c;
1251
1252 for (;;)
1253 {
1254 c = next_char ();
1255
1256 if (c == delim)
1257 break;
1258 if (c == '\n')
ba1defa5 1259 return;
6de9cd9a
DN
1260 if (c == '\\')
1261 {
1262 c = next_char ();
1263 if (c == '\n')
ba1defa5 1264 return;
6de9cd9a
DN
1265 }
1266 }
1267 if (gfc_at_eof ())
1268 break;
1269 }
6de9cd9a
DN
1270}
1271
1272
1273/* Read ahead until the next character to be read is not whitespace. */
1274
1275void
1276gfc_gobble_whitespace (void)
1277{
840bd9f7 1278 static int linenum = 0;
6de9cd9a 1279 locus old_loc;
8fc541d3 1280 gfc_char_t c;
6de9cd9a
DN
1281
1282 do
1283 {
63645982 1284 old_loc = gfc_current_locus;
6de9cd9a 1285 c = gfc_next_char_literal (0);
840bd9f7
SK
1286 /* Issue a warning for nonconforming tabs. We keep track of the line
1287 number because the Fortran matchers will often back up and the same
1288 line will be scanned multiple times. */
45a82bd9 1289 if (!gfc_option.warn_tabs && c == '\t')
840bd9f7 1290 {
45a82bd9 1291 int cur_linenum = LOCATION_LINE (gfc_current_locus.lb->location);
45a82bd9
PB
1292 if (cur_linenum != linenum)
1293 {
1294 linenum = cur_linenum;
1295 gfc_warning_now ("Nonconforming tab character at %C");
1296 }
840bd9f7 1297 }
6de9cd9a
DN
1298 }
1299 while (gfc_is_whitespace (c));
1300
63645982 1301 gfc_current_locus = old_loc;
6de9cd9a
DN
1302}
1303
1304
f56c5d5d
TS
1305/* Load a single line into pbuf.
1306
1307 If pbuf points to a NULL pointer, it is allocated.
1308 We truncate lines that are too long, unless we're dealing with
1309 preprocessor lines or if the option -ffixed-line-length-none is set,
1310 in which case we reallocate the buffer to fit the entire line, if
1311 need be.
1312 In fixed mode, we expand a tab that occurs within the statement
1313 label region to expand to spaces that leave the next character in
ba1defa5 1314 the source region.
f2f5443c
FXC
1315
1316 If first_char is not NULL, it's a pointer to a single char value holding
1317 the first character of the line, which has already been read by the
1318 caller. This avoids the use of ungetc().
1319
1526c4b5
JD
1320 load_line returns whether the line was truncated.
1321
1322 NOTE: The error machinery isn't available at this point, so we can't
1323 easily report line and column numbers consistent with other
1324 parts of gfortran. */
6de9cd9a 1325
ba1defa5 1326static int
f2f5443c 1327load_line (FILE *input, gfc_char_t **pbuf, int *pbuflen, const int *first_char)
6de9cd9a 1328{
840bd9f7 1329 static int linenum = 0, current_line = 1;
d1e3d6ae 1330 int c, maxlen, i, preprocessor_flag, buflen = *pbuflen;
840bd9f7 1331 int trunc_flag = 0, seen_comment = 0;
1526c4b5 1332 int seen_printable = 0, seen_ampersand = 0;
8fc541d3 1333 gfc_char_t *buffer;
fd1935d5 1334 bool found_tab = false;
f56c5d5d 1335
1dde8683 1336 /* Determine the maximum allowed line length. */
f56c5d5d 1337 if (gfc_current_form == FORM_FREE)
1dde8683 1338 maxlen = gfc_option.free_line_length;
16ab8e74 1339 else if (gfc_current_form == FORM_FIXED)
1dde8683 1340 maxlen = gfc_option.fixed_line_length;
f56c5d5d 1341 else
16ab8e74 1342 maxlen = 72;
f56c5d5d
TS
1343
1344 if (*pbuf == NULL)
1345 {
1dde8683
BM
1346 /* Allocate the line buffer, storing its length into buflen.
1347 Note that if maxlen==0, indicating that arbitrary-length lines
1348 are allowed, the buffer will be reallocated if this length is
1349 insufficient; since 132 characters is the length of a standard
1350 free-form line, we use that as a starting guess. */
f56c5d5d
TS
1351 if (maxlen > 0)
1352 buflen = maxlen;
1353 else
1dde8683 1354 buflen = 132;
6de9cd9a 1355
00660189 1356 *pbuf = gfc_get_wide_string (buflen + 1);
f56c5d5d 1357 }
6de9cd9a
DN
1358
1359 i = 0;
f56c5d5d 1360 buffer = *pbuf;
6de9cd9a 1361
f2f5443c
FXC
1362 if (first_char)
1363 c = *first_char;
1364 else
1365 c = getc (input);
1366
1367 /* In order to not truncate preprocessor lines, we have to
1368 remember that this is one. */
1369 preprocessor_flag = (c == '#' ? 1 : 0);
fa841200 1370
6de9cd9a
DN
1371 for (;;)
1372 {
6de9cd9a
DN
1373 if (c == EOF)
1374 break;
f2f5443c 1375
6de9cd9a 1376 if (c == '\n')
1526c4b5
JD
1377 {
1378 /* Check for illegal use of ampersand. See F95 Standard 3.3.1.3. */
1379 if (gfc_current_form == FORM_FREE
c284e499 1380 && !seen_printable && seen_ampersand)
1526c4b5
JD
1381 {
1382 if (pedantic)
edf1eac2
SK
1383 gfc_error_now ("'&' not allowed by itself in line %d",
1384 current_line);
1526c4b5 1385 else
edf1eac2
SK
1386 gfc_warning_now ("'&' not allowed by itself in line %d",
1387 current_line);
1526c4b5
JD
1388 }
1389 break;
1390 }
6de9cd9a 1391
f2f5443c
FXC
1392 if (c == '\r' || c == '\0')
1393 goto next_char; /* Gobble characters. */
6de9cd9a 1394
1526c4b5 1395 if (c == '&')
1526c4b5 1396 {
c284e499
JD
1397 if (seen_ampersand)
1398 seen_ampersand = 0;
1526c4b5 1399 else
c284e499 1400 seen_ampersand = 1;
1526c4b5
JD
1401 }
1402
bd5db9de 1403 if ((c != '&' && c != '!' && c != ' ') || (c == '!' && !seen_ampersand))
c284e499
JD
1404 seen_printable = 1;
1405
840bd9f7
SK
1406 /* Is this a fixed-form comment? */
1407 if (gfc_current_form == FORM_FIXED && i == 0
1408 && (c == '*' || c == 'c' || c == 'd'))
1409 seen_comment = 1;
1410
fd1935d5
TB
1411 /* Vendor extension: "<tab>1" marks a continuation line. */
1412 if (found_tab)
840bd9f7 1413 {
fd1935d5
TB
1414 found_tab = false;
1415 if (c >= '1' && c <= '9')
1416 {
1417 *(buffer-1) = c;
f2f5443c 1418 goto next_char;
fd1935d5
TB
1419 }
1420 }
1421
1422 if (gfc_current_form == FORM_FIXED && c == '\t' && i < 6)
1423 {
1424 found_tab = true;
1425
840bd9f7
SK
1426 if (!gfc_option.warn_tabs && seen_comment == 0
1427 && current_line != linenum)
1428 {
1429 linenum = current_line;
fd1935d5
TB
1430 gfc_warning_now ("Nonconforming tab character in column %d "
1431 "of line %d", i+1, linenum);
840bd9f7
SK
1432 }
1433
fd1935d5 1434 while (i < 6)
6de9cd9a
DN
1435 {
1436 *buffer++ = ' ';
1437 i++;
1438 }
1439
f2f5443c 1440 goto next_char;
6de9cd9a
DN
1441 }
1442
1443 *buffer++ = c;
1444 i++;
1445
d1e3d6ae 1446 if (maxlen == 0 || preprocessor_flag)
f56c5d5d 1447 {
d1e3d6ae
JJ
1448 if (i >= buflen)
1449 {
1450 /* Reallocate line buffer to double size to hold the
3fbab549 1451 overlong line. */
d1e3d6ae 1452 buflen = buflen * 2;
ece3f663 1453 *pbuf = XRESIZEVEC (gfc_char_t, *pbuf, (buflen + 1));
edf1eac2 1454 buffer = (*pbuf) + i;
d1e3d6ae 1455 }
f56c5d5d 1456 }
d1e3d6ae 1457 else if (i >= maxlen)
16ab8e74 1458 {
f56c5d5d 1459 /* Truncate the rest of the line. */
6de9cd9a
DN
1460 for (;;)
1461 {
c4da1827 1462 c = getc (input);
6de9cd9a
DN
1463 if (c == '\n' || c == EOF)
1464 break;
a34938be
RG
1465
1466 trunc_flag = 1;
6de9cd9a
DN
1467 }
1468
f2f5443c
FXC
1469 c = '\n';
1470 continue;
6de9cd9a 1471 }
f2f5443c
FXC
1472
1473next_char:
1474 c = getc (input);
6de9cd9a
DN
1475 }
1476
f56c5d5d
TS
1477 /* Pad lines to the selected line length in fixed form. */
1478 if (gfc_current_form == FORM_FIXED
043c2d9e 1479 && gfc_option.fixed_line_length != 0
f56c5d5d
TS
1480 && !preprocessor_flag
1481 && c != EOF)
043c2d9e
BF
1482 {
1483 while (i++ < maxlen)
1484 *buffer++ = ' ';
1485 }
f56c5d5d 1486
6de9cd9a 1487 *buffer = '\0';
d1e3d6ae 1488 *pbuflen = buflen;
840bd9f7 1489 current_line++;
ba1defa5
RG
1490
1491 return trunc_flag;
6de9cd9a
DN
1492}
1493
1494
d4fa05b9
TS
1495/* Get a gfc_file structure, initialize it and add it to
1496 the file stack. */
1497
1498static gfc_file *
e0bcf78c 1499get_file (const char *name, enum lc_reason reason ATTRIBUTE_UNUSED)
d4fa05b9
TS
1500{
1501 gfc_file *f;
1502
ece3f663 1503 f = XCNEW (gfc_file);
d4fa05b9 1504
ece3f663 1505 f->filename = xstrdup (name);
d4fa05b9
TS
1506
1507 f->next = file_head;
1508 file_head = f;
1509
60332588 1510 f->up = current_file;
d4fa05b9 1511 if (current_file != NULL)
1b271c9b 1512 f->inclusion_line = current_file->line;
d4fa05b9 1513
5ffeb913 1514 linemap_add (line_table, reason, false, f->filename, 1);
c8cc8542 1515
d4fa05b9
TS
1516 return f;
1517}
1518
8fc541d3 1519
d4fa05b9
TS
1520/* Deal with a line from the C preprocessor. The
1521 initial octothorp has already been seen. */
6de9cd9a
DN
1522
1523static void
8fc541d3 1524preprocessor_line (gfc_char_t *c)
6de9cd9a 1525{
d4fa05b9
TS
1526 bool flag[5];
1527 int i, line;
8fc541d3 1528 gfc_char_t *wide_filename;
d4fa05b9 1529 gfc_file *f;
2d7c7df6 1530 int escaped, unescape;
8fc541d3 1531 char *filename;
6de9cd9a 1532
d4fa05b9
TS
1533 c++;
1534 while (*c == ' ' || *c == '\t')
1535 c++;
6de9cd9a 1536
d4fa05b9 1537 if (*c < '0' || *c > '9')
fa841200 1538 goto bad_cpp_line;
6de9cd9a 1539
8fc541d3 1540 line = wide_atoi (c);
d4fa05b9 1541
8fc541d3 1542 c = wide_strchr (c, ' ');
fa841200 1543 if (c == NULL)
4c3a6ca1
JJ
1544 {
1545 /* No file name given. Set new line number. */
1546 current_file->line = line;
1547 return;
1548 }
d7d528c8
ES
1549
1550 /* Skip spaces. */
1551 while (*c == ' ' || *c == '\t')
1552 c++;
1553
1554 /* Skip quote. */
1555 if (*c != '"')
fa841200 1556 goto bad_cpp_line;
d7d528c8
ES
1557 ++c;
1558
8fc541d3 1559 wide_filename = c;
d4fa05b9 1560
d7d528c8 1561 /* Make filename end at quote. */
2d7c7df6 1562 unescape = 0;
d7d528c8 1563 escaped = false;
edf1eac2 1564 while (*c && ! (!escaped && *c == '"'))
d7d528c8
ES
1565 {
1566 if (escaped)
edf1eac2 1567 escaped = false;
2d7c7df6
JJ
1568 else if (*c == '\\')
1569 {
1570 escaped = true;
1571 unescape++;
1572 }
d7d528c8
ES
1573 ++c;
1574 }
1575
1576 if (! *c)
fa841200
TS
1577 /* Preprocessor line has no closing quote. */
1578 goto bad_cpp_line;
d7d528c8 1579
d4fa05b9
TS
1580 *c++ = '\0';
1581
2d7c7df6
JJ
1582 /* Undo effects of cpp_quote_string. */
1583 if (unescape)
1584 {
8fc541d3 1585 gfc_char_t *s = wide_filename;
b0b14c7b 1586 gfc_char_t *d = gfc_get_wide_string (c - wide_filename - unescape);
d7d528c8 1587
8fc541d3 1588 wide_filename = d;
2d7c7df6
JJ
1589 while (*s)
1590 {
1591 if (*s == '\\')
1592 *d++ = *++s;
1593 else
1594 *d++ = *s;
1595 s++;
1596 }
1597 *d = '\0';
1598 }
d7d528c8 1599
d4fa05b9 1600 /* Get flags. */
4c3a6ca1 1601
1e39a151 1602 flag[1] = flag[2] = flag[3] = flag[4] = false;
6de9cd9a 1603
6de9cd9a
DN
1604 for (;;)
1605 {
8fc541d3 1606 c = wide_strchr (c, ' ');
d4fa05b9
TS
1607 if (c == NULL)
1608 break;
6de9cd9a 1609
d4fa05b9 1610 c++;
8fc541d3 1611 i = wide_atoi (c);
6de9cd9a 1612
d4fa05b9
TS
1613 if (1 <= i && i <= 4)
1614 flag[i] = true;
1615 }
4c3a6ca1 1616
8fc541d3
FXC
1617 /* Convert the filename in wide characters into a filename in narrow
1618 characters. */
00660189 1619 filename = gfc_widechar_to_char (wide_filename, -1);
8fc541d3 1620
d4fa05b9 1621 /* Interpret flags. */
4c3a6ca1 1622
94b00ee4 1623 if (flag[1]) /* Starting new file. */
d4fa05b9 1624 {
c8cc8542 1625 f = get_file (filename, LC_RENAME);
1b271c9b 1626 add_file_change (f->filename, f->inclusion_line);
d4fa05b9
TS
1627 current_file = f;
1628 }
4c3a6ca1 1629
d4fa05b9
TS
1630 if (flag[2]) /* Ending current file. */
1631 {
94b00ee4
JJ
1632 if (!current_file->up
1633 || strcmp (current_file->up->filename, filename) != 0)
4c3a6ca1
JJ
1634 {
1635 gfc_warning_now ("%s:%d: file %s left but not entered",
1636 current_file->filename, current_file->line,
1637 filename);
2d7c7df6 1638 if (unescape)
8fc541d3
FXC
1639 gfc_free (wide_filename);
1640 gfc_free (filename);
4c3a6ca1
JJ
1641 return;
1642 }
ee07457b 1643
1b271c9b 1644 add_file_change (NULL, line);
94b00ee4 1645 current_file = current_file->up;
ee07457b
FXC
1646 linemap_add (line_table, LC_RENAME, false, current_file->filename,
1647 current_file->line);
d4fa05b9 1648 }
4c3a6ca1 1649
d4fa05b9
TS
1650 /* The name of the file can be a temporary file produced by
1651 cpp. Replace the name if it is different. */
4c3a6ca1 1652
d4fa05b9
TS
1653 if (strcmp (current_file->filename, filename) != 0)
1654 {
95213750
LB
1655 /* FIXME: we leak the old filename because a pointer to it may be stored
1656 in the linemap. Alternative could be using GC or updating linemap to
1657 point to the new name, but there is no API for that currently. */
ece3f663 1658 current_file->filename = xstrdup (filename);
d4fa05b9 1659 }
fa841200 1660
4c3a6ca1
JJ
1661 /* Set new line number. */
1662 current_file->line = line;
2d7c7df6 1663 if (unescape)
8fc541d3
FXC
1664 gfc_free (wide_filename);
1665 gfc_free (filename);
fa841200
TS
1666 return;
1667
1668 bad_cpp_line:
4c3a6ca1 1669 gfc_warning_now ("%s:%d: Illegal preprocessor directive",
fa841200
TS
1670 current_file->filename, current_file->line);
1671 current_file->line++;
d4fa05b9
TS
1672}
1673
1674
e0bcf78c 1675static try load_file (const char *, bool);
d4fa05b9
TS
1676
1677/* include_line()-- Checks a line buffer to see if it is an include
1678 line. If so, we call load_file() recursively to load the included
1679 file. We never return a syntax error because a statement like
1680 "include = 5" is perfectly legal. We return false if no include was
1681 processed or true if we matched an include. */
1682
1683static bool
8fc541d3 1684include_line (gfc_char_t *line)
d4fa05b9 1685{
8fc541d3
FXC
1686 gfc_char_t quote, *c, *begin, *stop;
1687 char *filename;
9b9e4cd6 1688
d4fa05b9 1689 c = line;
9b9e4cd6
JJ
1690
1691 if (gfc_option.flag_openmp)
1692 {
1693 if (gfc_current_form == FORM_FREE)
1694 {
1695 while (*c == ' ' || *c == '\t')
1696 c++;
1697 if (*c == '!' && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1698 c += 3;
1699 }
1700 else
1701 {
1702 if ((*c == '!' || *c == 'c' || *c == 'C' || *c == '*')
1703 && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1704 c += 3;
1705 }
1706 }
1707
d4fa05b9
TS
1708 while (*c == ' ' || *c == '\t')
1709 c++;
1710
00660189 1711 if (gfc_wide_strncasecmp (c, "include", 7))
8fc541d3 1712 return false;
d4fa05b9
TS
1713
1714 c += 7;
1715 while (*c == ' ' || *c == '\t')
1716 c++;
1717
1718 /* Find filename between quotes. */
1719
1720 quote = *c++;
1721 if (quote != '"' && quote != '\'')
1722 return false;
1723
1724 begin = c;
1725
1726 while (*c != quote && *c != '\0')
1727 c++;
1728
1729 if (*c == '\0')
1730 return false;
1731
1732 stop = c++;
1733
1734 while (*c == ' ' || *c == '\t')
1735 c++;
1736
1737 if (*c != '\0' && *c != '!')
1738 return false;
1739
f7b529fa 1740 /* We have an include line at this point. */
d4fa05b9
TS
1741
1742 *stop = '\0'; /* It's ok to trash the buffer, as this line won't be
1743 read by anything else. */
1744
00660189 1745 filename = gfc_widechar_to_char (begin, -1);
8fc541d3
FXC
1746 load_file (filename, false);
1747 gfc_free (filename);
d4fa05b9
TS
1748 return true;
1749}
1750
edf1eac2 1751
d4fa05b9
TS
1752/* Load a file into memory by calling load_line until the file ends. */
1753
1754static try
e0bcf78c 1755load_file (const char *filename, bool initial)
d4fa05b9 1756{
8fc541d3 1757 gfc_char_t *line;
d4fa05b9
TS
1758 gfc_linebuf *b;
1759 gfc_file *f;
1760 FILE *input;
d1e3d6ae 1761 int len, line_len;
caef7872 1762 bool first_line;
d4fa05b9
TS
1763
1764 for (f = current_file; f; f = f->up)
1765 if (strcmp (filename, f->filename) == 0)
1766 {
1767 gfc_error_now ("File '%s' is being included recursively", filename);
1768 return FAILURE;
1769 }
1770
1771 if (initial)
1772 {
2d7c7df6
JJ
1773 if (gfc_src_file)
1774 {
1775 input = gfc_src_file;
1776 gfc_src_file = NULL;
1777 }
1778 else
1779 input = gfc_open_file (filename);
d4fa05b9
TS
1780 if (input == NULL)
1781 {
1782 gfc_error_now ("Can't open file '%s'", filename);
1783 return FAILURE;
1784 }
1785 }
1786 else
1787 {
31198773 1788 input = gfc_open_included_file (filename, false, false);
d4fa05b9
TS
1789 if (input == NULL)
1790 {
1791 gfc_error_now ("Can't open included file '%s'", filename);
1792 return FAILURE;
1793 }
1794 }
1795
1796 /* Load the file. */
1797
c8cc8542 1798 f = get_file (filename, initial ? LC_RENAME : LC_ENTER);
1b271c9b
JJ
1799 if (!initial)
1800 add_file_change (f->filename, f->inclusion_line);
d4fa05b9
TS
1801 current_file = f;
1802 current_file->line = 1;
f56c5d5d 1803 line = NULL;
d1e3d6ae 1804 line_len = 0;
caef7872 1805 first_line = true;
d4fa05b9 1806
2d7c7df6
JJ
1807 if (initial && gfc_src_preprocessor_lines[0])
1808 {
1809 preprocessor_line (gfc_src_preprocessor_lines[0]);
1810 gfc_free (gfc_src_preprocessor_lines[0]);
1811 gfc_src_preprocessor_lines[0] = NULL;
1812 if (gfc_src_preprocessor_lines[1])
1813 {
1814 preprocessor_line (gfc_src_preprocessor_lines[1]);
1815 gfc_free (gfc_src_preprocessor_lines[1]);
1816 gfc_src_preprocessor_lines[1] = NULL;
1817 }
1818 }
1819
16ab8e74 1820 for (;;)
d4fa05b9 1821 {
f2f5443c 1822 int trunc = load_line (input, &line, &line_len, NULL);
d4fa05b9 1823
8fc541d3 1824 len = gfc_wide_strlen (line);
6de9cd9a
DN
1825 if (feof (input) && len == 0)
1826 break;
1827
caef7872
FXC
1828 /* If this is the first line of the file, it can contain a byte
1829 order mark (BOM), which we will ignore:
1830 FF FE is UTF-16 little endian,
1831 FE FF is UTF-16 big endian,
1832 EF BB BF is UTF-8. */
1833 if (first_line
8fc541d3
FXC
1834 && ((line_len >= 2 && line[0] == (unsigned char) '\xFF'
1835 && line[1] == (unsigned char) '\xFE')
1836 || (line_len >= 2 && line[0] == (unsigned char) '\xFE'
1837 && line[1] == (unsigned char) '\xFF')
1838 || (line_len >= 3 && line[0] == (unsigned char) '\xEF'
1839 && line[1] == (unsigned char) '\xBB'
1840 && line[2] == (unsigned char) '\xBF')))
caef7872 1841 {
8fc541d3 1842 int n = line[1] == (unsigned char) '\xBB' ? 3 : 2;
7b901ac4 1843 gfc_char_t *new_char = gfc_get_wide_string (line_len);
caef7872 1844
7b901ac4 1845 wide_strcpy (new_char, &line[n]);
caef7872 1846 gfc_free (line);
7b901ac4 1847 line = new_char;
caef7872
FXC
1848 len -= n;
1849 }
1850
d4fa05b9
TS
1851 /* There are three things this line can be: a line of Fortran
1852 source, an include line or a C preprocessor directive. */
6de9cd9a 1853
d4fa05b9
TS
1854 if (line[0] == '#')
1855 {
9e8a6720
FXC
1856 /* When -g3 is specified, it's possible that we emit #define
1857 and #undef lines, which we need to pass to the middle-end
1858 so that it can emit correct debug info. */
1859 if (debug_info_level == DINFO_LEVEL_VERBOSE
8fc541d3
FXC
1860 && (wide_strncmp (line, "#define ", 8) == 0
1861 || wide_strncmp (line, "#undef ", 7) == 0))
9e8a6720
FXC
1862 ;
1863 else
1864 {
1865 preprocessor_line (line);
1866 continue;
1867 }
d4fa05b9 1868 }
6de9cd9a 1869
caef7872
FXC
1870 /* Preprocessed files have preprocessor lines added before the byte
1871 order mark, so first_line is not about the first line of the file
1872 but the first line that's not a preprocessor line. */
1873 first_line = false;
1874
d4fa05b9
TS
1875 if (include_line (line))
1876 {
1877 current_file->line++;
1878 continue;
6de9cd9a
DN
1879 }
1880
d4fa05b9
TS
1881 /* Add line. */
1882
ece3f663
KG
1883 b = (gfc_linebuf *) gfc_getmem (gfc_linebuf_header_size
1884 + (len + 1) * sizeof (gfc_char_t));
d4fa05b9 1885
c8cc8542 1886 b->location
5ffeb913 1887 = linemap_line_start (line_table, current_file->line++, 120);
d4fa05b9 1888 b->file = current_file;
ba1defa5 1889 b->truncated = trunc;
8fc541d3 1890 wide_strcpy (b->line, line);
d4fa05b9
TS
1891
1892 if (line_head == NULL)
1893 line_head = b;
1894 else
1895 line_tail->next = b;
1896
1897 line_tail = b;
1b271c9b
JJ
1898
1899 while (file_changes_cur < file_changes_count)
1900 file_changes[file_changes_cur++].lb = b;
6de9cd9a 1901 }
d4fa05b9 1902
f56c5d5d
TS
1903 /* Release the line buffer allocated in load_line. */
1904 gfc_free (line);
1905
d4fa05b9
TS
1906 fclose (input);
1907
1b271c9b
JJ
1908 if (!initial)
1909 add_file_change (NULL, current_file->inclusion_line + 1);
d4fa05b9 1910 current_file = current_file->up;
5ffeb913 1911 linemap_add (line_table, LC_LEAVE, 0, NULL, 0);
d4fa05b9 1912 return SUCCESS;
6de9cd9a
DN
1913}
1914
1915
d4fa05b9
TS
1916/* Open a new file and start scanning from that file. Returns SUCCESS
1917 if everything went OK, FAILURE otherwise. If form == FORM_UKNOWN
1918 it tries to determine the source form from the filename, defaulting
1919 to free form. */
6de9cd9a
DN
1920
1921try
e0bcf78c 1922gfc_new_file (void)
6de9cd9a 1923{
d4fa05b9 1924 try result;
6de9cd9a 1925
670637ee
DF
1926 if (gfc_cpp_enabled ())
1927 {
1928 result = gfc_cpp_preprocess (gfc_source_file);
1929 if (!gfc_cpp_preprocess_only ())
1930 result = load_file (gfc_cpp_temporary_file (), true);
1931 }
1932 else
1933 result = load_file (gfc_source_file, true);
6de9cd9a 1934
63645982
TS
1935 gfc_current_locus.lb = line_head;
1936 gfc_current_locus.nextc = (line_head == NULL) ? NULL : line_head->line;
6de9cd9a 1937
d4fa05b9
TS
1938#if 0 /* Debugging aid. */
1939 for (; line_head; line_head = line_head->next)
6c1abb5c
FXC
1940 printf ("%s:%3d %s\n", LOCATION_FILE (line_head->location),
1941 LOCATION_LINE (line_head->location), line_head->line);
6de9cd9a 1942
d4fa05b9
TS
1943 exit (0);
1944#endif
6de9cd9a 1945
d4fa05b9 1946 return result;
6de9cd9a 1947}
2d7c7df6
JJ
1948
1949static char *
1950unescape_filename (const char *ptr)
1951{
1952 const char *p = ptr, *s;
1953 char *d, *ret;
1954 int escaped, unescape = 0;
1955
1956 /* Make filename end at quote. */
1957 escaped = false;
1958 while (*p && ! (! escaped && *p == '"'))
1959 {
1960 if (escaped)
1961 escaped = false;
1962 else if (*p == '\\')
1963 {
1964 escaped = true;
1965 unescape++;
1966 }
1967 ++p;
1968 }
1969
edf1eac2 1970 if (!*p || p[1])
2d7c7df6
JJ
1971 return NULL;
1972
1973 /* Undo effects of cpp_quote_string. */
1974 s = ptr;
ece3f663 1975 d = XCNEWVEC (char, p + 1 - ptr - unescape);
2d7c7df6
JJ
1976 ret = d;
1977
1978 while (s != p)
1979 {
1980 if (*s == '\\')
1981 *d++ = *++s;
1982 else
1983 *d++ = *s;
1984 s++;
1985 }
1986 *d = '\0';
1987 return ret;
1988}
1989
1990/* For preprocessed files, if the first tokens are of the form # NUM.
1991 handle the directives so we know the original file name. */
1992
1993const char *
1994gfc_read_orig_filename (const char *filename, const char **canon_source_file)
1995{
1996 int c, len;
8fc541d3 1997 char *dirname, *tmp;
2d7c7df6
JJ
1998
1999 gfc_src_file = gfc_open_file (filename);
2000 if (gfc_src_file == NULL)
2001 return NULL;
2002
c4da1827 2003 c = getc (gfc_src_file);
2d7c7df6
JJ
2004
2005 if (c != '#')
2006 return NULL;
2007
2008 len = 0;
f2f5443c 2009 load_line (gfc_src_file, &gfc_src_preprocessor_lines[0], &len, &c);
2d7c7df6 2010
8fc541d3 2011 if (wide_strncmp (gfc_src_preprocessor_lines[0], "# 1 \"", 5) != 0)
2d7c7df6
JJ
2012 return NULL;
2013
00660189 2014 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[0][5], -1);
8fc541d3
FXC
2015 filename = unescape_filename (tmp);
2016 gfc_free (tmp);
2d7c7df6
JJ
2017 if (filename == NULL)
2018 return NULL;
2019
c4da1827 2020 c = getc (gfc_src_file);
2d7c7df6
JJ
2021
2022 if (c != '#')
2023 return filename;
2024
2025 len = 0;
f2f5443c 2026 load_line (gfc_src_file, &gfc_src_preprocessor_lines[1], &len, &c);
2d7c7df6 2027
8fc541d3 2028 if (wide_strncmp (gfc_src_preprocessor_lines[1], "# 1 \"", 5) != 0)
2d7c7df6
JJ
2029 return filename;
2030
00660189 2031 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[1][5], -1);
8fc541d3
FXC
2032 dirname = unescape_filename (tmp);
2033 gfc_free (tmp);
2d7c7df6
JJ
2034 if (dirname == NULL)
2035 return filename;
2036
2037 len = strlen (dirname);
2038 if (len < 3 || dirname[len - 1] != '/' || dirname[len - 2] != '/')
2039 {
2040 gfc_free (dirname);
2041 return filename;
2042 }
2043 dirname[len - 2] = '\0';
2044 set_src_pwd (dirname);
2045
2046 if (! IS_ABSOLUTE_PATH (filename))
2047 {
ece3f663 2048 char *p = XCNEWVEC (char, len + strlen (filename));
2d7c7df6
JJ
2049
2050 memcpy (p, dirname, len - 2);
2051 p[len - 2] = '/';
2052 strcpy (p + len - 1, filename);
2053 *canon_source_file = p;
2054 }
2055
2056 gfc_free (dirname);
2057 return filename;
2058}