2008-01-06 Jerry DeLisle <jvdelisle@gcc.gnu.org>
[official-gcc.git] / gcc / fortran / scanner.c
blobda4c37b155e799300315df4e791f13492ca0a6a4
1 /* Character scanner.
2 Copyright (C) 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007
3 Free Software Foundation, Inc.
4 Contributed by Andy Vaught
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* Set of subroutines to (ultimately) return the next character to the
23 various matching subroutines. This file's job is to read files and
24 build up lines that are parsed by the parser. This means that we
25 handle continuation lines and "include" lines.
27 The first thing the scanner does is to load an entire file into
28 memory. We load the entire file into memory for a couple reasons.
29 The first is that we want to be able to deal with nonseekable input
30 (pipes, stdin) and there is a lot of backing up involved during
31 parsing.
33 The second is that we want to be able to print the locus of errors,
34 and an error on line 999999 could conflict with something on line
35 one. Given nonseekable input, we've got to store the whole thing.
37 One thing that helps are the column truncation limits that give us
38 an upper bound on the size of individual lines. We don't store the
39 truncated stuff.
41 From the scanner's viewpoint, the higher level subroutines ask for
42 new characters and do a lot of jumping backwards. */
44 #include "config.h"
45 #include "system.h"
46 #include "gfortran.h"
47 #include "toplev.h"
48 #include "debug.h"
49 #include "flags.h"
51 /* Structure for holding module and include file search path. */
52 typedef struct gfc_directorylist
54 char *path;
55 bool use_for_modules;
56 struct gfc_directorylist *next;
58 gfc_directorylist;
60 /* List of include file search directories. */
61 static gfc_directorylist *include_dirs, *intrinsic_modules_dirs;
63 static gfc_file *file_head, *current_file;
65 static int continue_flag, end_flag, openmp_flag;
66 static int continue_count, continue_line;
67 static locus openmp_locus;
69 gfc_source_form gfc_current_form;
70 static gfc_linebuf *line_head, *line_tail;
72 locus gfc_current_locus;
73 const char *gfc_source_file;
74 static FILE *gfc_src_file;
75 static char *gfc_src_preprocessor_lines[2];
77 extern int pedantic;
79 static struct gfc_file_change
81 const char *filename;
82 gfc_linebuf *lb;
83 int line;
84 } *file_changes;
85 size_t file_changes_cur, file_changes_count;
86 size_t file_changes_allocated;
88 /* Main scanner initialization. */
90 void
91 gfc_scanner_init_1 (void)
93 file_head = NULL;
94 line_head = NULL;
95 line_tail = NULL;
97 continue_count = 0;
98 continue_line = 0;
100 end_flag = 0;
104 /* Main scanner destructor. */
106 void
107 gfc_scanner_done_1 (void)
109 gfc_linebuf *lb;
110 gfc_file *f;
112 while(line_head != NULL)
114 lb = line_head->next;
115 gfc_free(line_head);
116 line_head = lb;
119 while(file_head != NULL)
121 f = file_head->next;
122 gfc_free(file_head->filename);
123 gfc_free(file_head);
124 file_head = f;
129 /* Adds path to the list pointed to by list. */
131 static void
132 add_path_to_list (gfc_directorylist **list, const char *path,
133 bool use_for_modules)
135 gfc_directorylist *dir;
136 const char *p;
138 p = path;
139 while (*p == ' ' || *p == '\t') /* someone might do "-I include" */
140 if (*p++ == '\0')
141 return;
143 dir = *list;
144 if (!dir)
145 dir = *list = gfc_getmem (sizeof (gfc_directorylist));
146 else
148 while (dir->next)
149 dir = dir->next;
151 dir->next = gfc_getmem (sizeof (gfc_directorylist));
152 dir = dir->next;
155 dir->next = NULL;
156 dir->use_for_modules = use_for_modules;
157 dir->path = gfc_getmem (strlen (p) + 2);
158 strcpy (dir->path, p);
159 strcat (dir->path, "/"); /* make '/' last character */
163 void
164 gfc_add_include_path (const char *path, bool use_for_modules)
166 add_path_to_list (&include_dirs, path, use_for_modules);
170 void
171 gfc_add_intrinsic_modules_path (const char *path)
173 add_path_to_list (&intrinsic_modules_dirs, path, true);
177 /* Release resources allocated for options. */
179 void
180 gfc_release_include_path (void)
182 gfc_directorylist *p;
184 while (include_dirs != NULL)
186 p = include_dirs;
187 include_dirs = include_dirs->next;
188 gfc_free (p->path);
189 gfc_free (p);
192 while (intrinsic_modules_dirs != NULL)
194 p = intrinsic_modules_dirs;
195 intrinsic_modules_dirs = intrinsic_modules_dirs->next;
196 gfc_free (p->path);
197 gfc_free (p);
200 gfc_free (gfc_option.module_dir);
204 static FILE *
205 open_included_file (const char *name, gfc_directorylist *list, bool module)
207 char *fullname;
208 gfc_directorylist *p;
209 FILE *f;
211 for (p = list; p; p = p->next)
213 if (module && !p->use_for_modules)
214 continue;
216 fullname = (char *) alloca(strlen (p->path) + strlen (name) + 1);
217 strcpy (fullname, p->path);
218 strcat (fullname, name);
220 f = gfc_open_file (fullname);
221 if (f != NULL)
222 return f;
225 return NULL;
229 /* Opens file for reading, searching through the include directories
230 given if necessary. If the include_cwd argument is true, we try
231 to open the file in the current directory first. */
233 FILE *
234 gfc_open_included_file (const char *name, bool include_cwd, bool module)
236 FILE *f;
238 if (IS_ABSOLUTE_PATH (name))
239 return gfc_open_file (name);
241 if (include_cwd)
243 f = gfc_open_file (name);
244 if (f != NULL)
245 return f;
248 return open_included_file (name, include_dirs, module);
251 FILE *
252 gfc_open_intrinsic_module (const char *name)
254 if (IS_ABSOLUTE_PATH (name))
255 return gfc_open_file (name);
257 return open_included_file (name, intrinsic_modules_dirs, true);
261 /* Test to see if we're at the end of the main source file. */
264 gfc_at_end (void)
266 return end_flag;
270 /* Test to see if we're at the end of the current file. */
273 gfc_at_eof (void)
275 if (gfc_at_end ())
276 return 1;
278 if (line_head == NULL)
279 return 1; /* Null file */
281 if (gfc_current_locus.lb == NULL)
282 return 1;
284 return 0;
288 /* Test to see if we're at the beginning of a new line. */
291 gfc_at_bol (void)
293 if (gfc_at_eof ())
294 return 1;
296 return (gfc_current_locus.nextc == gfc_current_locus.lb->line);
300 /* Test to see if we're at the end of a line. */
303 gfc_at_eol (void)
305 if (gfc_at_eof ())
306 return 1;
308 return (*gfc_current_locus.nextc == '\0');
311 static void
312 add_file_change (const char *filename, int line)
314 if (file_changes_count == file_changes_allocated)
316 if (file_changes_allocated)
317 file_changes_allocated *= 2;
318 else
319 file_changes_allocated = 16;
320 file_changes
321 = xrealloc (file_changes,
322 file_changes_allocated * sizeof (*file_changes));
324 file_changes[file_changes_count].filename = filename;
325 file_changes[file_changes_count].lb = NULL;
326 file_changes[file_changes_count++].line = line;
329 static void
330 report_file_change (gfc_linebuf *lb)
332 size_t c = file_changes_cur;
333 while (c < file_changes_count
334 && file_changes[c].lb == lb)
336 if (file_changes[c].filename)
337 (*debug_hooks->start_source_file) (file_changes[c].line,
338 file_changes[c].filename);
339 else
340 (*debug_hooks->end_source_file) (file_changes[c].line);
341 ++c;
343 file_changes_cur = c;
346 void
347 gfc_start_source_files (void)
349 /* If the debugger wants the name of the main source file,
350 we give it. */
351 if (debug_hooks->start_end_main_source_file)
352 (*debug_hooks->start_source_file) (0, gfc_source_file);
354 file_changes_cur = 0;
355 report_file_change (gfc_current_locus.lb);
358 void
359 gfc_end_source_files (void)
361 report_file_change (NULL);
363 if (debug_hooks->start_end_main_source_file)
364 (*debug_hooks->end_source_file) (0);
367 /* Advance the current line pointer to the next line. */
369 void
370 gfc_advance_line (void)
372 if (gfc_at_end ())
373 return;
375 if (gfc_current_locus.lb == NULL)
377 end_flag = 1;
378 return;
381 if (gfc_current_locus.lb->next
382 && !gfc_current_locus.lb->next->dbg_emitted)
384 report_file_change (gfc_current_locus.lb->next);
385 gfc_current_locus.lb->next->dbg_emitted = true;
388 gfc_current_locus.lb = gfc_current_locus.lb->next;
390 if (gfc_current_locus.lb != NULL)
391 gfc_current_locus.nextc = gfc_current_locus.lb->line;
392 else
394 gfc_current_locus.nextc = NULL;
395 end_flag = 1;
400 /* Get the next character from the input, advancing gfc_current_file's
401 locus. When we hit the end of the line or the end of the file, we
402 start returning a '\n' in order to complete the current statement.
403 No Fortran line conventions are implemented here.
405 Requiring explicit advances to the next line prevents the parse
406 pointer from being on the wrong line if the current statement ends
407 prematurely. */
409 static int
410 next_char (void)
412 int c;
414 if (gfc_current_locus.nextc == NULL)
415 return '\n';
417 c = (unsigned char) *gfc_current_locus.nextc++;
418 if (c == '\0')
420 gfc_current_locus.nextc--; /* Remain on this line. */
421 c = '\n';
424 return c;
428 /* Skip a comment. When we come here the parse pointer is positioned
429 immediately after the comment character. If we ever implement
430 compiler directives withing comments, here is where we parse the
431 directive. */
433 static void
434 skip_comment_line (void)
436 char c;
440 c = next_char ();
442 while (c != '\n');
444 gfc_advance_line ();
449 gfc_define_undef_line (void)
451 /* All lines beginning with '#' are either #define or #undef. */
452 if (debug_info_level != DINFO_LEVEL_VERBOSE || gfc_peek_char () != '#')
453 return 0;
455 if (strncmp (gfc_current_locus.nextc, "#define ", 8) == 0)
456 (*debug_hooks->define) (gfc_linebuf_linenum (gfc_current_locus.lb),
457 &(gfc_current_locus.nextc[8]));
459 if (strncmp (gfc_current_locus.nextc, "#undef ", 7) == 0)
460 (*debug_hooks->undef) (gfc_linebuf_linenum (gfc_current_locus.lb),
461 &(gfc_current_locus.nextc[7]));
463 /* Skip the rest of the line. */
464 skip_comment_line ();
466 return 1;
470 /* Comment lines are null lines, lines containing only blanks or lines
471 on which the first nonblank line is a '!'.
472 Return true if !$ openmp conditional compilation sentinel was
473 seen. */
475 static bool
476 skip_free_comments (void)
478 locus start;
479 char c;
480 int at_bol;
482 for (;;)
484 at_bol = gfc_at_bol ();
485 start = gfc_current_locus;
486 if (gfc_at_eof ())
487 break;
490 c = next_char ();
491 while (gfc_is_whitespace (c));
493 if (c == '\n')
495 gfc_advance_line ();
496 continue;
499 if (c == '!')
501 /* If -fopenmp, we need to handle here 2 things:
502 1) don't treat !$omp as comments, but directives
503 2) handle OpenMP conditional compilation, where
504 !$ should be treated as 2 spaces (for initial lines
505 only if followed by space). */
506 if (gfc_option.flag_openmp && at_bol)
508 locus old_loc = gfc_current_locus;
509 if (next_char () == '$')
511 c = next_char ();
512 if (c == 'o' || c == 'O')
514 if (((c = next_char ()) == 'm' || c == 'M')
515 && ((c = next_char ()) == 'p' || c == 'P'))
517 if ((c = next_char ()) == ' ' || continue_flag)
519 while (gfc_is_whitespace (c))
520 c = next_char ();
521 if (c != '\n' && c != '!')
523 openmp_flag = 1;
524 openmp_locus = old_loc;
525 gfc_current_locus = start;
526 return false;
529 else
530 gfc_warning_now ("!$OMP at %C starts a commented "
531 "line as it neither is followed "
532 "by a space nor is a "
533 "continuation line");
535 gfc_current_locus = old_loc;
536 next_char ();
537 c = next_char ();
539 if (continue_flag || c == ' ')
541 gfc_current_locus = old_loc;
542 next_char ();
543 openmp_flag = 0;
544 return true;
547 gfc_current_locus = old_loc;
549 skip_comment_line ();
550 continue;
553 break;
556 if (openmp_flag && at_bol)
557 openmp_flag = 0;
558 gfc_current_locus = start;
559 return false;
563 /* Skip comment lines in fixed source mode. We have the same rules as
564 in skip_free_comment(), except that we can have a 'c', 'C' or '*'
565 in column 1, and a '!' cannot be in column 6. Also, we deal with
566 lines with 'd' or 'D' in column 1, if the user requested this. */
568 static void
569 skip_fixed_comments (void)
571 locus start;
572 int col;
573 char c;
575 if (! gfc_at_bol ())
577 start = gfc_current_locus;
578 if (! gfc_at_eof ())
581 c = next_char ();
582 while (gfc_is_whitespace (c));
584 if (c == '\n')
585 gfc_advance_line ();
586 else if (c == '!')
587 skip_comment_line ();
590 if (! gfc_at_bol ())
592 gfc_current_locus = start;
593 return;
597 for (;;)
599 start = gfc_current_locus;
600 if (gfc_at_eof ())
601 break;
603 c = next_char ();
604 if (c == '\n')
606 gfc_advance_line ();
607 continue;
610 if (c == '!' || c == 'c' || c == 'C' || c == '*')
612 /* If -fopenmp, we need to handle here 2 things:
613 1) don't treat !$omp|c$omp|*$omp as comments, but directives
614 2) handle OpenMP conditional compilation, where
615 !$|c$|*$ should be treated as 2 spaces if the characters
616 in columns 3 to 6 are valid fixed form label columns
617 characters. */
618 if (gfc_option.flag_openmp)
620 if (next_char () == '$')
622 c = next_char ();
623 if (c == 'o' || c == 'O')
625 if (((c = next_char ()) == 'm' || c == 'M')
626 && ((c = next_char ()) == 'p' || c == 'P'))
628 c = next_char ();
629 if (c != '\n'
630 && ((openmp_flag && continue_flag)
631 || c == ' ' || c == '0'))
633 c = next_char ();
634 while (gfc_is_whitespace (c))
635 c = next_char ();
636 if (c != '\n' && c != '!')
638 /* Canonicalize to *$omp. */
639 *start.nextc = '*';
640 openmp_flag = 1;
641 gfc_current_locus = start;
642 return;
647 else
649 int digit_seen = 0;
651 for (col = 3; col < 6; col++, c = next_char ())
652 if (c == ' ')
653 continue;
654 else if (c < '0' || c > '9')
655 break;
656 else
657 digit_seen = 1;
659 if (col == 6 && c != '\n'
660 && ((continue_flag && !digit_seen)
661 || c == ' ' || c == '0'))
663 gfc_current_locus = start;
664 start.nextc[0] = ' ';
665 start.nextc[1] = ' ';
666 continue;
670 gfc_current_locus = start;
672 skip_comment_line ();
673 continue;
676 if (gfc_option.flag_d_lines != -1 && (c == 'd' || c == 'D'))
678 if (gfc_option.flag_d_lines == 0)
680 skip_comment_line ();
681 continue;
683 else
684 *start.nextc = c = ' ';
687 col = 1;
689 while (gfc_is_whitespace (c))
691 c = next_char ();
692 col++;
695 if (c == '\n')
697 gfc_advance_line ();
698 continue;
701 if (col != 6 && c == '!')
703 skip_comment_line ();
704 continue;
707 break;
710 openmp_flag = 0;
711 gfc_current_locus = start;
715 /* Skips the current line if it is a comment. */
717 void
718 gfc_skip_comments (void)
720 if (gfc_current_form == FORM_FREE)
721 skip_free_comments ();
722 else
723 skip_fixed_comments ();
727 /* Get the next character from the input, taking continuation lines
728 and end-of-line comments into account. This implies that comment
729 lines between continued lines must be eaten here. For higher-level
730 subroutines, this flattens continued lines into a single logical
731 line. The in_string flag denotes whether we're inside a character
732 context or not. */
735 gfc_next_char_literal (int in_string)
737 locus old_loc;
738 int i, c, prev_openmp_flag;
740 continue_flag = 0;
742 restart:
743 c = next_char ();
744 if (gfc_at_end ())
746 continue_count = 0;
747 return c;
750 if (gfc_current_form == FORM_FREE)
752 bool openmp_cond_flag;
754 if (!in_string && c == '!')
756 if (openmp_flag
757 && memcmp (&gfc_current_locus, &openmp_locus,
758 sizeof (gfc_current_locus)) == 0)
759 goto done;
761 /* This line can't be continued */
764 c = next_char ();
766 while (c != '\n');
768 /* Avoid truncation warnings for comment ending lines. */
769 gfc_current_locus.lb->truncated = 0;
771 goto done;
774 if (c != '&')
775 goto done;
777 /* If the next nonblank character is a ! or \n, we've got a
778 continuation line. */
779 old_loc = gfc_current_locus;
781 c = next_char ();
782 while (gfc_is_whitespace (c))
783 c = next_char ();
785 /* Character constants to be continued cannot have commentary
786 after the '&'. */
788 if (in_string && c != '\n')
790 gfc_current_locus = old_loc;
791 c = '&';
792 goto done;
795 if (c != '!' && c != '\n')
797 gfc_current_locus = old_loc;
798 c = '&';
799 goto done;
802 prev_openmp_flag = openmp_flag;
803 continue_flag = 1;
804 if (c == '!')
805 skip_comment_line ();
806 else
807 gfc_advance_line ();
809 if (gfc_at_eof())
810 goto not_continuation;
812 /* We've got a continuation line. If we are on the very next line after
813 the last continuation, increment the continuation line count and
814 check whether the limit has been exceeded. */
815 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
817 if (++continue_count == gfc_option.max_continue_free)
819 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
820 gfc_warning ("Limit of %d continuations exceeded in "
821 "statement at %C", gfc_option.max_continue_free);
824 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
826 /* Now find where it continues. First eat any comment lines. */
827 openmp_cond_flag = skip_free_comments ();
829 if (prev_openmp_flag != openmp_flag)
831 gfc_current_locus = old_loc;
832 openmp_flag = prev_openmp_flag;
833 c = '&';
834 goto done;
837 /* Now that we have a non-comment line, probe ahead for the
838 first non-whitespace character. If it is another '&', then
839 reading starts at the next character, otherwise we must back
840 up to where the whitespace started and resume from there. */
842 old_loc = gfc_current_locus;
844 c = next_char ();
845 while (gfc_is_whitespace (c))
846 c = next_char ();
848 if (openmp_flag)
850 for (i = 0; i < 5; i++, c = next_char ())
852 gcc_assert (TOLOWER (c) == "!$omp"[i]);
853 if (i == 4)
854 old_loc = gfc_current_locus;
856 while (gfc_is_whitespace (c))
857 c = next_char ();
860 if (c != '&')
862 if (in_string)
864 if (gfc_option.warn_ampersand)
865 gfc_warning_now ("Missing '&' in continued character "
866 "constant at %C");
867 gfc_current_locus.nextc--;
869 /* Both !$omp and !$ -fopenmp continuation lines have & on the
870 continuation line only optionally. */
871 else if (openmp_flag || openmp_cond_flag)
872 gfc_current_locus.nextc--;
873 else
875 c = ' ';
876 gfc_current_locus = old_loc;
877 goto done;
881 else
883 /* Fixed form continuation. */
884 if (!in_string && c == '!')
886 /* Skip comment at end of line. */
889 c = next_char ();
891 while (c != '\n');
893 /* Avoid truncation warnings for comment ending lines. */
894 gfc_current_locus.lb->truncated = 0;
897 if (c != '\n')
898 goto done;
900 prev_openmp_flag = openmp_flag;
901 continue_flag = 1;
902 old_loc = gfc_current_locus;
904 gfc_advance_line ();
905 skip_fixed_comments ();
907 /* See if this line is a continuation line. */
908 if (openmp_flag != prev_openmp_flag)
910 openmp_flag = prev_openmp_flag;
911 goto not_continuation;
914 if (!openmp_flag)
915 for (i = 0; i < 5; i++)
917 c = next_char ();
918 if (c != ' ')
919 goto not_continuation;
921 else
922 for (i = 0; i < 5; i++)
924 c = next_char ();
925 if (TOLOWER (c) != "*$omp"[i])
926 goto not_continuation;
929 c = next_char ();
930 if (c == '0' || c == ' ' || c == '\n')
931 goto not_continuation;
933 /* We've got a continuation line. If we are on the very next line after
934 the last continuation, increment the continuation line count and
935 check whether the limit has been exceeded. */
936 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
938 if (++continue_count == gfc_option.max_continue_fixed)
940 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
941 gfc_warning ("Limit of %d continuations exceeded in "
942 "statement at %C",
943 gfc_option.max_continue_fixed);
947 if (continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
948 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
951 /* Ready to read first character of continuation line, which might
952 be another continuation line! */
953 goto restart;
955 not_continuation:
956 c = '\n';
957 gfc_current_locus = old_loc;
959 done:
960 if (c == '\n')
961 continue_count = 0;
962 continue_flag = 0;
963 return c;
967 /* Get the next character of input, folded to lowercase. In fixed
968 form mode, we also ignore spaces. When matcher subroutines are
969 parsing character literals, they have to call
970 gfc_next_char_literal(). */
973 gfc_next_char (void)
975 int c;
979 c = gfc_next_char_literal (0);
981 while (gfc_current_form == FORM_FIXED && gfc_is_whitespace (c));
983 return TOLOWER (c);
988 gfc_peek_char (void)
990 locus old_loc;
991 int c;
993 old_loc = gfc_current_locus;
994 c = gfc_next_char ();
995 gfc_current_locus = old_loc;
997 return c;
1001 /* Recover from an error. We try to get past the current statement
1002 and get lined up for the next. The next statement follows a '\n'
1003 or a ';'. We also assume that we are not within a character
1004 constant, and deal with finding a '\'' or '"'. */
1006 void
1007 gfc_error_recovery (void)
1009 char c, delim;
1011 if (gfc_at_eof ())
1012 return;
1014 for (;;)
1016 c = gfc_next_char ();
1017 if (c == '\n' || c == ';')
1018 break;
1020 if (c != '\'' && c != '"')
1022 if (gfc_at_eof ())
1023 break;
1024 continue;
1026 delim = c;
1028 for (;;)
1030 c = next_char ();
1032 if (c == delim)
1033 break;
1034 if (c == '\n')
1035 return;
1036 if (c == '\\')
1038 c = next_char ();
1039 if (c == '\n')
1040 return;
1043 if (gfc_at_eof ())
1044 break;
1049 /* Read ahead until the next character to be read is not whitespace. */
1051 void
1052 gfc_gobble_whitespace (void)
1054 static int linenum = 0;
1055 locus old_loc;
1056 int c;
1060 old_loc = gfc_current_locus;
1061 c = gfc_next_char_literal (0);
1062 /* Issue a warning for nonconforming tabs. We keep track of the line
1063 number because the Fortran matchers will often back up and the same
1064 line will be scanned multiple times. */
1065 if (!gfc_option.warn_tabs && c == '\t')
1067 #ifdef USE_MAPPED_LOCATION
1068 int cur_linenum = LOCATION_LINE (gfc_current_locus.lb->location);
1069 #else
1070 int cur_linenum = gfc_current_locus.lb->linenum;
1071 #endif
1072 if (cur_linenum != linenum)
1074 linenum = cur_linenum;
1075 gfc_warning_now ("Nonconforming tab character at %C");
1079 while (gfc_is_whitespace (c));
1081 gfc_current_locus = old_loc;
1085 /* Load a single line into pbuf.
1087 If pbuf points to a NULL pointer, it is allocated.
1088 We truncate lines that are too long, unless we're dealing with
1089 preprocessor lines or if the option -ffixed-line-length-none is set,
1090 in which case we reallocate the buffer to fit the entire line, if
1091 need be.
1092 In fixed mode, we expand a tab that occurs within the statement
1093 label region to expand to spaces that leave the next character in
1094 the source region.
1095 load_line returns whether the line was truncated.
1097 NOTE: The error machinery isn't available at this point, so we can't
1098 easily report line and column numbers consistent with other
1099 parts of gfortran. */
1101 static int
1102 load_line (FILE *input, char **pbuf, int *pbuflen)
1104 static int linenum = 0, current_line = 1;
1105 int c, maxlen, i, preprocessor_flag, buflen = *pbuflen;
1106 int trunc_flag = 0, seen_comment = 0;
1107 int seen_printable = 0, seen_ampersand = 0;
1108 char *buffer;
1110 /* Determine the maximum allowed line length. */
1111 if (gfc_current_form == FORM_FREE)
1112 maxlen = gfc_option.free_line_length;
1113 else if (gfc_current_form == FORM_FIXED)
1114 maxlen = gfc_option.fixed_line_length;
1115 else
1116 maxlen = 72;
1118 if (*pbuf == NULL)
1120 /* Allocate the line buffer, storing its length into buflen.
1121 Note that if maxlen==0, indicating that arbitrary-length lines
1122 are allowed, the buffer will be reallocated if this length is
1123 insufficient; since 132 characters is the length of a standard
1124 free-form line, we use that as a starting guess. */
1125 if (maxlen > 0)
1126 buflen = maxlen;
1127 else
1128 buflen = 132;
1130 *pbuf = gfc_getmem (buflen + 1);
1133 i = 0;
1134 buffer = *pbuf;
1136 preprocessor_flag = 0;
1137 c = getc (input);
1138 if (c == '#')
1139 /* In order to not truncate preprocessor lines, we have to
1140 remember that this is one. */
1141 preprocessor_flag = 1;
1142 ungetc (c, input);
1144 for (;;)
1146 c = getc (input);
1148 if (c == EOF)
1149 break;
1150 if (c == '\n')
1152 /* Check for illegal use of ampersand. See F95 Standard 3.3.1.3. */
1153 if (gfc_current_form == FORM_FREE
1154 && !seen_printable && seen_ampersand)
1156 if (pedantic)
1157 gfc_error_now ("'&' not allowed by itself in line %d",
1158 current_line);
1159 else
1160 gfc_warning_now ("'&' not allowed by itself in line %d",
1161 current_line);
1163 break;
1166 if (c == '\r')
1167 continue; /* Gobble characters. */
1168 if (c == '\0')
1169 continue;
1171 if (c == '&')
1173 if (seen_ampersand)
1174 seen_ampersand = 0;
1175 else
1176 seen_ampersand = 1;
1179 if ((c != '&' && c != '!' && c != ' ') || (c == '!' && !seen_ampersand))
1180 seen_printable = 1;
1182 /* Is this a fixed-form comment? */
1183 if (gfc_current_form == FORM_FIXED && i == 0
1184 && (c == '*' || c == 'c' || c == 'd'))
1185 seen_comment = 1;
1187 if (gfc_current_form == FORM_FIXED && c == '\t' && i <= 6)
1189 if (!gfc_option.warn_tabs && seen_comment == 0
1190 && current_line != linenum)
1192 linenum = current_line;
1193 gfc_warning_now ("Nonconforming tab character in column 1 "
1194 "of line %d", linenum);
1197 while (i <= 6)
1199 *buffer++ = ' ';
1200 i++;
1203 continue;
1206 *buffer++ = c;
1207 i++;
1209 if (maxlen == 0 || preprocessor_flag)
1211 if (i >= buflen)
1213 /* Reallocate line buffer to double size to hold the
1214 overlong line. */
1215 buflen = buflen * 2;
1216 *pbuf = xrealloc (*pbuf, buflen + 1);
1217 buffer = (*pbuf) + i;
1220 else if (i >= maxlen)
1222 /* Truncate the rest of the line. */
1223 for (;;)
1225 c = getc (input);
1226 if (c == '\n' || c == EOF)
1227 break;
1229 trunc_flag = 1;
1232 ungetc ('\n', input);
1236 /* Pad lines to the selected line length in fixed form. */
1237 if (gfc_current_form == FORM_FIXED
1238 && gfc_option.fixed_line_length != 0
1239 && !preprocessor_flag
1240 && c != EOF)
1242 while (i++ < maxlen)
1243 *buffer++ = ' ';
1246 *buffer = '\0';
1247 *pbuflen = buflen;
1248 current_line++;
1250 return trunc_flag;
1254 /* Get a gfc_file structure, initialize it and add it to
1255 the file stack. */
1257 static gfc_file *
1258 get_file (const char *name, enum lc_reason reason ATTRIBUTE_UNUSED)
1260 gfc_file *f;
1262 f = gfc_getmem (sizeof (gfc_file));
1264 f->filename = gfc_getmem (strlen (name) + 1);
1265 strcpy (f->filename, name);
1267 f->next = file_head;
1268 file_head = f;
1270 f->up = current_file;
1271 if (current_file != NULL)
1272 f->inclusion_line = current_file->line;
1274 #ifdef USE_MAPPED_LOCATION
1275 linemap_add (line_table, reason, false, f->filename, 1);
1276 #endif
1278 return f;
1281 /* Deal with a line from the C preprocessor. The
1282 initial octothorp has already been seen. */
1284 static void
1285 preprocessor_line (char *c)
1287 bool flag[5];
1288 int i, line;
1289 char *filename;
1290 gfc_file *f;
1291 int escaped, unescape;
1293 c++;
1294 while (*c == ' ' || *c == '\t')
1295 c++;
1297 if (*c < '0' || *c > '9')
1298 goto bad_cpp_line;
1300 line = atoi (c);
1302 c = strchr (c, ' ');
1303 if (c == NULL)
1305 /* No file name given. Set new line number. */
1306 current_file->line = line;
1307 return;
1310 /* Skip spaces. */
1311 while (*c == ' ' || *c == '\t')
1312 c++;
1314 /* Skip quote. */
1315 if (*c != '"')
1316 goto bad_cpp_line;
1317 ++c;
1319 filename = c;
1321 /* Make filename end at quote. */
1322 unescape = 0;
1323 escaped = false;
1324 while (*c && ! (!escaped && *c == '"'))
1326 if (escaped)
1327 escaped = false;
1328 else if (*c == '\\')
1330 escaped = true;
1331 unescape++;
1333 ++c;
1336 if (! *c)
1337 /* Preprocessor line has no closing quote. */
1338 goto bad_cpp_line;
1340 *c++ = '\0';
1342 /* Undo effects of cpp_quote_string. */
1343 if (unescape)
1345 char *s = filename;
1346 char *d = gfc_getmem (c - filename - unescape);
1348 filename = d;
1349 while (*s)
1351 if (*s == '\\')
1352 *d++ = *++s;
1353 else
1354 *d++ = *s;
1355 s++;
1357 *d = '\0';
1360 /* Get flags. */
1362 flag[1] = flag[2] = flag[3] = flag[4] = false;
1364 for (;;)
1366 c = strchr (c, ' ');
1367 if (c == NULL)
1368 break;
1370 c++;
1371 i = atoi (c);
1373 if (1 <= i && i <= 4)
1374 flag[i] = true;
1377 /* Interpret flags. */
1379 if (flag[1]) /* Starting new file. */
1381 f = get_file (filename, LC_RENAME);
1382 add_file_change (f->filename, f->inclusion_line);
1383 current_file = f;
1386 if (flag[2]) /* Ending current file. */
1388 if (!current_file->up
1389 || strcmp (current_file->up->filename, filename) != 0)
1391 gfc_warning_now ("%s:%d: file %s left but not entered",
1392 current_file->filename, current_file->line,
1393 filename);
1394 if (unescape)
1395 gfc_free (filename);
1396 return;
1399 add_file_change (NULL, line);
1400 current_file = current_file->up;
1401 #ifdef USE_MAPPED_LOCATION
1402 linemap_add (line_table, LC_RENAME, false, current_file->filename,
1403 current_file->line);
1404 #endif
1407 /* The name of the file can be a temporary file produced by
1408 cpp. Replace the name if it is different. */
1410 if (strcmp (current_file->filename, filename) != 0)
1412 gfc_free (current_file->filename);
1413 current_file->filename = gfc_getmem (strlen (filename) + 1);
1414 strcpy (current_file->filename, filename);
1417 /* Set new line number. */
1418 current_file->line = line;
1419 if (unescape)
1420 gfc_free (filename);
1421 return;
1423 bad_cpp_line:
1424 gfc_warning_now ("%s:%d: Illegal preprocessor directive",
1425 current_file->filename, current_file->line);
1426 current_file->line++;
1430 static try load_file (const char *, bool);
1432 /* include_line()-- Checks a line buffer to see if it is an include
1433 line. If so, we call load_file() recursively to load the included
1434 file. We never return a syntax error because a statement like
1435 "include = 5" is perfectly legal. We return false if no include was
1436 processed or true if we matched an include. */
1438 static bool
1439 include_line (char *line)
1441 char quote, *c, *begin, *stop;
1443 c = line;
1445 if (gfc_option.flag_openmp)
1447 if (gfc_current_form == FORM_FREE)
1449 while (*c == ' ' || *c == '\t')
1450 c++;
1451 if (*c == '!' && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1452 c += 3;
1454 else
1456 if ((*c == '!' || *c == 'c' || *c == 'C' || *c == '*')
1457 && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1458 c += 3;
1462 while (*c == ' ' || *c == '\t')
1463 c++;
1465 if (strncasecmp (c, "include", 7))
1466 return false;
1468 c += 7;
1469 while (*c == ' ' || *c == '\t')
1470 c++;
1472 /* Find filename between quotes. */
1474 quote = *c++;
1475 if (quote != '"' && quote != '\'')
1476 return false;
1478 begin = c;
1480 while (*c != quote && *c != '\0')
1481 c++;
1483 if (*c == '\0')
1484 return false;
1486 stop = c++;
1488 while (*c == ' ' || *c == '\t')
1489 c++;
1491 if (*c != '\0' && *c != '!')
1492 return false;
1494 /* We have an include line at this point. */
1496 *stop = '\0'; /* It's ok to trash the buffer, as this line won't be
1497 read by anything else. */
1499 load_file (begin, false);
1500 return true;
1504 /* Load a file into memory by calling load_line until the file ends. */
1506 static try
1507 load_file (const char *filename, bool initial)
1509 char *line;
1510 gfc_linebuf *b;
1511 gfc_file *f;
1512 FILE *input;
1513 int len, line_len;
1514 bool first_line;
1516 for (f = current_file; f; f = f->up)
1517 if (strcmp (filename, f->filename) == 0)
1519 gfc_error_now ("File '%s' is being included recursively", filename);
1520 return FAILURE;
1523 if (initial)
1525 if (gfc_src_file)
1527 input = gfc_src_file;
1528 gfc_src_file = NULL;
1530 else
1531 input = gfc_open_file (filename);
1532 if (input == NULL)
1534 gfc_error_now ("Can't open file '%s'", filename);
1535 return FAILURE;
1538 else
1540 input = gfc_open_included_file (filename, false, false);
1541 if (input == NULL)
1543 gfc_error_now ("Can't open included file '%s'", filename);
1544 return FAILURE;
1548 /* Load the file. */
1550 f = get_file (filename, initial ? LC_RENAME : LC_ENTER);
1551 if (!initial)
1552 add_file_change (f->filename, f->inclusion_line);
1553 current_file = f;
1554 current_file->line = 1;
1555 line = NULL;
1556 line_len = 0;
1557 first_line = true;
1559 if (initial && gfc_src_preprocessor_lines[0])
1561 preprocessor_line (gfc_src_preprocessor_lines[0]);
1562 gfc_free (gfc_src_preprocessor_lines[0]);
1563 gfc_src_preprocessor_lines[0] = NULL;
1564 if (gfc_src_preprocessor_lines[1])
1566 preprocessor_line (gfc_src_preprocessor_lines[1]);
1567 gfc_free (gfc_src_preprocessor_lines[1]);
1568 gfc_src_preprocessor_lines[1] = NULL;
1572 for (;;)
1574 int trunc = load_line (input, &line, &line_len);
1576 len = strlen (line);
1577 if (feof (input) && len == 0)
1578 break;
1580 /* If this is the first line of the file, it can contain a byte
1581 order mark (BOM), which we will ignore:
1582 FF FE is UTF-16 little endian,
1583 FE FF is UTF-16 big endian,
1584 EF BB BF is UTF-8. */
1585 if (first_line
1586 && ((line_len >= 2 && line[0] == '\xFF' && line[1] == '\xFE')
1587 || (line_len >= 2 && line[0] == '\xFE' && line[1] == '\xFF')
1588 || (line_len >= 3 && line[0] == '\xEF' && line[1] == '\xBB'
1589 && line[2] == '\xBF')))
1591 int n = line[1] == '\xBB' ? 3 : 2;
1592 char * new = gfc_getmem (line_len);
1594 strcpy (new, line + n);
1595 gfc_free (line);
1596 line = new;
1597 len -= n;
1600 /* There are three things this line can be: a line of Fortran
1601 source, an include line or a C preprocessor directive. */
1603 if (line[0] == '#')
1605 /* When -g3 is specified, it's possible that we emit #define
1606 and #undef lines, which we need to pass to the middle-end
1607 so that it can emit correct debug info. */
1608 if (debug_info_level == DINFO_LEVEL_VERBOSE
1609 && (strncmp (line, "#define ", 8) == 0
1610 || strncmp (line, "#undef ", 7) == 0))
1612 else
1614 preprocessor_line (line);
1615 continue;
1619 /* Preprocessed files have preprocessor lines added before the byte
1620 order mark, so first_line is not about the first line of the file
1621 but the first line that's not a preprocessor line. */
1622 first_line = false;
1624 if (include_line (line))
1626 current_file->line++;
1627 continue;
1630 /* Add line. */
1632 b = gfc_getmem (gfc_linebuf_header_size + len + 1);
1634 #ifdef USE_MAPPED_LOCATION
1635 b->location
1636 = linemap_line_start (line_table, current_file->line++, 120);
1637 #else
1638 b->linenum = current_file->line++;
1639 #endif
1640 b->file = current_file;
1641 b->truncated = trunc;
1642 strcpy (b->line, line);
1644 if (line_head == NULL)
1645 line_head = b;
1646 else
1647 line_tail->next = b;
1649 line_tail = b;
1651 while (file_changes_cur < file_changes_count)
1652 file_changes[file_changes_cur++].lb = b;
1655 /* Release the line buffer allocated in load_line. */
1656 gfc_free (line);
1658 fclose (input);
1660 if (!initial)
1661 add_file_change (NULL, current_file->inclusion_line + 1);
1662 current_file = current_file->up;
1663 #ifdef USE_MAPPED_LOCATION
1664 linemap_add (line_table, LC_LEAVE, 0, NULL, 0);
1665 #endif
1666 return SUCCESS;
1670 /* Open a new file and start scanning from that file. Returns SUCCESS
1671 if everything went OK, FAILURE otherwise. If form == FORM_UKNOWN
1672 it tries to determine the source form from the filename, defaulting
1673 to free form. */
1676 gfc_new_file (void)
1678 try result;
1680 result = load_file (gfc_source_file, true);
1682 gfc_current_locus.lb = line_head;
1683 gfc_current_locus.nextc = (line_head == NULL) ? NULL : line_head->line;
1685 #if 0 /* Debugging aid. */
1686 for (; line_head; line_head = line_head->next)
1687 gfc_status ("%s:%3d %s\n",
1688 #ifdef USE_MAPPED_LOCATION
1689 LOCATION_FILE (line_head->location),
1690 LOCATION_LINE (line_head->location),
1691 #else
1692 line_head->file->filename,
1693 line_head->linenum,
1694 #endif
1695 line_head->line);
1697 exit (0);
1698 #endif
1700 return result;
1703 static char *
1704 unescape_filename (const char *ptr)
1706 const char *p = ptr, *s;
1707 char *d, *ret;
1708 int escaped, unescape = 0;
1710 /* Make filename end at quote. */
1711 escaped = false;
1712 while (*p && ! (! escaped && *p == '"'))
1714 if (escaped)
1715 escaped = false;
1716 else if (*p == '\\')
1718 escaped = true;
1719 unescape++;
1721 ++p;
1724 if (!*p || p[1])
1725 return NULL;
1727 /* Undo effects of cpp_quote_string. */
1728 s = ptr;
1729 d = gfc_getmem (p + 1 - ptr - unescape);
1730 ret = d;
1732 while (s != p)
1734 if (*s == '\\')
1735 *d++ = *++s;
1736 else
1737 *d++ = *s;
1738 s++;
1740 *d = '\0';
1741 return ret;
1744 /* For preprocessed files, if the first tokens are of the form # NUM.
1745 handle the directives so we know the original file name. */
1747 const char *
1748 gfc_read_orig_filename (const char *filename, const char **canon_source_file)
1750 int c, len;
1751 char *dirname;
1753 gfc_src_file = gfc_open_file (filename);
1754 if (gfc_src_file == NULL)
1755 return NULL;
1757 c = getc (gfc_src_file);
1758 ungetc (c, gfc_src_file);
1760 if (c != '#')
1761 return NULL;
1763 len = 0;
1764 load_line (gfc_src_file, &gfc_src_preprocessor_lines[0], &len);
1766 if (strncmp (gfc_src_preprocessor_lines[0], "# 1 \"", 5) != 0)
1767 return NULL;
1769 filename = unescape_filename (gfc_src_preprocessor_lines[0] + 5);
1770 if (filename == NULL)
1771 return NULL;
1773 c = getc (gfc_src_file);
1774 ungetc (c, gfc_src_file);
1776 if (c != '#')
1777 return filename;
1779 len = 0;
1780 load_line (gfc_src_file, &gfc_src_preprocessor_lines[1], &len);
1782 if (strncmp (gfc_src_preprocessor_lines[1], "# 1 \"", 5) != 0)
1783 return filename;
1785 dirname = unescape_filename (gfc_src_preprocessor_lines[1] + 5);
1786 if (dirname == NULL)
1787 return filename;
1789 len = strlen (dirname);
1790 if (len < 3 || dirname[len - 1] != '/' || dirname[len - 2] != '/')
1792 gfc_free (dirname);
1793 return filename;
1795 dirname[len - 2] = '\0';
1796 set_src_pwd (dirname);
1798 if (! IS_ABSOLUTE_PATH (filename))
1800 char *p = gfc_getmem (len + strlen (filename));
1802 memcpy (p, dirname, len - 2);
1803 p[len - 2] = '/';
1804 strcpy (p + len - 1, filename);
1805 *canon_source_file = p;
1808 gfc_free (dirname);
1809 return filename;