2 Copyright (C) 2000-2014 Free Software Foundation, Inc.
3 Contributed by Andy Vaught
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 /* Set of subroutines to (ultimately) return the next character to the
22 various matching subroutines. This file's job is to read files and
23 build up lines that are parsed by the parser. This means that we
24 handle continuation lines and "include" lines.
26 The first thing the scanner does is to load an entire file into
27 memory. We load the entire file into memory for a couple reasons.
28 The first is that we want to be able to deal with nonseekable input
29 (pipes, stdin) and there is a lot of backing up involved during
32 The second is that we want to be able to print the locus of errors,
33 and an error on line 999999 could conflict with something on line
34 one. Given nonseekable input, we've got to store the whole thing.
36 One thing that helps is that the column truncation limits give us
37 an upper bound on the size of individual lines. We don't store the
40 From the scanner's viewpoint, the higher level subroutines ask for
41 new characters and do a lot of jumping backwards. */
45 #include "coretypes.h"
47 #include "toplev.h" /* For set_src_pwd. */
53 /* List of include file search directories. */
54 gfc_directorylist
*include_dirs
, *intrinsic_modules_dirs
;
56 static gfc_file
*file_head
, *current_file
;
58 static int continue_flag
, end_flag
, openmp_flag
, gcc_attribute_flag
;
59 static int continue_count
, continue_line
;
60 static locus openmp_locus
;
61 static locus gcc_attribute_locus
;
63 gfc_source_form gfc_current_form
;
64 static gfc_linebuf
*line_head
, *line_tail
;
66 locus gfc_current_locus
;
67 const char *gfc_source_file
;
68 static FILE *gfc_src_file
;
69 static gfc_char_t
*gfc_src_preprocessor_lines
[2];
71 static struct gfc_file_change
77 size_t file_changes_cur
, file_changes_count
;
78 size_t file_changes_allocated
;
81 /* Functions dealing with our wide characters (gfc_char_t) and
82 sequences of such characters. */
85 gfc_wide_fits_in_byte (gfc_char_t c
)
87 return (c
<= UCHAR_MAX
);
91 wide_is_ascii (gfc_char_t c
)
93 return (gfc_wide_fits_in_byte (c
) && ((unsigned char) c
& ~0x7f) == 0);
97 gfc_wide_is_printable (gfc_char_t c
)
99 return (gfc_wide_fits_in_byte (c
) && ISPRINT ((unsigned char) c
));
103 gfc_wide_tolower (gfc_char_t c
)
105 return (wide_is_ascii (c
) ? (gfc_char_t
) TOLOWER((unsigned char) c
) : c
);
109 gfc_wide_toupper (gfc_char_t c
)
111 return (wide_is_ascii (c
) ? (gfc_char_t
) TOUPPER((unsigned char) c
) : c
);
115 gfc_wide_is_digit (gfc_char_t c
)
117 return (c
>= '0' && c
<= '9');
121 wide_atoi (gfc_char_t
*c
)
123 #define MAX_DIGITS 20
124 char buf
[MAX_DIGITS
+1];
127 while (gfc_wide_is_digit(*c
) && i
< MAX_DIGITS
)
134 gfc_wide_strlen (const gfc_char_t
*str
)
138 for (i
= 0; str
[i
]; i
++)
145 gfc_wide_memset (gfc_char_t
*b
, gfc_char_t c
, size_t len
)
149 for (i
= 0; i
< len
; i
++)
156 wide_strcpy (gfc_char_t
*dest
, const gfc_char_t
*src
)
160 for (d
= dest
; (*d
= *src
) != '\0'; ++src
, ++d
)
167 wide_strchr (const gfc_char_t
*s
, gfc_char_t c
)
172 return CONST_CAST(gfc_char_t
*, s
);
179 gfc_widechar_to_char (const gfc_char_t
*s
, int length
)
187 /* Passing a negative length is used to indicate that length should be
188 calculated using gfc_wide_strlen(). */
189 len
= (length
>= 0 ? (size_t) length
: gfc_wide_strlen (s
));
190 res
= XNEWVEC (char, len
+ 1);
192 for (i
= 0; i
< len
; i
++)
194 gcc_assert (gfc_wide_fits_in_byte (s
[i
]));
195 res
[i
] = (unsigned char) s
[i
];
203 gfc_char_to_widechar (const char *s
)
212 res
= gfc_get_wide_string (len
+ 1);
214 for (i
= 0; i
< len
; i
++)
215 res
[i
] = (unsigned char) s
[i
];
222 wide_strncmp (const gfc_char_t
*s1
, const char *s2
, size_t n
)
231 return (c1
> c2
? 1 : -1);
239 gfc_wide_strncasecmp (const gfc_char_t
*s1
, const char *s2
, size_t n
)
245 c1
= gfc_wide_tolower (*s1
++);
246 c2
= TOLOWER (*s2
++);
248 return (c1
> c2
? 1 : -1);
256 /* Main scanner initialization. */
259 gfc_scanner_init_1 (void)
272 /* Main scanner destructor. */
275 gfc_scanner_done_1 (void)
280 while(line_head
!= NULL
)
282 lb
= line_head
->next
;
287 while(file_head
!= NULL
)
290 free (file_head
->filename
);
297 /* Adds path to the list pointed to by list. */
300 add_path_to_list (gfc_directorylist
**list
, const char *path
,
301 bool use_for_modules
, bool head
, bool warn
)
303 gfc_directorylist
*dir
;
311 while (*p
== ' ' || *p
== '\t') /* someone might do "-I include" */
315 /* Strip trailing directory separators from the path, as this
316 will confuse Windows systems. */
318 q
= (char *) alloca (len
+ 1);
319 memcpy (q
, p
, len
+ 1);
321 while (i
>=0 && IS_DIR_SEPARATOR (q
[i
]))
327 gfc_warning_now ("Include directory %qs: %s", path
,
330 gfc_warning_now (OPT_Wmissing_include_dirs
,
331 "Nonexistent include directory %qs", path
);
334 else if (!S_ISDIR (st
.st_mode
))
336 gfc_warning_now ("%qs is not a directory", path
);
340 if (head
|| *list
== NULL
)
342 dir
= XCNEW (gfc_directorylist
);
352 dir
->next
= XCNEW (gfc_directorylist
);
356 dir
->next
= head
? *list
: NULL
;
359 dir
->use_for_modules
= use_for_modules
;
360 dir
->path
= XCNEWVEC (char, strlen (p
) + 2);
361 strcpy (dir
->path
, p
);
362 strcat (dir
->path
, "/"); /* make '/' last character */
367 gfc_add_include_path (const char *path
, bool use_for_modules
, bool file_dir
,
370 add_path_to_list (&include_dirs
, path
, use_for_modules
, file_dir
, warn
);
372 /* For '#include "..."' these directories are automatically searched. */
374 gfc_cpp_add_include_path (xstrdup(path
), true);
379 gfc_add_intrinsic_modules_path (const char *path
)
381 add_path_to_list (&intrinsic_modules_dirs
, path
, true, false, false);
385 /* Release resources allocated for options. */
388 gfc_release_include_path (void)
390 gfc_directorylist
*p
;
392 while (include_dirs
!= NULL
)
395 include_dirs
= include_dirs
->next
;
400 while (intrinsic_modules_dirs
!= NULL
)
402 p
= intrinsic_modules_dirs
;
403 intrinsic_modules_dirs
= intrinsic_modules_dirs
->next
;
408 free (gfc_option
.module_dir
);
413 open_included_file (const char *name
, gfc_directorylist
*list
,
414 bool module
, bool system
)
417 gfc_directorylist
*p
;
420 for (p
= list
; p
; p
= p
->next
)
422 if (module
&& !p
->use_for_modules
)
425 fullname
= (char *) alloca(strlen (p
->path
) + strlen (name
) + 1);
426 strcpy (fullname
, p
->path
);
427 strcat (fullname
, name
);
429 f
= gfc_open_file (fullname
);
432 if (gfc_cpp_makedep ())
433 gfc_cpp_add_dep (fullname
, system
);
443 /* Opens file for reading, searching through the include directories
444 given if necessary. If the include_cwd argument is true, we try
445 to open the file in the current directory first. */
448 gfc_open_included_file (const char *name
, bool include_cwd
, bool module
)
452 if (IS_ABSOLUTE_PATH (name
) || include_cwd
)
454 f
= gfc_open_file (name
);
455 if (f
&& gfc_cpp_makedep ())
456 gfc_cpp_add_dep (name
, false);
460 f
= open_included_file (name
, include_dirs
, module
, false);
466 /* Test to see if we're at the end of the main source file. */
475 /* Test to see if we're at the end of the current file. */
483 if (line_head
== NULL
)
484 return 1; /* Null file */
486 if (gfc_current_locus
.lb
== NULL
)
493 /* Test to see if we're at the beginning of a new line. */
501 return (gfc_current_locus
.nextc
== gfc_current_locus
.lb
->line
);
505 /* Test to see if we're at the end of a line. */
513 return (*gfc_current_locus
.nextc
== '\0');
517 add_file_change (const char *filename
, int line
)
519 if (file_changes_count
== file_changes_allocated
)
521 if (file_changes_allocated
)
522 file_changes_allocated
*= 2;
524 file_changes_allocated
= 16;
525 file_changes
= XRESIZEVEC (struct gfc_file_change
, file_changes
,
526 file_changes_allocated
);
528 file_changes
[file_changes_count
].filename
= filename
;
529 file_changes
[file_changes_count
].lb
= NULL
;
530 file_changes
[file_changes_count
++].line
= line
;
534 report_file_change (gfc_linebuf
*lb
)
536 size_t c
= file_changes_cur
;
537 while (c
< file_changes_count
538 && file_changes
[c
].lb
== lb
)
540 if (file_changes
[c
].filename
)
541 (*debug_hooks
->start_source_file
) (file_changes
[c
].line
,
542 file_changes
[c
].filename
);
544 (*debug_hooks
->end_source_file
) (file_changes
[c
].line
);
547 file_changes_cur
= c
;
551 gfc_start_source_files (void)
553 /* If the debugger wants the name of the main source file,
555 if (debug_hooks
->start_end_main_source_file
)
556 (*debug_hooks
->start_source_file
) (0, gfc_source_file
);
558 file_changes_cur
= 0;
559 report_file_change (gfc_current_locus
.lb
);
563 gfc_end_source_files (void)
565 report_file_change (NULL
);
567 if (debug_hooks
->start_end_main_source_file
)
568 (*debug_hooks
->end_source_file
) (0);
571 /* Advance the current line pointer to the next line. */
574 gfc_advance_line (void)
579 if (gfc_current_locus
.lb
== NULL
)
585 if (gfc_current_locus
.lb
->next
586 && !gfc_current_locus
.lb
->next
->dbg_emitted
)
588 report_file_change (gfc_current_locus
.lb
->next
);
589 gfc_current_locus
.lb
->next
->dbg_emitted
= true;
592 gfc_current_locus
.lb
= gfc_current_locus
.lb
->next
;
594 if (gfc_current_locus
.lb
!= NULL
)
595 gfc_current_locus
.nextc
= gfc_current_locus
.lb
->line
;
598 gfc_current_locus
.nextc
= NULL
;
604 /* Get the next character from the input, advancing gfc_current_file's
605 locus. When we hit the end of the line or the end of the file, we
606 start returning a '\n' in order to complete the current statement.
607 No Fortran line conventions are implemented here.
609 Requiring explicit advances to the next line prevents the parse
610 pointer from being on the wrong line if the current statement ends
618 if (gfc_current_locus
.nextc
== NULL
)
621 c
= *gfc_current_locus
.nextc
++;
624 gfc_current_locus
.nextc
--; /* Remain on this line. */
632 /* Skip a comment. When we come here the parse pointer is positioned
633 immediately after the comment character. If we ever implement
634 compiler directives within comments, here is where we parse the
638 skip_comment_line (void)
653 gfc_define_undef_line (void)
657 /* All lines beginning with '#' are either #define or #undef. */
658 if (debug_info_level
!= DINFO_LEVEL_VERBOSE
|| gfc_peek_ascii_char () != '#')
661 if (wide_strncmp (gfc_current_locus
.nextc
, "#define ", 8) == 0)
663 tmp
= gfc_widechar_to_char (&gfc_current_locus
.nextc
[8], -1);
664 (*debug_hooks
->define
) (gfc_linebuf_linenum (gfc_current_locus
.lb
),
669 if (wide_strncmp (gfc_current_locus
.nextc
, "#undef ", 7) == 0)
671 tmp
= gfc_widechar_to_char (&gfc_current_locus
.nextc
[7], -1);
672 (*debug_hooks
->undef
) (gfc_linebuf_linenum (gfc_current_locus
.lb
),
677 /* Skip the rest of the line. */
678 skip_comment_line ();
684 /* Return true if GCC$ was matched. */
686 skip_gcc_attribute (locus start
)
690 locus old_loc
= gfc_current_locus
;
692 if ((c
= next_char ()) == 'g' || c
== 'G')
693 if ((c
= next_char ()) == 'c' || c
== 'C')
694 if ((c
= next_char ()) == 'c' || c
== 'C')
695 if ((c
= next_char ()) == '$')
699 gfc_current_locus
= old_loc
;
702 gcc_attribute_flag
= 1;
703 gcc_attribute_locus
= old_loc
;
704 gfc_current_locus
= start
;
712 /* Comment lines are null lines, lines containing only blanks or lines
713 on which the first nonblank character is a '!'.
714 Return true if !$ openmp conditional compilation sentinel was
718 skip_free_comments (void)
726 at_bol
= gfc_at_bol ();
727 start
= gfc_current_locus
;
733 while (gfc_is_whitespace (c
));
743 /* Keep the !GCC$ line. */
744 if (at_bol
&& skip_gcc_attribute (start
))
747 /* If -fopenmp, we need to handle here 2 things:
748 1) don't treat !$omp as comments, but directives
749 2) handle OpenMP conditional compilation, where
750 !$ should be treated as 2 spaces (for initial lines
751 only if followed by space). */
752 if ((gfc_option
.gfc_flag_openmp
753 || gfc_option
.gfc_flag_openmp_simd
) && at_bol
)
755 locus old_loc
= gfc_current_locus
;
756 if (next_char () == '$')
759 if (c
== 'o' || c
== 'O')
761 if (((c
= next_char ()) == 'm' || c
== 'M')
762 && ((c
= next_char ()) == 'p' || c
== 'P'))
764 if ((c
= next_char ()) == ' ' || c
== '\t'
767 while (gfc_is_whitespace (c
))
769 if (c
!= '\n' && c
!= '!')
772 openmp_locus
= old_loc
;
773 gfc_current_locus
= start
;
778 gfc_warning_now ("!$OMP at %C starts a commented "
779 "line as it neither is followed "
780 "by a space nor is a "
781 "continuation line");
783 gfc_current_locus
= old_loc
;
787 if (continue_flag
|| c
== ' ' || c
== '\t')
789 gfc_current_locus
= old_loc
;
795 gfc_current_locus
= old_loc
;
797 skip_comment_line ();
804 if (openmp_flag
&& at_bol
)
807 gcc_attribute_flag
= 0;
808 gfc_current_locus
= start
;
813 /* Skip comment lines in fixed source mode. We have the same rules as
814 in skip_free_comments(), except that we can have a 'c', 'C' or '*'
815 in column 1, and a '!' cannot be in column 6. Also, we deal with
816 lines with 'd' or 'D' in column 1, if the user requested this. */
819 skip_fixed_comments (void)
827 start
= gfc_current_locus
;
832 while (gfc_is_whitespace (c
));
837 skip_comment_line ();
842 gfc_current_locus
= start
;
849 start
= gfc_current_locus
;
860 if (c
== '!' || c
== 'c' || c
== 'C' || c
== '*')
862 if (skip_gcc_attribute (start
))
864 /* Canonicalize to *$omp. */
869 /* If -fopenmp, we need to handle here 2 things:
870 1) don't treat !$omp|c$omp|*$omp as comments, but directives
871 2) handle OpenMP conditional compilation, where
872 !$|c$|*$ should be treated as 2 spaces if the characters
873 in columns 3 to 6 are valid fixed form label columns
875 if (gfc_current_locus
.lb
!= NULL
876 && continue_line
< gfc_linebuf_linenum (gfc_current_locus
.lb
))
877 continue_line
= gfc_linebuf_linenum (gfc_current_locus
.lb
);
879 if (gfc_option
.gfc_flag_openmp
|| gfc_option
.gfc_flag_openmp_simd
)
881 if (next_char () == '$')
884 if (c
== 'o' || c
== 'O')
886 if (((c
= next_char ()) == 'm' || c
== 'M')
887 && ((c
= next_char ()) == 'p' || c
== 'P'))
891 && ((openmp_flag
&& continue_flag
)
892 || c
== ' ' || c
== '\t' || c
== '0'))
896 while (gfc_is_whitespace (c
));
897 if (c
!= '\n' && c
!= '!')
899 /* Canonicalize to *$omp. */
902 gfc_current_locus
= start
;
912 for (col
= 3; col
< 6; col
++, c
= next_char ())
920 else if (c
< '0' || c
> '9')
925 if (col
== 6 && c
!= '\n'
926 && ((continue_flag
&& !digit_seen
)
927 || c
== ' ' || c
== '\t' || c
== '0'))
929 gfc_current_locus
= start
;
930 start
.nextc
[0] = ' ';
931 start
.nextc
[1] = ' ';
936 gfc_current_locus
= start
;
938 skip_comment_line ();
942 if (gfc_option
.flag_d_lines
!= -1 && (c
== 'd' || c
== 'D'))
944 if (gfc_option
.flag_d_lines
== 0)
946 skip_comment_line ();
950 *start
.nextc
= c
= ' ';
955 while (gfc_is_whitespace (c
))
967 if (col
!= 6 && c
== '!')
969 if (gfc_current_locus
.lb
!= NULL
970 && continue_line
< gfc_linebuf_linenum (gfc_current_locus
.lb
))
971 continue_line
= gfc_linebuf_linenum (gfc_current_locus
.lb
);
972 skip_comment_line ();
980 gcc_attribute_flag
= 0;
981 gfc_current_locus
= start
;
985 /* Skips the current line if it is a comment. */
988 gfc_skip_comments (void)
990 if (gfc_current_form
== FORM_FREE
)
991 skip_free_comments ();
993 skip_fixed_comments ();
997 /* Get the next character from the input, taking continuation lines
998 and end-of-line comments into account. This implies that comment
999 lines between continued lines must be eaten here. For higher-level
1000 subroutines, this flattens continued lines into a single logical
1001 line. The in_string flag denotes whether we're inside a character
1005 gfc_next_char_literal (gfc_instring in_string
)
1008 int i
, prev_openmp_flag
;
1021 if (gfc_current_form
== FORM_FREE
)
1023 bool openmp_cond_flag
;
1025 if (!in_string
&& c
== '!')
1027 if (gcc_attribute_flag
1028 && memcmp (&gfc_current_locus
, &gcc_attribute_locus
,
1029 sizeof (gfc_current_locus
)) == 0)
1033 && memcmp (&gfc_current_locus
, &openmp_locus
,
1034 sizeof (gfc_current_locus
)) == 0)
1037 /* This line can't be continued */
1044 /* Avoid truncation warnings for comment ending lines. */
1045 gfc_current_locus
.lb
->truncated
= 0;
1050 /* Check to see if the continuation line was truncated. */
1051 if (warn_line_truncation
&& gfc_current_locus
.lb
!= NULL
1052 && gfc_current_locus
.lb
->truncated
)
1054 int maxlen
= flag_free_line_length
;
1055 gfc_char_t
*current_nextc
= gfc_current_locus
.nextc
;
1057 gfc_current_locus
.lb
->truncated
= 0;
1058 gfc_current_locus
.nextc
= gfc_current_locus
.lb
->line
+ maxlen
;
1059 gfc_warning_now (OPT_Wline_truncation
,
1060 "Line truncated at %L", &gfc_current_locus
);
1061 gfc_current_locus
.nextc
= current_nextc
;
1067 /* If the next nonblank character is a ! or \n, we've got a
1068 continuation line. */
1069 old_loc
= gfc_current_locus
;
1072 while (gfc_is_whitespace (c
))
1075 /* Character constants to be continued cannot have commentary
1078 if (in_string
&& c
!= '\n')
1080 gfc_current_locus
= old_loc
;
1085 if (c
!= '!' && c
!= '\n')
1087 gfc_current_locus
= old_loc
;
1092 prev_openmp_flag
= openmp_flag
;
1095 skip_comment_line ();
1097 gfc_advance_line ();
1100 goto not_continuation
;
1102 /* We've got a continuation line. If we are on the very next line after
1103 the last continuation, increment the continuation line count and
1104 check whether the limit has been exceeded. */
1105 if (gfc_linebuf_linenum (gfc_current_locus
.lb
) == continue_line
+ 1)
1107 if (++continue_count
== gfc_option
.max_continue_free
)
1109 if (gfc_notification_std (GFC_STD_GNU
) || pedantic
)
1110 gfc_warning ("Limit of %d continuations exceeded in "
1111 "statement at %C", gfc_option
.max_continue_free
);
1115 /* Now find where it continues. First eat any comment lines. */
1116 openmp_cond_flag
= skip_free_comments ();
1118 if (gfc_current_locus
.lb
!= NULL
1119 && continue_line
< gfc_linebuf_linenum (gfc_current_locus
.lb
))
1120 continue_line
= gfc_linebuf_linenum (gfc_current_locus
.lb
);
1122 if (prev_openmp_flag
!= openmp_flag
)
1124 gfc_current_locus
= old_loc
;
1125 openmp_flag
= prev_openmp_flag
;
1130 /* Now that we have a non-comment line, probe ahead for the
1131 first non-whitespace character. If it is another '&', then
1132 reading starts at the next character, otherwise we must back
1133 up to where the whitespace started and resume from there. */
1135 old_loc
= gfc_current_locus
;
1138 while (gfc_is_whitespace (c
))
1143 for (i
= 0; i
< 5; i
++, c
= next_char ())
1145 gcc_assert (gfc_wide_tolower (c
) == (unsigned char) "!$omp"[i
]);
1147 old_loc
= gfc_current_locus
;
1149 while (gfc_is_whitespace (c
))
1157 gfc_current_locus
.nextc
--;
1158 if (warn_ampersand
&& in_string
== INSTRING_WARN
)
1159 gfc_warning (OPT_Wampersand
,
1160 "Missing %<&%> in continued character "
1163 /* Both !$omp and !$ -fopenmp continuation lines have & on the
1164 continuation line only optionally. */
1165 else if (openmp_flag
|| openmp_cond_flag
)
1166 gfc_current_locus
.nextc
--;
1170 gfc_current_locus
= old_loc
;
1175 else /* Fixed form. */
1177 /* Fixed form continuation. */
1178 if (!in_string
&& c
== '!')
1180 /* Skip comment at end of line. */
1187 /* Avoid truncation warnings for comment ending lines. */
1188 gfc_current_locus
.lb
->truncated
= 0;
1194 /* Check to see if the continuation line was truncated. */
1195 if (warn_line_truncation
&& gfc_current_locus
.lb
!= NULL
1196 && gfc_current_locus
.lb
->truncated
)
1198 gfc_current_locus
.lb
->truncated
= 0;
1199 gfc_warning_now (OPT_Wline_truncation
,
1200 "Line truncated at %L", &gfc_current_locus
);
1203 prev_openmp_flag
= openmp_flag
;
1205 old_loc
= gfc_current_locus
;
1207 gfc_advance_line ();
1208 skip_fixed_comments ();
1210 /* See if this line is a continuation line. */
1211 if (openmp_flag
!= prev_openmp_flag
)
1213 openmp_flag
= prev_openmp_flag
;
1214 goto not_continuation
;
1218 for (i
= 0; i
< 5; i
++)
1222 goto not_continuation
;
1225 for (i
= 0; i
< 5; i
++)
1228 if (gfc_wide_tolower (c
) != (unsigned char) "*$omp"[i
])
1229 goto not_continuation
;
1233 if (c
== '0' || c
== ' ' || c
== '\n')
1234 goto not_continuation
;
1236 /* We've got a continuation line. If we are on the very next line after
1237 the last continuation, increment the continuation line count and
1238 check whether the limit has been exceeded. */
1239 if (gfc_linebuf_linenum (gfc_current_locus
.lb
) == continue_line
+ 1)
1241 if (++continue_count
== gfc_option
.max_continue_fixed
)
1243 if (gfc_notification_std (GFC_STD_GNU
) || pedantic
)
1244 gfc_warning ("Limit of %d continuations exceeded in "
1246 gfc_option
.max_continue_fixed
);
1250 if (gfc_current_locus
.lb
!= NULL
1251 && continue_line
< gfc_linebuf_linenum (gfc_current_locus
.lb
))
1252 continue_line
= gfc_linebuf_linenum (gfc_current_locus
.lb
);
1255 /* Ready to read first character of continuation line, which might
1256 be another continuation line! */
1261 gfc_current_locus
= old_loc
;
1271 /* Get the next character of input, folded to lowercase. In fixed
1272 form mode, we also ignore spaces. When matcher subroutines are
1273 parsing character literals, they have to call
1274 gfc_next_char_literal(). */
1277 gfc_next_char (void)
1283 c
= gfc_next_char_literal (NONSTRING
);
1285 while (gfc_current_form
== FORM_FIXED
&& gfc_is_whitespace (c
));
1287 return gfc_wide_tolower (c
);
1291 gfc_next_ascii_char (void)
1293 gfc_char_t c
= gfc_next_char ();
1295 return (gfc_wide_fits_in_byte (c
) ? (unsigned char) c
1296 : (unsigned char) UCHAR_MAX
);
1301 gfc_peek_char (void)
1306 old_loc
= gfc_current_locus
;
1307 c
= gfc_next_char ();
1308 gfc_current_locus
= old_loc
;
1315 gfc_peek_ascii_char (void)
1317 gfc_char_t c
= gfc_peek_char ();
1319 return (gfc_wide_fits_in_byte (c
) ? (unsigned char) c
1320 : (unsigned char) UCHAR_MAX
);
1324 /* Recover from an error. We try to get past the current statement
1325 and get lined up for the next. The next statement follows a '\n'
1326 or a ';'. We also assume that we are not within a character
1327 constant, and deal with finding a '\'' or '"'. */
1330 gfc_error_recovery (void)
1332 gfc_char_t c
, delim
;
1339 c
= gfc_next_char ();
1340 if (c
== '\n' || c
== ';')
1343 if (c
!= '\'' && c
!= '"')
1372 /* Read ahead until the next character to be read is not whitespace. */
1375 gfc_gobble_whitespace (void)
1377 static int linenum
= 0;
1383 old_loc
= gfc_current_locus
;
1384 c
= gfc_next_char_literal (NONSTRING
);
1385 /* Issue a warning for nonconforming tabs. We keep track of the line
1386 number because the Fortran matchers will often back up and the same
1387 line will be scanned multiple times. */
1388 if (warn_tabs
&& c
== '\t')
1390 int cur_linenum
= LOCATION_LINE (gfc_current_locus
.lb
->location
);
1391 if (cur_linenum
!= linenum
)
1393 linenum
= cur_linenum
;
1394 gfc_warning_now (OPT_Wtabs
, "Nonconforming tab character at %C");
1398 while (gfc_is_whitespace (c
));
1400 gfc_current_locus
= old_loc
;
1404 /* Load a single line into pbuf.
1406 If pbuf points to a NULL pointer, it is allocated.
1407 We truncate lines that are too long, unless we're dealing with
1408 preprocessor lines or if the option -ffixed-line-length-none is set,
1409 in which case we reallocate the buffer to fit the entire line, if
1411 In fixed mode, we expand a tab that occurs within the statement
1412 label region to expand to spaces that leave the next character in
1415 If first_char is not NULL, it's a pointer to a single char value holding
1416 the first character of the line, which has already been read by the
1417 caller. This avoids the use of ungetc().
1419 load_line returns whether the line was truncated.
1421 NOTE: The error machinery isn't available at this point, so we can't
1422 easily report line and column numbers consistent with other
1423 parts of gfortran. */
1426 load_line (FILE *input
, gfc_char_t
**pbuf
, int *pbuflen
, const int *first_char
)
1428 static int linenum
= 0, current_line
= 1;
1429 int c
, maxlen
, i
, preprocessor_flag
, buflen
= *pbuflen
;
1430 int trunc_flag
= 0, seen_comment
= 0;
1431 int seen_printable
= 0, seen_ampersand
= 0, quoted
= ' ';
1433 bool found_tab
= false;
1435 /* Determine the maximum allowed line length. */
1436 if (gfc_current_form
== FORM_FREE
)
1437 maxlen
= flag_free_line_length
;
1438 else if (gfc_current_form
== FORM_FIXED
)
1439 maxlen
= flag_fixed_line_length
;
1445 /* Allocate the line buffer, storing its length into buflen.
1446 Note that if maxlen==0, indicating that arbitrary-length lines
1447 are allowed, the buffer will be reallocated if this length is
1448 insufficient; since 132 characters is the length of a standard
1449 free-form line, we use that as a starting guess. */
1455 *pbuf
= gfc_get_wide_string (buflen
+ 1);
1466 /* In order to not truncate preprocessor lines, we have to
1467 remember that this is one. */
1468 preprocessor_flag
= (c
== '#' ? 1 : 0);
1477 /* Check for illegal use of ampersand. See F95 Standard 3.3.1.3. */
1478 if (gfc_current_form
== FORM_FREE
1479 && !seen_printable
&& seen_ampersand
)
1482 gfc_error_now ("%<&%> not allowed by itself in line %d",
1485 gfc_warning_now ("%<&%> not allowed by itself in line %d",
1491 if (c
== '\r' || c
== '\0')
1492 goto next_char
; /* Gobble characters. */
1505 if ((c
!= '&' && c
!= '!' && c
!= ' ') || (c
== '!' && !seen_ampersand
))
1508 /* Is this a fixed-form comment? */
1509 if (gfc_current_form
== FORM_FIXED
&& i
== 0
1510 && (c
== '*' || c
== 'c' || c
== 'd'))
1515 if (c
== '\'' || c
== '"')
1518 else if (c
== quoted
)
1521 /* Is this a free-form comment? */
1522 if (c
== '!' && quoted
== ' ')
1525 /* Vendor extension: "<tab>1" marks a continuation line. */
1529 if (c
>= '1' && c
<= '9')
1536 if (gfc_current_form
== FORM_FIXED
&& c
== '\t' && i
< 6)
1540 if (warn_tabs
&& seen_comment
== 0 && current_line
!= linenum
)
1542 linenum
= current_line
;
1543 gfc_warning_now (OPT_Wtabs
,
1544 "Nonconforming tab character in column %d "
1545 "of line %d", i
+1, linenum
);
1560 if (maxlen
== 0 || preprocessor_flag
)
1564 /* Reallocate line buffer to double size to hold the
1566 buflen
= buflen
* 2;
1567 *pbuf
= XRESIZEVEC (gfc_char_t
, *pbuf
, (buflen
+ 1));
1568 buffer
= (*pbuf
) + i
;
1571 else if (i
>= maxlen
)
1573 bool trunc_warn
= true;
1575 /* Enhancement, if the very next non-space character is an ampersand
1576 or comment that we would otherwise warn about, don't mark as
1579 /* Truncate the rest of the line. */
1583 if (c
== '\r' || c
== ' ')
1586 if (c
== '\n' || c
== EOF
)
1589 if (!trunc_warn
&& c
!= '!')
1592 if (trunc_warn
&& ((gfc_current_form
== FORM_FIXED
&& c
== '&')
1599 if (trunc_warn
&& !seen_comment
)
1611 /* Pad lines to the selected line length in fixed form. */
1612 if (gfc_current_form
== FORM_FIXED
1613 && flag_fixed_line_length
!= 0
1614 && !preprocessor_flag
1617 while (i
++ < maxlen
)
1629 /* Get a gfc_file structure, initialize it and add it to
1633 get_file (const char *name
, enum lc_reason reason ATTRIBUTE_UNUSED
)
1637 f
= XCNEW (gfc_file
);
1639 f
->filename
= xstrdup (name
);
1641 f
->next
= file_head
;
1644 f
->up
= current_file
;
1645 if (current_file
!= NULL
)
1646 f
->inclusion_line
= current_file
->line
;
1648 linemap_add (line_table
, reason
, false, f
->filename
, 1);
1654 /* Deal with a line from the C preprocessor. The
1655 initial octothorp has already been seen. */
1658 preprocessor_line (gfc_char_t
*c
)
1662 gfc_char_t
*wide_filename
;
1664 int escaped
, unescape
;
1668 while (*c
== ' ' || *c
== '\t')
1671 if (*c
< '0' || *c
> '9')
1674 line
= wide_atoi (c
);
1676 c
= wide_strchr (c
, ' ');
1679 /* No file name given. Set new line number. */
1680 current_file
->line
= line
;
1685 while (*c
== ' ' || *c
== '\t')
1695 /* Make filename end at quote. */
1698 while (*c
&& ! (!escaped
&& *c
== '"'))
1702 else if (*c
== '\\')
1711 /* Preprocessor line has no closing quote. */
1716 /* Undo effects of cpp_quote_string. */
1719 gfc_char_t
*s
= wide_filename
;
1720 gfc_char_t
*d
= gfc_get_wide_string (c
- wide_filename
- unescape
);
1736 flag
[1] = flag
[2] = flag
[3] = flag
[4] = false;
1740 c
= wide_strchr (c
, ' ');
1747 if (1 <= i
&& i
<= 4)
1751 /* Convert the filename in wide characters into a filename in narrow
1753 filename
= gfc_widechar_to_char (wide_filename
, -1);
1755 /* Interpret flags. */
1757 if (flag
[1]) /* Starting new file. */
1759 f
= get_file (filename
, LC_RENAME
);
1760 add_file_change (f
->filename
, f
->inclusion_line
);
1764 if (flag
[2]) /* Ending current file. */
1766 if (!current_file
->up
1767 || filename_cmp (current_file
->up
->filename
, filename
) != 0)
1769 gfc_warning_now_1 ("%s:%d: file %s left but not entered",
1770 current_file
->filename
, current_file
->line
,
1773 free (wide_filename
);
1778 add_file_change (NULL
, line
);
1779 current_file
= current_file
->up
;
1780 linemap_add (line_table
, LC_RENAME
, false, current_file
->filename
,
1781 current_file
->line
);
1784 /* The name of the file can be a temporary file produced by
1785 cpp. Replace the name if it is different. */
1787 if (filename_cmp (current_file
->filename
, filename
) != 0)
1789 /* FIXME: we leak the old filename because a pointer to it may be stored
1790 in the linemap. Alternative could be using GC or updating linemap to
1791 point to the new name, but there is no API for that currently. */
1792 current_file
->filename
= xstrdup (filename
);
1795 /* Set new line number. */
1796 current_file
->line
= line
;
1798 free (wide_filename
);
1803 gfc_warning_now_1 ("%s:%d: Illegal preprocessor directive",
1804 current_file
->filename
, current_file
->line
);
1805 current_file
->line
++;
1809 static bool load_file (const char *, const char *, bool);
1811 /* include_line()-- Checks a line buffer to see if it is an include
1812 line. If so, we call load_file() recursively to load the included
1813 file. We never return a syntax error because a statement like
1814 "include = 5" is perfectly legal. We return false if no include was
1815 processed or true if we matched an include. */
1818 include_line (gfc_char_t
*line
)
1820 gfc_char_t quote
, *c
, *begin
, *stop
;
1825 if (gfc_option
.gfc_flag_openmp
|| gfc_option
.gfc_flag_openmp_simd
)
1827 if (gfc_current_form
== FORM_FREE
)
1829 while (*c
== ' ' || *c
== '\t')
1831 if (*c
== '!' && c
[1] == '$' && (c
[2] == ' ' || c
[2] == '\t'))
1836 if ((*c
== '!' || *c
== 'c' || *c
== 'C' || *c
== '*')
1837 && c
[1] == '$' && (c
[2] == ' ' || c
[2] == '\t'))
1842 while (*c
== ' ' || *c
== '\t')
1845 if (gfc_wide_strncasecmp (c
, "include", 7))
1849 while (*c
== ' ' || *c
== '\t')
1852 /* Find filename between quotes. */
1855 if (quote
!= '"' && quote
!= '\'')
1860 while (*c
!= quote
&& *c
!= '\0')
1868 while (*c
== ' ' || *c
== '\t')
1871 if (*c
!= '\0' && *c
!= '!')
1874 /* We have an include line at this point. */
1876 *stop
= '\0'; /* It's ok to trash the buffer, as this line won't be
1877 read by anything else. */
1879 filename
= gfc_widechar_to_char (begin
, -1);
1880 if (!load_file (filename
, NULL
, false))
1881 exit (FATAL_EXIT_CODE
);
1888 /* Load a file into memory by calling load_line until the file ends. */
1891 load_file (const char *realfilename
, const char *displayedname
, bool initial
)
1899 const char *filename
;
1900 /* If realfilename and displayedname are different and non-null then
1901 surely realfilename is the preprocessed form of
1903 bool preprocessed_p
= (realfilename
&& displayedname
1904 && strcmp (realfilename
, displayedname
));
1906 filename
= displayedname
? displayedname
: realfilename
;
1908 for (f
= current_file
; f
; f
= f
->up
)
1909 if (filename_cmp (filename
, f
->filename
) == 0)
1911 fprintf (stderr
, "%s:%d: Error: File '%s' is being included "
1912 "recursively\n", current_file
->filename
, current_file
->line
,
1921 input
= gfc_src_file
;
1922 gfc_src_file
= NULL
;
1925 input
= gfc_open_file (realfilename
);
1928 gfc_error_now ("Can't open file %qs", filename
);
1934 input
= gfc_open_included_file (realfilename
, false, false);
1937 fprintf (stderr
, "%s:%d: Error: Can't open included file '%s'\n",
1938 current_file
->filename
, current_file
->line
, filename
);
1945 A "non-initial" file means a file that is being included. In
1946 that case we are creating an LC_ENTER map.
1948 An "initial" file means a main file; one that is not included.
1949 That file has already got at least one (surely more) line map(s)
1950 created by gfc_init. So the subsequent map created in that case
1951 must have LC_RENAME reason.
1953 This latter case is not true for a preprocessed file. In that
1954 case, although the file is "initial", the line maps created by
1955 gfc_init was used during the preprocessing of the file. Now that
1956 the preprocessing is over and we are being fed the result of that
1957 preprocessing, we need to create a brand new line map for the
1958 preprocessed file, so the reason is going to be LC_ENTER. */
1960 f
= get_file (filename
, (initial
&& !preprocessed_p
) ? LC_RENAME
: LC_ENTER
);
1962 add_file_change (f
->filename
, f
->inclusion_line
);
1964 current_file
->line
= 1;
1969 if (initial
&& gfc_src_preprocessor_lines
[0])
1971 preprocessor_line (gfc_src_preprocessor_lines
[0]);
1972 free (gfc_src_preprocessor_lines
[0]);
1973 gfc_src_preprocessor_lines
[0] = NULL
;
1974 if (gfc_src_preprocessor_lines
[1])
1976 preprocessor_line (gfc_src_preprocessor_lines
[1]);
1977 free (gfc_src_preprocessor_lines
[1]);
1978 gfc_src_preprocessor_lines
[1] = NULL
;
1984 int trunc
= load_line (input
, &line
, &line_len
, NULL
);
1986 len
= gfc_wide_strlen (line
);
1987 if (feof (input
) && len
== 0)
1990 /* If this is the first line of the file, it can contain a byte
1991 order mark (BOM), which we will ignore:
1992 FF FE is UTF-16 little endian,
1993 FE FF is UTF-16 big endian,
1994 EF BB BF is UTF-8. */
1996 && ((line_len
>= 2 && line
[0] == (unsigned char) '\xFF'
1997 && line
[1] == (unsigned char) '\xFE')
1998 || (line_len
>= 2 && line
[0] == (unsigned char) '\xFE'
1999 && line
[1] == (unsigned char) '\xFF')
2000 || (line_len
>= 3 && line
[0] == (unsigned char) '\xEF'
2001 && line
[1] == (unsigned char) '\xBB'
2002 && line
[2] == (unsigned char) '\xBF')))
2004 int n
= line
[1] == (unsigned char) '\xBB' ? 3 : 2;
2005 gfc_char_t
*new_char
= gfc_get_wide_string (line_len
);
2007 wide_strcpy (new_char
, &line
[n
]);
2013 /* There are three things this line can be: a line of Fortran
2014 source, an include line or a C preprocessor directive. */
2018 /* When -g3 is specified, it's possible that we emit #define
2019 and #undef lines, which we need to pass to the middle-end
2020 so that it can emit correct debug info. */
2021 if (debug_info_level
== DINFO_LEVEL_VERBOSE
2022 && (wide_strncmp (line
, "#define ", 8) == 0
2023 || wide_strncmp (line
, "#undef ", 7) == 0))
2027 preprocessor_line (line
);
2032 /* Preprocessed files have preprocessor lines added before the byte
2033 order mark, so first_line is not about the first line of the file
2034 but the first line that's not a preprocessor line. */
2037 if (include_line (line
))
2039 current_file
->line
++;
2045 b
= XCNEWVAR (gfc_linebuf
, gfc_linebuf_header_size
2046 + (len
+ 1) * sizeof (gfc_char_t
));
2050 = linemap_line_start (line_table
, current_file
->line
++, len
);
2051 /* ??? We add the location for the maximum column possible here,
2052 because otherwise if the next call creates a new line-map, it
2053 will not reserve space for any offset. */
2055 linemap_position_for_column (line_table
, len
);
2057 b
->file
= current_file
;
2058 b
->truncated
= trunc
;
2059 wide_strcpy (b
->line
, line
);
2061 if (line_head
== NULL
)
2064 line_tail
->next
= b
;
2068 while (file_changes_cur
< file_changes_count
)
2069 file_changes
[file_changes_cur
++].lb
= b
;
2072 /* Release the line buffer allocated in load_line. */
2078 add_file_change (NULL
, current_file
->inclusion_line
+ 1);
2079 current_file
= current_file
->up
;
2080 linemap_add (line_table
, LC_LEAVE
, 0, NULL
, 0);
2085 /* Open a new file and start scanning from that file. Returns true
2086 if everything went OK, false otherwise. If form == FORM_UNKNOWN
2087 it tries to determine the source form from the filename, defaulting
2095 if (gfc_cpp_enabled ())
2097 result
= gfc_cpp_preprocess (gfc_source_file
);
2098 if (!gfc_cpp_preprocess_only ())
2099 result
= load_file (gfc_cpp_temporary_file (), gfc_source_file
, true);
2102 result
= load_file (gfc_source_file
, NULL
, true);
2104 gfc_current_locus
.lb
= line_head
;
2105 gfc_current_locus
.nextc
= (line_head
== NULL
) ? NULL
: line_head
->line
;
2107 #if 0 /* Debugging aid. */
2108 for (; line_head
; line_head
= line_head
->next
)
2109 printf ("%s:%3d %s\n", LOCATION_FILE (line_head
->location
),
2110 LOCATION_LINE (line_head
->location
), line_head
->line
);
2112 exit (SUCCESS_EXIT_CODE
);
2119 unescape_filename (const char *ptr
)
2121 const char *p
= ptr
, *s
;
2123 int escaped
, unescape
= 0;
2125 /* Make filename end at quote. */
2127 while (*p
&& ! (! escaped
&& *p
== '"'))
2131 else if (*p
== '\\')
2142 /* Undo effects of cpp_quote_string. */
2144 d
= XCNEWVEC (char, p
+ 1 - ptr
- unescape
);
/* For preprocessed files, if the first tokens are of the form # NUM,
   handle the directives so we know the original file name.  */
2163 gfc_read_orig_filename (const char *filename
, const char **canon_source_file
)
2166 char *dirname
, *tmp
;
2168 gfc_src_file
= gfc_open_file (filename
);
2169 if (gfc_src_file
== NULL
)
2172 c
= getc (gfc_src_file
);
2178 load_line (gfc_src_file
, &gfc_src_preprocessor_lines
[0], &len
, &c
);
2180 if (wide_strncmp (gfc_src_preprocessor_lines
[0], "# 1 \"", 5) != 0)
2183 tmp
= gfc_widechar_to_char (&gfc_src_preprocessor_lines
[0][5], -1);
2184 filename
= unescape_filename (tmp
);
2186 if (filename
== NULL
)
2189 c
= getc (gfc_src_file
);
2195 load_line (gfc_src_file
, &gfc_src_preprocessor_lines
[1], &len
, &c
);
2197 if (wide_strncmp (gfc_src_preprocessor_lines
[1], "# 1 \"", 5) != 0)
2200 tmp
= gfc_widechar_to_char (&gfc_src_preprocessor_lines
[1][5], -1);
2201 dirname
= unescape_filename (tmp
);
2203 if (dirname
== NULL
)
2206 len
= strlen (dirname
);
2207 if (len
< 3 || dirname
[len
- 1] != '/' || dirname
[len
- 2] != '/')
2212 dirname
[len
- 2] = '\0';
2213 set_src_pwd (dirname
);
2215 if (! IS_ABSOLUTE_PATH (filename
))
2217 char *p
= XCNEWVEC (char, len
+ strlen (filename
));
2219 memcpy (p
, dirname
, len
- 2);
2221 strcpy (p
+ len
- 1, filename
);
2222 *canon_source_file
= p
;