2015-01-14 Christophe Lyon <christophe.lyon@linaro.org>
[official-gcc.git] / gcc / fortran / scanner.c
blobf804060a26d319ff4478e0b91856b91d493fdeae
1 /* Character scanner.
2 Copyright (C) 2000-2015 Free Software Foundation, Inc.
3 Contributed by Andy Vaught
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 /* Set of subroutines to (ultimately) return the next character to the
22 various matching subroutines. This file's job is to read files and
23 build up lines that are parsed by the parser. This means that we
24 handle continuation lines and "include" lines.
26 The first thing the scanner does is to load an entire file into
27 memory. We load the entire file into memory for a couple reasons.
28 The first is that we want to be able to deal with nonseekable input
29 (pipes, stdin) and there is a lot of backing up involved during
30 parsing.
32 The second is that we want to be able to print the locus of errors,
33 and an error on line 999999 could conflict with something on line
34 one. Given nonseekable input, we've got to store the whole thing.
36 One thing that helps are the column truncation limits that give us
37 an upper bound on the size of individual lines. We don't store the
38 truncated stuff.
40 From the scanner's viewpoint, the higher level subroutines ask for
41 new characters and do a lot of jumping backwards. */
43 #include "config.h"
44 #include "system.h"
45 #include "coretypes.h"
46 #include "gfortran.h"
47 #include "toplev.h" /* For set_src_pwd. */
48 #include "debug.h"
49 #include "flags.h"
50 #include "cpp.h"
51 #include "scanner.h"
53 /* List of include file search directories. */
54 gfc_directorylist *include_dirs, *intrinsic_modules_dirs;
56 static gfc_file *file_head, *current_file;
58 static int continue_flag, end_flag, openmp_flag, gcc_attribute_flag;
59 static int continue_count, continue_line;
60 static locus openmp_locus;
61 static locus gcc_attribute_locus;
63 gfc_source_form gfc_current_form;
64 static gfc_linebuf *line_head, *line_tail;
66 locus gfc_current_locus;
67 const char *gfc_source_file;
68 static FILE *gfc_src_file;
69 static gfc_char_t *gfc_src_preprocessor_lines[2];
71 static struct gfc_file_change
73 const char *filename;
74 gfc_linebuf *lb;
75 int line;
76 } *file_changes;
77 size_t file_changes_cur, file_changes_count;
78 size_t file_changes_allocated;
81 /* Functions dealing with our wide characters (gfc_char_t) and
82 sequences of such characters. */
84 int
85 gfc_wide_fits_in_byte (gfc_char_t c)
87 return (c <= UCHAR_MAX);
90 static inline int
91 wide_is_ascii (gfc_char_t c)
93 return (gfc_wide_fits_in_byte (c) && ((unsigned char) c & ~0x7f) == 0);
96 int
97 gfc_wide_is_printable (gfc_char_t c)
99 return (gfc_wide_fits_in_byte (c) && ISPRINT ((unsigned char) c));
102 gfc_char_t
103 gfc_wide_tolower (gfc_char_t c)
105 return (wide_is_ascii (c) ? (gfc_char_t) TOLOWER((unsigned char) c) : c);
108 gfc_char_t
109 gfc_wide_toupper (gfc_char_t c)
111 return (wide_is_ascii (c) ? (gfc_char_t) TOUPPER((unsigned char) c) : c);
115 gfc_wide_is_digit (gfc_char_t c)
117 return (c >= '0' && c <= '9');
120 static inline int
121 wide_atoi (gfc_char_t *c)
123 #define MAX_DIGITS 20
124 char buf[MAX_DIGITS+1];
125 int i = 0;
127 while (gfc_wide_is_digit(*c) && i < MAX_DIGITS)
128 buf[i++] = *c++;
129 buf[i] = '\0';
130 return atoi (buf);
133 size_t
134 gfc_wide_strlen (const gfc_char_t *str)
136 size_t i;
138 for (i = 0; str[i]; i++)
141 return i;
144 gfc_char_t *
145 gfc_wide_memset (gfc_char_t *b, gfc_char_t c, size_t len)
147 size_t i;
149 for (i = 0; i < len; i++)
150 b[i] = c;
152 return b;
155 static gfc_char_t *
156 wide_strcpy (gfc_char_t *dest, const gfc_char_t *src)
158 gfc_char_t *d;
160 for (d = dest; (*d = *src) != '\0'; ++src, ++d)
163 return dest;
166 static gfc_char_t *
167 wide_strchr (const gfc_char_t *s, gfc_char_t c)
169 do {
170 if (*s == c)
172 return CONST_CAST(gfc_char_t *, s);
174 } while (*s++);
175 return 0;
178 char *
179 gfc_widechar_to_char (const gfc_char_t *s, int length)
181 size_t len, i;
182 char *res;
184 if (s == NULL)
185 return NULL;
187 /* Passing a negative length is used to indicate that length should be
188 calculated using gfc_wide_strlen(). */
189 len = (length >= 0 ? (size_t) length : gfc_wide_strlen (s));
190 res = XNEWVEC (char, len + 1);
192 for (i = 0; i < len; i++)
194 gcc_assert (gfc_wide_fits_in_byte (s[i]));
195 res[i] = (unsigned char) s[i];
198 res[len] = '\0';
199 return res;
202 gfc_char_t *
203 gfc_char_to_widechar (const char *s)
205 size_t len, i;
206 gfc_char_t *res;
208 if (s == NULL)
209 return NULL;
211 len = strlen (s);
212 res = gfc_get_wide_string (len + 1);
214 for (i = 0; i < len; i++)
215 res[i] = (unsigned char) s[i];
217 res[len] = '\0';
218 return res;
221 static int
222 wide_strncmp (const gfc_char_t *s1, const char *s2, size_t n)
224 gfc_char_t c1, c2;
226 while (n-- > 0)
228 c1 = *s1++;
229 c2 = *s2++;
230 if (c1 != c2)
231 return (c1 > c2 ? 1 : -1);
232 if (c1 == '\0')
233 return 0;
235 return 0;
239 gfc_wide_strncasecmp (const gfc_char_t *s1, const char *s2, size_t n)
241 gfc_char_t c1, c2;
243 while (n-- > 0)
245 c1 = gfc_wide_tolower (*s1++);
246 c2 = TOLOWER (*s2++);
247 if (c1 != c2)
248 return (c1 > c2 ? 1 : -1);
249 if (c1 == '\0')
250 return 0;
252 return 0;
256 /* Main scanner initialization. */
258 void
259 gfc_scanner_init_1 (void)
261 file_head = NULL;
262 line_head = NULL;
263 line_tail = NULL;
265 continue_count = 0;
266 continue_line = 0;
268 end_flag = 0;
272 /* Main scanner destructor. */
274 void
275 gfc_scanner_done_1 (void)
277 gfc_linebuf *lb;
278 gfc_file *f;
280 while(line_head != NULL)
282 lb = line_head->next;
283 free (line_head);
284 line_head = lb;
287 while(file_head != NULL)
289 f = file_head->next;
290 free (file_head->filename);
291 free (file_head);
292 file_head = f;
297 /* Adds path to the list pointed to by list. */
299 static void
300 add_path_to_list (gfc_directorylist **list, const char *path,
301 bool use_for_modules, bool head, bool warn)
303 gfc_directorylist *dir;
304 const char *p;
305 char *q;
306 struct stat st;
307 size_t len;
308 int i;
310 p = path;
311 while (*p == ' ' || *p == '\t') /* someone might do "-I include" */
312 if (*p++ == '\0')
313 return;
315 /* Strip trailing directory separators from the path, as this
316 will confuse Windows systems. */
317 len = strlen (p);
318 q = (char *) alloca (len + 1);
319 memcpy (q, p, len + 1);
320 i = len - 1;
321 while (i >=0 && IS_DIR_SEPARATOR (q[i]))
322 q[i--] = '\0';
324 if (stat (q, &st))
326 if (errno != ENOENT)
327 gfc_warning_now ("Include directory %qs: %s", path,
328 xstrerror(errno));
329 else if (warn)
330 gfc_warning_now (OPT_Wmissing_include_dirs,
331 "Nonexistent include directory %qs", path);
332 return;
334 else if (!S_ISDIR (st.st_mode))
336 gfc_warning_now ("%qs is not a directory", path);
337 return;
340 if (head || *list == NULL)
342 dir = XCNEW (gfc_directorylist);
343 if (!head)
344 *list = dir;
346 else
348 dir = *list;
349 while (dir->next)
350 dir = dir->next;
352 dir->next = XCNEW (gfc_directorylist);
353 dir = dir->next;
356 dir->next = head ? *list : NULL;
357 if (head)
358 *list = dir;
359 dir->use_for_modules = use_for_modules;
360 dir->path = XCNEWVEC (char, strlen (p) + 2);
361 strcpy (dir->path, p);
362 strcat (dir->path, "/"); /* make '/' last character */
366 void
367 gfc_add_include_path (const char *path, bool use_for_modules, bool file_dir,
368 bool warn)
370 add_path_to_list (&include_dirs, path, use_for_modules, file_dir, warn);
372 /* For '#include "..."' these directories are automatically searched. */
373 if (!file_dir)
374 gfc_cpp_add_include_path (xstrdup(path), true);
378 void
379 gfc_add_intrinsic_modules_path (const char *path)
381 add_path_to_list (&intrinsic_modules_dirs, path, true, false, false);
385 /* Release resources allocated for options. */
387 void
388 gfc_release_include_path (void)
390 gfc_directorylist *p;
392 while (include_dirs != NULL)
394 p = include_dirs;
395 include_dirs = include_dirs->next;
396 free (p->path);
397 free (p);
400 while (intrinsic_modules_dirs != NULL)
402 p = intrinsic_modules_dirs;
403 intrinsic_modules_dirs = intrinsic_modules_dirs->next;
404 free (p->path);
405 free (p);
408 free (gfc_option.module_dir);
412 static FILE *
413 open_included_file (const char *name, gfc_directorylist *list,
414 bool module, bool system)
416 char *fullname;
417 gfc_directorylist *p;
418 FILE *f;
420 for (p = list; p; p = p->next)
422 if (module && !p->use_for_modules)
423 continue;
425 fullname = (char *) alloca(strlen (p->path) + strlen (name) + 1);
426 strcpy (fullname, p->path);
427 strcat (fullname, name);
429 f = gfc_open_file (fullname);
430 if (f != NULL)
432 if (gfc_cpp_makedep ())
433 gfc_cpp_add_dep (fullname, system);
435 return f;
439 return NULL;
443 /* Opens file for reading, searching through the include directories
444 given if necessary. If the include_cwd argument is true, we try
445 to open the file in the current directory first. */
447 FILE *
448 gfc_open_included_file (const char *name, bool include_cwd, bool module)
450 FILE *f = NULL;
452 if (IS_ABSOLUTE_PATH (name) || include_cwd)
454 f = gfc_open_file (name);
455 if (f && gfc_cpp_makedep ())
456 gfc_cpp_add_dep (name, false);
459 if (!f)
460 f = open_included_file (name, include_dirs, module, false);
462 return f;
466 /* Test to see if we're at the end of the main source file. */
469 gfc_at_end (void)
471 return end_flag;
475 /* Test to see if we're at the end of the current file. */
478 gfc_at_eof (void)
480 if (gfc_at_end ())
481 return 1;
483 if (line_head == NULL)
484 return 1; /* Null file */
486 if (gfc_current_locus.lb == NULL)
487 return 1;
489 return 0;
493 /* Test to see if we're at the beginning of a new line. */
496 gfc_at_bol (void)
498 if (gfc_at_eof ())
499 return 1;
501 return (gfc_current_locus.nextc == gfc_current_locus.lb->line);
505 /* Test to see if we're at the end of a line. */
508 gfc_at_eol (void)
510 if (gfc_at_eof ())
511 return 1;
513 return (*gfc_current_locus.nextc == '\0');
516 static void
517 add_file_change (const char *filename, int line)
519 if (file_changes_count == file_changes_allocated)
521 if (file_changes_allocated)
522 file_changes_allocated *= 2;
523 else
524 file_changes_allocated = 16;
525 file_changes = XRESIZEVEC (struct gfc_file_change, file_changes,
526 file_changes_allocated);
528 file_changes[file_changes_count].filename = filename;
529 file_changes[file_changes_count].lb = NULL;
530 file_changes[file_changes_count++].line = line;
533 static void
534 report_file_change (gfc_linebuf *lb)
536 size_t c = file_changes_cur;
537 while (c < file_changes_count
538 && file_changes[c].lb == lb)
540 if (file_changes[c].filename)
541 (*debug_hooks->start_source_file) (file_changes[c].line,
542 file_changes[c].filename);
543 else
544 (*debug_hooks->end_source_file) (file_changes[c].line);
545 ++c;
547 file_changes_cur = c;
550 void
551 gfc_start_source_files (void)
553 /* If the debugger wants the name of the main source file,
554 we give it. */
555 if (debug_hooks->start_end_main_source_file)
556 (*debug_hooks->start_source_file) (0, gfc_source_file);
558 file_changes_cur = 0;
559 report_file_change (gfc_current_locus.lb);
562 void
563 gfc_end_source_files (void)
565 report_file_change (NULL);
567 if (debug_hooks->start_end_main_source_file)
568 (*debug_hooks->end_source_file) (0);
571 /* Advance the current line pointer to the next line. */
573 void
574 gfc_advance_line (void)
576 if (gfc_at_end ())
577 return;
579 if (gfc_current_locus.lb == NULL)
581 end_flag = 1;
582 return;
585 if (gfc_current_locus.lb->next
586 && !gfc_current_locus.lb->next->dbg_emitted)
588 report_file_change (gfc_current_locus.lb->next);
589 gfc_current_locus.lb->next->dbg_emitted = true;
592 gfc_current_locus.lb = gfc_current_locus.lb->next;
594 if (gfc_current_locus.lb != NULL)
595 gfc_current_locus.nextc = gfc_current_locus.lb->line;
596 else
598 gfc_current_locus.nextc = NULL;
599 end_flag = 1;
604 /* Get the next character from the input, advancing gfc_current_file's
605 locus. When we hit the end of the line or the end of the file, we
606 start returning a '\n' in order to complete the current statement.
607 No Fortran line conventions are implemented here.
609 Requiring explicit advances to the next line prevents the parse
610 pointer from being on the wrong line if the current statement ends
611 prematurely. */
613 static gfc_char_t
614 next_char (void)
616 gfc_char_t c;
618 if (gfc_current_locus.nextc == NULL)
619 return '\n';
621 c = *gfc_current_locus.nextc++;
622 if (c == '\0')
624 gfc_current_locus.nextc--; /* Remain on this line. */
625 c = '\n';
628 return c;
/* Skip a comment.  On entry the parse pointer is positioned
   immediately after the comment character.  The rest of the line is
   consumed and the scanner moves on to the next line.  If we ever
   implement compiler directives within comments, here is where we
   parse the directive.  */

static void
skip_comment_line (void)
{
  while (next_char () != '\n')
    continue;

  gfc_advance_line ();
}
653 gfc_define_undef_line (void)
655 char *tmp;
657 /* All lines beginning with '#' are either #define or #undef. */
658 if (debug_info_level != DINFO_LEVEL_VERBOSE || gfc_peek_ascii_char () != '#')
659 return 0;
661 if (wide_strncmp (gfc_current_locus.nextc, "#define ", 8) == 0)
663 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[8], -1);
664 (*debug_hooks->define) (gfc_linebuf_linenum (gfc_current_locus.lb),
665 tmp);
666 free (tmp);
669 if (wide_strncmp (gfc_current_locus.nextc, "#undef ", 7) == 0)
671 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[7], -1);
672 (*debug_hooks->undef) (gfc_linebuf_linenum (gfc_current_locus.lb),
673 tmp);
674 free (tmp);
677 /* Skip the rest of the line. */
678 skip_comment_line ();
680 return 1;
684 /* Return true if GCC$ was matched. */
685 static bool
686 skip_gcc_attribute (locus start)
688 bool r = false;
689 char c;
690 locus old_loc = gfc_current_locus;
692 if ((c = next_char ()) == 'g' || c == 'G')
693 if ((c = next_char ()) == 'c' || c == 'C')
694 if ((c = next_char ()) == 'c' || c == 'C')
695 if ((c = next_char ()) == '$')
696 r = true;
698 if (r == false)
699 gfc_current_locus = old_loc;
700 else
702 gcc_attribute_flag = 1;
703 gcc_attribute_locus = old_loc;
704 gfc_current_locus = start;
707 return r;
712 /* Comment lines are null lines, lines containing only blanks or lines
713 on which the first nonblank character is a '!'.
714 Return true if !$ openmp conditional compilation sentinel was
715 seen. */
/* On a false return the current locus is at the start of the first line
   that was not skipped.  This includes !GCC$ lines and, with -fopenmp or
   -fopenmp-simd, !$omp directive lines, which are kept rather than
   treated as comments.  On a true return the locus is just past the '!'
   of the "!$" sentinel.  */
717 static bool
718 skip_free_comments (void)
720 locus start;
721 gfc_char_t c;
722 int at_bol;
724 for (;;)
/* Remember whether this iteration starts at the beginning of a line, and
   where, so that the position can be restored.  */
726 at_bol = gfc_at_bol ();
727 start = gfc_current_locus;
728 if (gfc_at_eof ())
729 break;
/* Find the first nonblank character.  */
732 c = next_char ();
733 while (gfc_is_whitespace (c));
/* A line with nothing but blanks: move on to the next line.  */
735 if (c == '\n')
737 gfc_advance_line ();
738 continue;
741 if (c == '!')
743 /* Keep the !GCC$ line. */
744 if (at_bol && skip_gcc_attribute (start))
745 return false;
747 /* If -fopenmp, we need to handle here 2 things:
748 1) don't treat !$omp as comments, but directives
749 2) handle OpenMP conditional compilation, where
750 !$ should be treated as 2 spaces (for initial lines
751 only if followed by space). */
752 if ((flag_openmp || flag_openmp_simd) && at_bol)
/* old_loc is the position just after the '!'.  */
754 locus old_loc = gfc_current_locus;
755 if (next_char () == '$')
757 c = next_char ();
758 if (c == 'o' || c == 'O')
760 if (((c = next_char ()) == 'm' || c == 'M')
761 && ((c = next_char ()) == 'p' || c == 'P'))
763 if ((c = next_char ()) == ' ' || c == '\t'
764 || continue_flag)
766 while (gfc_is_whitespace (c))
767 c = next_char ();
/* A directive with something after the sentinel: remember where it was
   seen and hand the whole line back to the caller.  */
768 if (c != '\n' && c != '!')
770 openmp_flag = 1;
771 openmp_locus = old_loc;
772 gfc_current_locus = start;
773 return false;
776 else
777 gfc_warning_now ("!$OMP at %C starts a commented "
778 "line as it neither is followed "
779 "by a space nor is a "
780 "continuation line");
/* Not accepted as a directive: go back and re-read the character that
   follows "!$" for the conditional compilation test below.  */
782 gfc_current_locus = old_loc;
783 next_char ();
784 c = next_char ();
/* Conditional compilation sentinel: leave the locus just after the '!'
   and consume the '$'.  */
786 if (continue_flag || c == ' ' || c == '\t')
788 gfc_current_locus = old_loc;
789 next_char ();
790 openmp_flag = 0;
791 return true;
794 gfc_current_locus = old_loc;
/* An ordinary comment.  */
796 skip_comment_line ();
797 continue;
800 break;
/* A line that is not a comment was found, or the file ended.  Reset the
   sentinel flags and return to the start of that line.  */
803 if (openmp_flag && at_bol)
804 openmp_flag = 0;
806 gcc_attribute_flag = 0;
807 gfc_current_locus = start;
808 return false;
812 /* Skip comment lines in fixed source mode. We have the same rules as
813 in skip_free_comments(), except that we can have a 'c', 'C' or '*'
814 in column 1, and a '!' cannot be in column 6. Also, we deal with
815 lines with 'd' or 'D' in column 1, if the user requested this. */
/* On return the current locus is at the start of the first line that was
   not skipped.  Lines carrying a GCC$ attribute or, with -fopenmp or
   -fopenmp-simd, an OpenMP directive are kept, and their comment
   character is overwritten with '*'.  */
817 static void
818 skip_fixed_comments (void)
820 locus start;
821 int col;
822 gfc_char_t c;
/* When called in the middle of a line, only the remainder of that line
   is examined first: if it is blank or a '!' comment it is skipped;
   otherwise the position is restored and nothing else is done.  */
824 if (! gfc_at_bol ())
826 start = gfc_current_locus;
827 if (! gfc_at_eof ())
830 c = next_char ();
831 while (gfc_is_whitespace (c));
833 if (c == '\n')
834 gfc_advance_line ();
835 else if (c == '!')
836 skip_comment_line ();
839 if (! gfc_at_bol ())
841 gfc_current_locus = start;
842 return;
/* From here on every iteration starts at the beginning of a line.  */
846 for (;;)
848 start = gfc_current_locus;
849 if (gfc_at_eof ())
850 break;
852 c = next_char ();
/* Empty line.  */
853 if (c == '\n')
855 gfc_advance_line ();
856 continue;
/* Comment character in column 1.  */
859 if (c == '!' || c == 'c' || c == 'C' || c == '*')
861 if (skip_gcc_attribute (start))
863 /* Canonicalize the comment character to '*'. */
864 *start.nextc = '*';
865 return;
868 /* If -fopenmp, we need to handle here 2 things:
869 1) don't treat !$omp|c$omp|*$omp as comments, but directives
870 2) handle OpenMP conditional compilation, where
871 !$|c$|*$ should be treated as 2 spaces if the characters
872 in columns 3 to 6 are valid fixed form label columns
873 characters. */
/* Keep continue_line at the highest line number seen so far.  */
874 if (gfc_current_locus.lb != NULL
875 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
876 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
878 if (flag_openmp || flag_openmp_simd)
880 if (next_char () == '$')
882 c = next_char ();
883 if (c == 'o' || c == 'O')
885 if (((c = next_char ()) == 'm' || c == 'M')
886 && ((c = next_char ()) == 'p' || c == 'P'))
/* c is now the character following the five-character sentinel.  */
888 c = next_char ();
889 if (c != '\n'
890 && ((openmp_flag && continue_flag)
891 || c == ' ' || c == '\t' || c == '0'))
894 c = next_char ();
895 while (gfc_is_whitespace (c));
/* A directive with text after the sentinel is kept.  */
896 if (c != '\n' && c != '!')
898 /* Canonicalize to *$omp. */
899 *start.nextc = '*';
900 openmp_flag = 1;
901 gfc_current_locus = start;
902 return;
907 else
/* Conditional compilation: check what the following label columns hold
   (blanks, digits, or a tab that jumps straight to column 6).  */
909 int digit_seen = 0;
911 for (col = 3; col < 6; col++, c = next_char ())
912 if (c == ' ')
913 continue;
914 else if (c == '\t')
916 col = 6;
917 break;
919 else if (c < '0' || c > '9')
920 break;
921 else
922 digit_seen = 1;
/* The sentinel is accepted: blank out its two characters and scan the
   line again from its start.  */
924 if (col == 6 && c != '\n'
925 && ((continue_flag && !digit_seen)
926 || c == ' ' || c == '\t' || c == '0'))
928 gfc_current_locus = start;
929 start.nextc[0] = ' ';
930 start.nextc[1] = ' ';
931 continue;
935 gfc_current_locus = start;
/* An ordinary comment line.  */
937 skip_comment_line ();
938 continue;
/* 'd' or 'D' in column 1: when gfc_option.flag_d_lines is 0 the line is
   skipped as a comment; for other values except -1 the character is
   replaced by a blank and the line is scanned as usual.  */
941 if (gfc_option.flag_d_lines != -1 && (c == 'd' || c == 'D'))
943 if (gfc_option.flag_d_lines == 0)
945 skip_comment_line ();
946 continue;
948 else
949 *start.nextc = c = ' ';
/* Skip leading blanks, counting columns.  */
952 col = 1;
954 while (gfc_is_whitespace (c))
956 c = next_char ();
957 col++;
960 if (c == '\n')
962 gfc_advance_line ();
963 continue;
/* A '!' in any column other than 6 starts a comment.  */
966 if (col != 6 && c == '!')
968 if (gfc_current_locus.lb != NULL
969 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
970 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
971 skip_comment_line ();
972 continue;
975 break;
/* A line that is not a comment was found, or the file ended.  Reset the
   sentinel flags and return to the start of that line.  */
978 openmp_flag = 0;
979 gcc_attribute_flag = 0;
980 gfc_current_locus = start;
984 /* Skips the current line if it is a comment. */
986 void
987 gfc_skip_comments (void)
989 if (gfc_current_form == FORM_FREE)
990 skip_free_comments ();
991 else
992 skip_fixed_comments ();
996 /* Get the next character from the input, taking continuation lines
997 and end-of-line comments into account. This implies that comment
998 lines between continued lines must be eaten here. For higher-level
999 subroutines, this flattens continued lines into a single logical
1000 line. The in_string flag denotes whether we're inside a character
1001 context or not. */
/* continue_flag is set while a possible continuation is being followed
   and is cleared again before returning through "done"; continue_count
   is reset whenever '\n' is returned through "done" and at the end of
   the main source file.  */
1003 gfc_char_t
1004 gfc_next_char_literal (gfc_instring in_string)
1006 locus old_loc;
1007 int i, prev_openmp_flag;
1008 gfc_char_t c;
1010 continue_flag = 0;
1012 restart:
1013 c = next_char ();
/* At the end of the main source file nothing can be continued.  */
1014 if (gfc_at_end ())
1016 continue_count = 0;
1017 return c;
1020 if (gfc_current_form == FORM_FREE)
1022 bool openmp_cond_flag;
1024 if (!in_string && c == '!')
/* A '!' at exactly the position recorded for a GCC$ attribute or for an
   OpenMP sentinel is handed to the caller instead of starting a
   comment.  */
1026 if (gcc_attribute_flag
1027 && memcmp (&gfc_current_locus, &gcc_attribute_locus,
1028 sizeof (gfc_current_locus)) == 0)
1029 goto done;
1031 if (openmp_flag
1032 && memcmp (&gfc_current_locus, &openmp_locus,
1033 sizeof (gfc_current_locus)) == 0)
1034 goto done;
1036 /* This line can't be continued */
1039 c = next_char ();
1041 while (c != '\n');
1043 /* Avoid truncation warnings for comment ending lines. */
1044 gfc_current_locus.lb->truncated = 0;
1046 goto done;
1049 /* Check to see if the continuation line was truncated. */
1050 if (warn_line_truncation && gfc_current_locus.lb != NULL
1051 && gfc_current_locus.lb->truncated)
1053 int maxlen = flag_free_line_length;
1054 gfc_char_t *current_nextc = gfc_current_locus.nextc;
/* Point the locus at the truncation column for the duration of the
   warning, then restore it.  */
1056 gfc_current_locus.lb->truncated = 0;
1057 gfc_current_locus.nextc = gfc_current_locus.lb->line + maxlen;
1058 gfc_warning_now (OPT_Wline_truncation,
1059 "Line truncated at %L", &gfc_current_locus);
1060 gfc_current_locus.nextc = current_nextc;
/* Only '&' can introduce a free-form continuation.  */
1063 if (c != '&')
1064 goto done;
1066 /* If the next nonblank character is a ! or \n, we've got a
1067 continuation line. */
1068 old_loc = gfc_current_locus;
1070 c = next_char ();
1071 while (gfc_is_whitespace (c))
1072 c = next_char ();
1074 /* Character constants to be continued cannot have commentary
1075 after the '&'. */
1077 if (in_string && c != '\n')
1079 gfc_current_locus = old_loc;
1080 c = '&';
1081 goto done;
/* Something other than a comment or the end of the line follows, so the
   '&' is an ordinary character.  */
1084 if (c != '!' && c != '\n')
1086 gfc_current_locus = old_loc;
1087 c = '&';
1088 goto done;
1091 prev_openmp_flag = openmp_flag;
1092 continue_flag = 1;
1093 if (c == '!')
1094 skip_comment_line ();
1095 else
1096 gfc_advance_line ();
1098 if (gfc_at_eof ())
1099 goto not_continuation;
1101 /* We've got a continuation line. If we are on the very next line after
1102 the last continuation, increment the continuation line count and
1103 check whether the limit has been exceeded. */
1104 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
1106 if (++continue_count == gfc_option.max_continue_free)
1108 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1109 gfc_warning ("Limit of %d continuations exceeded in "
1110 "statement at %C", gfc_option.max_continue_free);
1114 /* Now find where it continues. First eat any comment lines. */
1115 openmp_cond_flag = skip_free_comments ();
1117 if (gfc_current_locus.lb != NULL
1118 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1119 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
/* The OpenMP state changed between the two lines, so this is not treated
   as a continuation: back up and return the '&' itself.  */
1121 if (prev_openmp_flag != openmp_flag)
1123 gfc_current_locus = old_loc;
1124 openmp_flag = prev_openmp_flag;
1125 c = '&';
1126 goto done;
1129 /* Now that we have a non-comment line, probe ahead for the
1130 first non-whitespace character. If it is another '&', then
1131 reading starts at the next character, otherwise we must back
1132 up to where the whitespace started and resume from there. */
1134 old_loc = gfc_current_locus;
1136 c = next_char ();
1137 while (gfc_is_whitespace (c))
1138 c = next_char ();
/* On an OpenMP continuation line, step over the "!$omp" sentinel (it is
   asserted to be there) and the blanks that follow it.  */
1140 if (openmp_flag)
1142 for (i = 0; i < 5; i++, c = next_char ())
1144 gcc_assert (gfc_wide_tolower (c) == (unsigned char) "!$omp"[i]);
1145 if (i == 4)
1146 old_loc = gfc_current_locus;
1148 while (gfc_is_whitespace (c))
1149 c = next_char ();
1152 if (c != '&')
1154 if (in_string)
/* Un-read the character so that the character constant resumes with
   it.  */
1156 gfc_current_locus.nextc--;
1157 if (warn_ampersand && in_string == INSTRING_WARN)
1158 gfc_warning (OPT_Wampersand,
1159 "Missing %<&%> in continued character "
1160 "constant at %C");
1162 /* Both !$omp and !$ -fopenmp continuation lines have & on the
1163 continuation line only optionally. */
1164 else if (openmp_flag || openmp_cond_flag)
1165 gfc_current_locus.nextc--;
1166 else
1168 c = ' ';
1169 gfc_current_locus = old_loc;
1170 goto done;
1174 else /* Fixed form. */
1176 /* Fixed form continuation. */
1177 if (!in_string && c == '!')
1179 /* Skip comment at end of line. */
1182 c = next_char ();
1184 while (c != '\n');
1186 /* Avoid truncation warnings for comment ending lines. */
1187 gfc_current_locus.lb->truncated = 0;
/* Only the end of a line can be followed by a continuation line.  */
1190 if (c != '\n')
1191 goto done;
1193 /* Check to see if the continuation line was truncated. */
1194 if (warn_line_truncation && gfc_current_locus.lb != NULL
1195 && gfc_current_locus.lb->truncated)
1197 gfc_current_locus.lb->truncated = 0;
1198 gfc_warning_now (OPT_Wline_truncation,
1199 "Line truncated at %L", &gfc_current_locus);
/* Remember the end of this line so that it can be returned to if the
   next line turns out not to be a continuation.  */
1202 prev_openmp_flag = openmp_flag;
1203 continue_flag = 1;
1204 old_loc = gfc_current_locus;
1206 gfc_advance_line ();
1207 skip_fixed_comments ();
1209 /* See if this line is a continuation line. */
1210 if (openmp_flag != prev_openmp_flag)
1212 openmp_flag = prev_openmp_flag;
1213 goto not_continuation;
/* Columns 1 to 5 must be blank, or hold the "*$omp" sentinel (compared
   in lower case) when inside an OpenMP directive.  */
1216 if (!openmp_flag)
1217 for (i = 0; i < 5; i++)
1219 c = next_char ();
1220 if (c != ' ')
1221 goto not_continuation;
1223 else
1224 for (i = 0; i < 5; i++)
1226 c = next_char ();
1227 if (gfc_wide_tolower (c) != (unsigned char) "*$omp"[i])
1228 goto not_continuation;
/* Column 6 marks a continuation unless it holds '0', a blank, or the
   end of the line.  */
1231 c = next_char ();
1232 if (c == '0' || c == ' ' || c == '\n')
1233 goto not_continuation;
1235 /* We've got a continuation line. If we are on the very next line after
1236 the last continuation, increment the continuation line count and
1237 check whether the limit has been exceeded. */
1238 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
1240 if (++continue_count == gfc_option.max_continue_fixed)
1242 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1243 gfc_warning ("Limit of %d continuations exceeded in "
1244 "statement at %C",
1245 gfc_option.max_continue_fixed);
1249 if (gfc_current_locus.lb != NULL
1250 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1251 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
1254 /* Ready to read first character of continuation line, which might
1255 be another continuation line! */
1256 goto restart;
/* The line examined is not a continuation: report the end of the line
   and go back to the position saved in old_loc.  */
1258 not_continuation:
1259 c = '\n';
1260 gfc_current_locus = old_loc;
1262 done:
1263 if (c == '\n')
1264 continue_count = 0;
1265 continue_flag = 0;
1266 return c;
1270 /* Get the next character of input, folded to lowercase. In fixed
1271 form mode, we also ignore spaces. When matcher subroutines are
1272 parsing character literals, they have to call
1273 gfc_next_char_literal(). */
1275 gfc_char_t
1276 gfc_next_char (void)
1278 gfc_char_t c;
1282 c = gfc_next_char_literal (NONSTRING);
1284 while (gfc_current_form == FORM_FIXED && gfc_is_whitespace (c));
1286 return gfc_wide_tolower (c);
1289 char
1290 gfc_next_ascii_char (void)
1292 gfc_char_t c = gfc_next_char ();
1294 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1295 : (unsigned char) UCHAR_MAX);
1299 gfc_char_t
1300 gfc_peek_char (void)
1302 locus old_loc;
1303 gfc_char_t c;
1305 old_loc = gfc_current_locus;
1306 c = gfc_next_char ();
1307 gfc_current_locus = old_loc;
1309 return c;
1313 char
1314 gfc_peek_ascii_char (void)
1316 gfc_char_t c = gfc_peek_char ();
1318 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1319 : (unsigned char) UCHAR_MAX);
1323 /* Recover from an error. We try to get past the current statement
1324 and get lined up for the next. The next statement follows a '\n'
1325 or a ';'. We also assume that we are not within a character
1326 constant, and deal with finding a '\'' or '"'. */
1328 void
1329 gfc_error_recovery (void)
1331 gfc_char_t c, delim;
1333 if (gfc_at_eof ())
1334 return;
1336 for (;;)
1338 c = gfc_next_char ();
1339 if (c == '\n' || c == ';')
1340 break;
1342 if (c != '\'' && c != '"')
1344 if (gfc_at_eof ())
1345 break;
1346 continue;
1348 delim = c;
1350 for (;;)
1352 c = next_char ();
1354 if (c == delim)
1355 break;
1356 if (c == '\n')
1357 return;
1358 if (c == '\\')
1360 c = next_char ();
1361 if (c == '\n')
1362 return;
1365 if (gfc_at_eof ())
1366 break;
1371 /* Read ahead until the next character to be read is not whitespace. */
1373 void
1374 gfc_gobble_whitespace (void)
1376 static int linenum = 0;
1377 locus old_loc;
1378 gfc_char_t c;
1382 old_loc = gfc_current_locus;
1383 c = gfc_next_char_literal (NONSTRING);
1384 /* Issue a warning for nonconforming tabs. We keep track of the line
1385 number because the Fortran matchers will often back up and the same
1386 line will be scanned multiple times. */
1387 if (warn_tabs && c == '\t')
1389 int cur_linenum = LOCATION_LINE (gfc_current_locus.lb->location);
1390 if (cur_linenum != linenum)
1392 linenum = cur_linenum;
1393 gfc_warning_now (OPT_Wtabs, "Nonconforming tab character at %C");
1397 while (gfc_is_whitespace (c));
1399 gfc_current_locus = old_loc;
1403 /* Load a single line into pbuf.
1405 If pbuf points to a NULL pointer, it is allocated.
1406 We truncate lines that are too long, unless we're dealing with
1407 preprocessor lines or if the option -ffixed-line-length-none is set,
1408 in which case we reallocate the buffer to fit the entire line, if
1409 need be.
1410 In fixed mode, we expand a tab that occurs within the statement
1411 label region to expand to spaces that leave the next character in
1412 the source region.
1414 If first_char is not NULL, it's a pointer to a single char value holding
1415 the first character of the line, which has already been read by the
1416 caller. This avoids the use of ungetc().
1418 load_line returns whether the line was truncated.
1420 NOTE: The error machinery isn't available at this point, so we can't
1421 easily report line and column numbers consistent with other
1422 parts of gfortran. */
1424 static int
1425 load_line (FILE *input, gfc_char_t **pbuf, int *pbuflen, const int *first_char)
1427 static int linenum = 0, current_line = 1;
1428 int c, maxlen, i, preprocessor_flag, buflen = *pbuflen;
1429 int trunc_flag = 0, seen_comment = 0;
1430 int seen_printable = 0, seen_ampersand = 0, quoted = ' ';
1431 gfc_char_t *buffer;
1432 bool found_tab = false;
1434 /* Determine the maximum allowed line length. */
1435 if (gfc_current_form == FORM_FREE)
1436 maxlen = flag_free_line_length;
1437 else if (gfc_current_form == FORM_FIXED)
1438 maxlen = flag_fixed_line_length;
1439 else
1440 maxlen = 72;
1442 if (*pbuf == NULL)
1444 /* Allocate the line buffer, storing its length into buflen.
1445 Note that if maxlen==0, indicating that arbitrary-length lines
1446 are allowed, the buffer will be reallocated if this length is
1447 insufficient; since 132 characters is the length of a standard
1448 free-form line, we use that as a starting guess. */
1449 if (maxlen > 0)
1450 buflen = maxlen;
1451 else
1452 buflen = 132;
1454 *pbuf = gfc_get_wide_string (buflen + 1);
1457 i = 0;
1458 buffer = *pbuf;
1460 if (first_char)
1461 c = *first_char;
1462 else
1463 c = getc (input);
1465 /* In order to not truncate preprocessor lines, we have to
1466 remember that this is one. */
1467 preprocessor_flag = (c == '#' ? 1 : 0);
1469 for (;;)
1471 if (c == EOF)
1472 break;
1474 if (c == '\n')
1476 /* Check for illegal use of ampersand. See F95 Standard 3.3.1.3. */
1477 if (gfc_current_form == FORM_FREE
1478 && !seen_printable && seen_ampersand)
1480 if (pedantic)
1481 gfc_error_now ("%<&%> not allowed by itself in line %d",
1482 current_line);
1483 else
1484 gfc_warning_now ("%<&%> not allowed by itself in line %d",
1485 current_line);
1487 break;
1490 if (c == '\r' || c == '\0')
1491 goto next_char; /* Gobble characters. */
1493 if (c == '&')
1495 if (seen_ampersand)
1497 seen_ampersand = 0;
1498 seen_printable = 1;
1500 else
1501 seen_ampersand = 1;
1504 if ((c != '&' && c != '!' && c != ' ') || (c == '!' && !seen_ampersand))
1505 seen_printable = 1;
1507 /* Is this a fixed-form comment? */
1508 if (gfc_current_form == FORM_FIXED && i == 0
1509 && (c == '*' || c == 'c' || c == 'd'))
1510 seen_comment = 1;
1512 if (quoted == ' ')
1514 if (c == '\'' || c == '"')
1515 quoted = c;
1517 else if (c == quoted)
1518 quoted = ' ';
1520 /* Is this a free-form comment? */
1521 if (c == '!' && quoted == ' ')
1522 seen_comment = 1;
1524 /* Vendor extension: "<tab>1" marks a continuation line. */
1525 if (found_tab)
1527 found_tab = false;
1528 if (c >= '1' && c <= '9')
1530 *(buffer-1) = c;
1531 goto next_char;
1535 if (gfc_current_form == FORM_FIXED && c == '\t' && i < 6)
1537 found_tab = true;
1539 if (warn_tabs && seen_comment == 0 && current_line != linenum)
1541 linenum = current_line;
1542 gfc_warning_now (OPT_Wtabs,
1543 "Nonconforming tab character in column %d "
1544 "of line %d", i+1, linenum);
1547 while (i < 6)
1549 *buffer++ = ' ';
1550 i++;
1553 goto next_char;
1556 *buffer++ = c;
1557 i++;
1559 if (maxlen == 0 || preprocessor_flag)
1561 if (i >= buflen)
1563 /* Reallocate line buffer to double size to hold the
1564 overlong line. */
1565 buflen = buflen * 2;
1566 *pbuf = XRESIZEVEC (gfc_char_t, *pbuf, (buflen + 1));
1567 buffer = (*pbuf) + i;
1570 else if (i >= maxlen)
1572 bool trunc_warn = true;
1574 /* Enhancement, if the very next non-space character is an ampersand
1575 or comment that we would otherwise warn about, don't mark as
1576 truncated. */
1578 /* Truncate the rest of the line. */
1579 for (;;)
1581 c = getc (input);
1582 if (c == '\r' || c == ' ')
1583 continue;
1585 if (c == '\n' || c == EOF)
1586 break;
1588 if (!trunc_warn && c != '!')
1589 trunc_warn = true;
1591 if (trunc_warn && ((gfc_current_form == FORM_FIXED && c == '&')
1592 || c == '!'))
1593 trunc_warn = false;
1595 if (c == '!')
1596 seen_comment = 1;
1598 if (trunc_warn && !seen_comment)
1599 trunc_flag = 1;
1602 c = '\n';
1603 continue;
1606 next_char:
1607 c = getc (input);
1610 /* Pad lines to the selected line length in fixed form. */
1611 if (gfc_current_form == FORM_FIXED
1612 && flag_fixed_line_length != 0
1613 && !preprocessor_flag
1614 && c != EOF)
1616 while (i++ < maxlen)
1617 *buffer++ = ' ';
1620 *buffer = '\0';
1621 *pbuflen = buflen;
1622 current_line++;
1624 return trunc_flag;
1628 /* Get a gfc_file structure, initialize it and add it to
1629 the file stack. */
1631 static gfc_file *
1632 get_file (const char *name, enum lc_reason reason ATTRIBUTE_UNUSED)
1634 gfc_file *f;
1636 f = XCNEW (gfc_file);
1638 f->filename = xstrdup (name);
1640 f->next = file_head;
1641 file_head = f;
1643 f->up = current_file;
1644 if (current_file != NULL)
1645 f->inclusion_line = current_file->line;
1647 linemap_add (line_table, reason, false, f->filename, 1);
1649 return f;
1653 /* Deal with a line from the C preprocessor. The
1654 initial octothorp has already been seen. */
1656 static void
1657 preprocessor_line (gfc_char_t *c)
1659 bool flag[5];
1660 int i, line;
1661 gfc_char_t *wide_filename;
1662 gfc_file *f;
1663 int escaped, unescape;
1664 char *filename;
1666 c++;
1667 while (*c == ' ' || *c == '\t')
1668 c++;
1670 if (*c < '0' || *c > '9')
1671 goto bad_cpp_line;
1673 line = wide_atoi (c);
1675 c = wide_strchr (c, ' ');
1676 if (c == NULL)
1678 /* No file name given. Set new line number. */
1679 current_file->line = line;
1680 return;
1683 /* Skip spaces. */
1684 while (*c == ' ' || *c == '\t')
1685 c++;
1687 /* Skip quote. */
1688 if (*c != '"')
1689 goto bad_cpp_line;
1690 ++c;
1692 wide_filename = c;
1694 /* Make filename end at quote. */
1695 unescape = 0;
1696 escaped = false;
1697 while (*c && ! (!escaped && *c == '"'))
1699 if (escaped)
1700 escaped = false;
1701 else if (*c == '\\')
1703 escaped = true;
1704 unescape++;
1706 ++c;
1709 if (! *c)
1710 /* Preprocessor line has no closing quote. */
1711 goto bad_cpp_line;
1713 *c++ = '\0';
1715 /* Undo effects of cpp_quote_string. */
1716 if (unescape)
1718 gfc_char_t *s = wide_filename;
1719 gfc_char_t *d = gfc_get_wide_string (c - wide_filename - unescape);
1721 wide_filename = d;
1722 while (*s)
1724 if (*s == '\\')
1725 *d++ = *++s;
1726 else
1727 *d++ = *s;
1728 s++;
1730 *d = '\0';
1733 /* Get flags. */
1735 flag[1] = flag[2] = flag[3] = flag[4] = false;
1737 for (;;)
1739 c = wide_strchr (c, ' ');
1740 if (c == NULL)
1741 break;
1743 c++;
1744 i = wide_atoi (c);
1746 if (1 <= i && i <= 4)
1747 flag[i] = true;
1750 /* Convert the filename in wide characters into a filename in narrow
1751 characters. */
1752 filename = gfc_widechar_to_char (wide_filename, -1);
1754 /* Interpret flags. */
1756 if (flag[1]) /* Starting new file. */
1758 f = get_file (filename, LC_RENAME);
1759 add_file_change (f->filename, f->inclusion_line);
1760 current_file = f;
1763 if (flag[2]) /* Ending current file. */
1765 if (!current_file->up
1766 || filename_cmp (current_file->up->filename, filename) != 0)
1768 gfc_warning_now_1 ("%s:%d: file %s left but not entered",
1769 current_file->filename, current_file->line,
1770 filename);
1771 if (unescape)
1772 free (wide_filename);
1773 free (filename);
1774 return;
1777 add_file_change (NULL, line);
1778 current_file = current_file->up;
1779 linemap_add (line_table, LC_RENAME, false, current_file->filename,
1780 current_file->line);
1783 /* The name of the file can be a temporary file produced by
1784 cpp. Replace the name if it is different. */
1786 if (filename_cmp (current_file->filename, filename) != 0)
1788 /* FIXME: we leak the old filename because a pointer to it may be stored
1789 in the linemap. Alternative could be using GC or updating linemap to
1790 point to the new name, but there is no API for that currently. */
1791 current_file->filename = xstrdup (filename);
1794 /* Set new line number. */
1795 current_file->line = line;
1796 if (unescape)
1797 free (wide_filename);
1798 free (filename);
1799 return;
1801 bad_cpp_line:
1802 gfc_warning_now_1 ("%s:%d: Illegal preprocessor directive",
1803 current_file->filename, current_file->line);
1804 current_file->line++;
1808 static bool load_file (const char *, const char *, bool);
1810 /* include_line()-- Checks a line buffer to see if it is an include
1811 line. If so, we call load_file() recursively to load the included
1812 file. We never return a syntax error because a statement like
1813 "include = 5" is perfectly legal. We return false if no include was
1814 processed or true if we matched an include. */
1816 static bool
1817 include_line (gfc_char_t *line)
1819 gfc_char_t quote, *c, *begin, *stop;
1820 char *filename;
1822 c = line;
1824 if (flag_openmp || flag_openmp_simd)
1826 if (gfc_current_form == FORM_FREE)
1828 while (*c == ' ' || *c == '\t')
1829 c++;
1830 if (*c == '!' && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1831 c += 3;
1833 else
1835 if ((*c == '!' || *c == 'c' || *c == 'C' || *c == '*')
1836 && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
1837 c += 3;
1841 while (*c == ' ' || *c == '\t')
1842 c++;
1844 if (gfc_wide_strncasecmp (c, "include", 7))
1845 return false;
1847 c += 7;
1848 while (*c == ' ' || *c == '\t')
1849 c++;
1851 /* Find filename between quotes. */
1853 quote = *c++;
1854 if (quote != '"' && quote != '\'')
1855 return false;
1857 begin = c;
1859 while (*c != quote && *c != '\0')
1860 c++;
1862 if (*c == '\0')
1863 return false;
1865 stop = c++;
1867 while (*c == ' ' || *c == '\t')
1868 c++;
1870 if (*c != '\0' && *c != '!')
1871 return false;
1873 /* We have an include line at this point. */
1875 *stop = '\0'; /* It's ok to trash the buffer, as this line won't be
1876 read by anything else. */
1878 filename = gfc_widechar_to_char (begin, -1);
1879 if (!load_file (filename, NULL, false))
1880 exit (FATAL_EXIT_CODE);
1882 free (filename);
1883 return true;
1887 /* Load a file into memory by calling load_line until the file ends. */
1889 static bool
1890 load_file (const char *realfilename, const char *displayedname, bool initial)
1892 gfc_char_t *line;
1893 gfc_linebuf *b;
1894 gfc_file *f;
1895 FILE *input;
1896 int len, line_len;
1897 bool first_line;
1898 const char *filename;
1899 /* If realfilename and displayedname are different and non-null then
1900 surely realfilename is the preprocessed form of
1901 displayedname. */
1902 bool preprocessed_p = (realfilename && displayedname
1903 && strcmp (realfilename, displayedname));
1905 filename = displayedname ? displayedname : realfilename;
1907 for (f = current_file; f; f = f->up)
1908 if (filename_cmp (filename, f->filename) == 0)
1910 fprintf (stderr, "%s:%d: Error: File '%s' is being included "
1911 "recursively\n", current_file->filename, current_file->line,
1912 filename);
1913 return false;
1916 if (initial)
1918 if (gfc_src_file)
1920 input = gfc_src_file;
1921 gfc_src_file = NULL;
1923 else
1924 input = gfc_open_file (realfilename);
1925 if (input == NULL)
1927 gfc_error_now ("Can't open file %qs", filename);
1928 return false;
1931 else
1933 input = gfc_open_included_file (realfilename, false, false);
1934 if (input == NULL)
1936 fprintf (stderr, "%s:%d: Error: Can't open included file '%s'\n",
1937 current_file->filename, current_file->line, filename);
1938 return false;
1942 /* Load the file.
1944 A "non-initial" file means a file that is being included. In
1945 that case we are creating an LC_ENTER map.
1947 An "initial" file means a main file; one that is not included.
1948 That file has already got at least one (surely more) line map(s)
1949 created by gfc_init. So the subsequent map created in that case
1950 must have LC_RENAME reason.
1952 This latter case is not true for a preprocessed file. In that
1953 case, although the file is "initial", the line maps created by
1954 gfc_init was used during the preprocessing of the file. Now that
1955 the preprocessing is over and we are being fed the result of that
1956 preprocessing, we need to create a brand new line map for the
1957 preprocessed file, so the reason is going to be LC_ENTER. */
1959 f = get_file (filename, (initial && !preprocessed_p) ? LC_RENAME : LC_ENTER);
1960 if (!initial)
1961 add_file_change (f->filename, f->inclusion_line);
1962 current_file = f;
1963 current_file->line = 1;
1964 line = NULL;
1965 line_len = 0;
1966 first_line = true;
1968 if (initial && gfc_src_preprocessor_lines[0])
1970 preprocessor_line (gfc_src_preprocessor_lines[0]);
1971 free (gfc_src_preprocessor_lines[0]);
1972 gfc_src_preprocessor_lines[0] = NULL;
1973 if (gfc_src_preprocessor_lines[1])
1975 preprocessor_line (gfc_src_preprocessor_lines[1]);
1976 free (gfc_src_preprocessor_lines[1]);
1977 gfc_src_preprocessor_lines[1] = NULL;
1981 for (;;)
1983 int trunc = load_line (input, &line, &line_len, NULL);
1985 len = gfc_wide_strlen (line);
1986 if (feof (input) && len == 0)
1987 break;
1989 /* If this is the first line of the file, it can contain a byte
1990 order mark (BOM), which we will ignore:
1991 FF FE is UTF-16 little endian,
1992 FE FF is UTF-16 big endian,
1993 EF BB BF is UTF-8. */
1994 if (first_line
1995 && ((line_len >= 2 && line[0] == (unsigned char) '\xFF'
1996 && line[1] == (unsigned char) '\xFE')
1997 || (line_len >= 2 && line[0] == (unsigned char) '\xFE'
1998 && line[1] == (unsigned char) '\xFF')
1999 || (line_len >= 3 && line[0] == (unsigned char) '\xEF'
2000 && line[1] == (unsigned char) '\xBB'
2001 && line[2] == (unsigned char) '\xBF')))
2003 int n = line[1] == (unsigned char) '\xBB' ? 3 : 2;
2004 gfc_char_t *new_char = gfc_get_wide_string (line_len);
2006 wide_strcpy (new_char, &line[n]);
2007 free (line);
2008 line = new_char;
2009 len -= n;
2012 /* There are three things this line can be: a line of Fortran
2013 source, an include line or a C preprocessor directive. */
2015 if (line[0] == '#')
2017 /* When -g3 is specified, it's possible that we emit #define
2018 and #undef lines, which we need to pass to the middle-end
2019 so that it can emit correct debug info. */
2020 if (debug_info_level == DINFO_LEVEL_VERBOSE
2021 && (wide_strncmp (line, "#define ", 8) == 0
2022 || wide_strncmp (line, "#undef ", 7) == 0))
2024 else
2026 preprocessor_line (line);
2027 continue;
2031 /* Preprocessed files have preprocessor lines added before the byte
2032 order mark, so first_line is not about the first line of the file
2033 but the first line that's not a preprocessor line. */
2034 first_line = false;
2036 if (include_line (line))
2038 current_file->line++;
2039 continue;
2042 /* Add line. */
2044 b = XCNEWVAR (gfc_linebuf, gfc_linebuf_header_size
2045 + (len + 1) * sizeof (gfc_char_t));
2048 b->location
2049 = linemap_line_start (line_table, current_file->line++, len);
2050 /* ??? We add the location for the maximum column possible here,
2051 because otherwise if the next call creates a new line-map, it
2052 will not reserve space for any offset. */
2053 if (len > 0)
2054 linemap_position_for_column (line_table, len);
2056 b->file = current_file;
2057 b->truncated = trunc;
2058 wide_strcpy (b->line, line);
2060 if (line_head == NULL)
2061 line_head = b;
2062 else
2063 line_tail->next = b;
2065 line_tail = b;
2067 while (file_changes_cur < file_changes_count)
2068 file_changes[file_changes_cur++].lb = b;
2071 /* Release the line buffer allocated in load_line. */
2072 free (line);
2074 fclose (input);
2076 if (!initial)
2077 add_file_change (NULL, current_file->inclusion_line + 1);
2078 current_file = current_file->up;
2079 linemap_add (line_table, LC_LEAVE, 0, NULL, 0);
2080 return true;
2084 /* Open a new file and start scanning from that file. Returns true
2085 if everything went OK, false otherwise. If form == FORM_UNKNOWN
2086 it tries to determine the source form from the filename, defaulting
2087 to free form. */
2089 bool
2090 gfc_new_file (void)
2092 bool result;
2094 if (gfc_cpp_enabled ())
2096 result = gfc_cpp_preprocess (gfc_source_file);
2097 if (!gfc_cpp_preprocess_only ())
2098 result = load_file (gfc_cpp_temporary_file (), gfc_source_file, true);
2100 else
2101 result = load_file (gfc_source_file, NULL, true);
2103 gfc_current_locus.lb = line_head;
2104 gfc_current_locus.nextc = (line_head == NULL) ? NULL : line_head->line;
2106 #if 0 /* Debugging aid. */
2107 for (; line_head; line_head = line_head->next)
2108 printf ("%s:%3d %s\n", LOCATION_FILE (line_head->location),
2109 LOCATION_LINE (line_head->location), line_head->line);
2111 exit (SUCCESS_EXIT_CODE);
2112 #endif
2114 return result;
2117 static char *
2118 unescape_filename (const char *ptr)
2120 const char *p = ptr, *s;
2121 char *d, *ret;
2122 int escaped, unescape = 0;
2124 /* Make filename end at quote. */
2125 escaped = false;
2126 while (*p && ! (! escaped && *p == '"'))
2128 if (escaped)
2129 escaped = false;
2130 else if (*p == '\\')
2132 escaped = true;
2133 unescape++;
2135 ++p;
2138 if (!*p || p[1])
2139 return NULL;
2141 /* Undo effects of cpp_quote_string. */
2142 s = ptr;
2143 d = XCNEWVEC (char, p + 1 - ptr - unescape);
2144 ret = d;
2146 while (s != p)
2148 if (*s == '\\')
2149 *d++ = *++s;
2150 else
2151 *d++ = *s;
2152 s++;
2154 *d = '\0';
2155 return ret;
2158 /* For preprocessed files, if the first tokens are of the form # NUM.
2159 handle the directives so we know the original file name. */
2161 const char *
2162 gfc_read_orig_filename (const char *filename, const char **canon_source_file)
2164 int c, len;
2165 char *dirname, *tmp;
2167 gfc_src_file = gfc_open_file (filename);
2168 if (gfc_src_file == NULL)
2169 return NULL;
2171 c = getc (gfc_src_file);
2173 if (c != '#')
2174 return NULL;
2176 len = 0;
2177 load_line (gfc_src_file, &gfc_src_preprocessor_lines[0], &len, &c);
2179 if (wide_strncmp (gfc_src_preprocessor_lines[0], "# 1 \"", 5) != 0)
2180 return NULL;
2182 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[0][5], -1);
2183 filename = unescape_filename (tmp);
2184 free (tmp);
2185 if (filename == NULL)
2186 return NULL;
2188 c = getc (gfc_src_file);
2190 if (c != '#')
2191 return filename;
2193 len = 0;
2194 load_line (gfc_src_file, &gfc_src_preprocessor_lines[1], &len, &c);
2196 if (wide_strncmp (gfc_src_preprocessor_lines[1], "# 1 \"", 5) != 0)
2197 return filename;
2199 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[1][5], -1);
2200 dirname = unescape_filename (tmp);
2201 free (tmp);
2202 if (dirname == NULL)
2203 return filename;
2205 len = strlen (dirname);
2206 if (len < 3 || dirname[len - 1] != '/' || dirname[len - 2] != '/')
2208 free (dirname);
2209 return filename;
2211 dirname[len - 2] = '\0';
2212 set_src_pwd (dirname);
2214 if (! IS_ABSOLUTE_PATH (filename))
2216 char *p = XCNEWVEC (char, len + strlen (filename));
2218 memcpy (p, dirname, len - 2);
2219 p[len - 2] = '/';
2220 strcpy (p + len - 1, filename);
2221 *canon_source_file = p;
2224 free (dirname);
2225 return filename;