* ggc.h (empty_string): Delete.
[official-gcc.git] / gcc / fortran / scanner.c
blob82f431da52799f1ce4d3fdd9c15ce88d58f2366c
1 /* Character scanner.
2 Copyright (C) 2000-2017 Free Software Foundation, Inc.
3 Contributed by Andy Vaught
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 /* Set of subroutines to (ultimately) return the next character to the
22 various matching subroutines. This file's job is to read files and
23 build up lines that are parsed by the parser. This means that we
24 handle continuation lines and "include" lines.
26 The first thing the scanner does is to load an entire file into
27 memory. We load the entire file into memory for a couple reasons.
28 The first is that we want to be able to deal with nonseekable input
29 (pipes, stdin) and there is a lot of backing up involved during
30 parsing.
32 The second is that we want to be able to print the locus of errors,
33 and an error on line 999999 could conflict with something on line
34 one. Given nonseekable input, we've got to store the whole thing.
36 One thing that helps is that the column truncation limits give us
37 an upper bound on the size of individual lines. We don't store the
38 truncated stuff.
40 From the scanner's viewpoint, the higher level subroutines ask for
41 new characters and do a lot of jumping backwards. */
43 #include "config.h"
44 #include "system.h"
45 #include "coretypes.h"
46 #include "gfortran.h"
47 #include "toplev.h" /* For set_src_pwd. */
48 #include "debug.h"
49 #include "options.h"
50 #include "cpp.h"
51 #include "scanner.h"
53 /* List of include file search directories. */
54 gfc_directorylist *include_dirs, *intrinsic_modules_dirs;
/* file_head is the head of the gfc_file list released by
   gfc_scanner_done_1.  */
56 static gfc_file *file_head, *current_file;
/* continue_flag is set while gfc_next_char_literal is looking for a
   continuation line; end_flag is what gfc_at_end reports;
   gcc_attribute_flag is set by skip_gcc_attribute when "GCC$" matched.  */
58 static int continue_flag, end_flag, gcc_attribute_flag;
59 /* If !$omp/!$acc occurred in current comment line. */
60 static int openmp_flag, openacc_flag;
/* Number of continuation lines counted for the current statement, and
   the highest line number seen so far while handling continuations.  */
61 static int continue_count, continue_line;
/* Loci recorded by the sentinel helpers when the matching flag is set.  */
62 static locus openmp_locus;
63 static locus openacc_locus;
64 static locus gcc_attribute_locus;
66 gfc_source_form gfc_current_form;
/* Head and tail of the gfc_linebuf list; the head is what
   gfc_scanner_done_1 walks and frees.  */
67 static gfc_linebuf *line_head, *line_tail;
69 locus gfc_current_locus;
70 const char *gfc_source_file;
71 static FILE *gfc_src_file;
72 static gfc_char_t *gfc_src_preprocessor_lines[2];
/* Growable array of file-change records.  add_file_change appends to it
   and report_file_change replays entries starting at file_changes_cur.
   A non-NULL filename is reported as the start of a source file, a NULL
   filename as the end of one.  */
74 static struct gfc_file_change
76 const char *filename;
77 gfc_linebuf *lb;
78 int line;
79 } *file_changes;
/* Replay cursor and number of entries in use.  */
80 size_t file_changes_cur, file_changes_count;
/* Number of entries currently allocated for file_changes.  */
81 size_t file_changes_allocated;
84 /* Functions dealing with our wide characters (gfc_char_t) and
85 sequences of such characters. */
87 int
88 gfc_wide_fits_in_byte (gfc_char_t c)
90 return (c <= UCHAR_MAX);
93 static inline int
94 wide_is_ascii (gfc_char_t c)
96 return (gfc_wide_fits_in_byte (c) && ((unsigned char) c & ~0x7f) == 0);
99 int
100 gfc_wide_is_printable (gfc_char_t c)
102 return (gfc_wide_fits_in_byte (c) && ISPRINT ((unsigned char) c));
105 gfc_char_t
106 gfc_wide_tolower (gfc_char_t c)
108 return (wide_is_ascii (c) ? (gfc_char_t) TOLOWER((unsigned char) c) : c);
111 gfc_char_t
112 gfc_wide_toupper (gfc_char_t c)
114 return (wide_is_ascii (c) ? (gfc_char_t) TOUPPER((unsigned char) c) : c);
118 gfc_wide_is_digit (gfc_char_t c)
120 return (c >= '0' && c <= '9');
123 static inline int
124 wide_atoi (gfc_char_t *c)
126 #define MAX_DIGITS 20
127 char buf[MAX_DIGITS+1];
128 int i = 0;
130 while (gfc_wide_is_digit(*c) && i < MAX_DIGITS)
131 buf[i++] = *c++;
132 buf[i] = '\0';
133 return atoi (buf);
136 size_t
137 gfc_wide_strlen (const gfc_char_t *str)
139 size_t i;
141 for (i = 0; str[i]; i++)
144 return i;
147 gfc_char_t *
148 gfc_wide_memset (gfc_char_t *b, gfc_char_t c, size_t len)
150 size_t i;
152 for (i = 0; i < len; i++)
153 b[i] = c;
155 return b;
158 static gfc_char_t *
159 wide_strcpy (gfc_char_t *dest, const gfc_char_t *src)
161 gfc_char_t *d;
163 for (d = dest; (*d = *src) != '\0'; ++src, ++d)
166 return dest;
169 static gfc_char_t *
170 wide_strchr (const gfc_char_t *s, gfc_char_t c)
172 do {
173 if (*s == c)
175 return CONST_CAST(gfc_char_t *, s);
177 } while (*s++);
178 return 0;
181 char *
182 gfc_widechar_to_char (const gfc_char_t *s, int length)
184 size_t len, i;
185 char *res;
187 if (s == NULL)
188 return NULL;
190 /* Passing a negative length is used to indicate that length should be
191 calculated using gfc_wide_strlen(). */
192 len = (length >= 0 ? (size_t) length : gfc_wide_strlen (s));
193 res = XNEWVEC (char, len + 1);
195 for (i = 0; i < len; i++)
197 gcc_assert (gfc_wide_fits_in_byte (s[i]));
198 res[i] = (unsigned char) s[i];
201 res[len] = '\0';
202 return res;
205 gfc_char_t *
206 gfc_char_to_widechar (const char *s)
208 size_t len, i;
209 gfc_char_t *res;
211 if (s == NULL)
212 return NULL;
214 len = strlen (s);
215 res = gfc_get_wide_string (len + 1);
217 for (i = 0; i < len; i++)
218 res[i] = (unsigned char) s[i];
220 res[len] = '\0';
221 return res;
224 static int
225 wide_strncmp (const gfc_char_t *s1, const char *s2, size_t n)
227 gfc_char_t c1, c2;
229 while (n-- > 0)
231 c1 = *s1++;
232 c2 = *s2++;
233 if (c1 != c2)
234 return (c1 > c2 ? 1 : -1);
235 if (c1 == '\0')
236 return 0;
238 return 0;
242 gfc_wide_strncasecmp (const gfc_char_t *s1, const char *s2, size_t n)
244 gfc_char_t c1, c2;
246 while (n-- > 0)
248 c1 = gfc_wide_tolower (*s1++);
249 c2 = TOLOWER (*s2++);
250 if (c1 != c2)
251 return (c1 > c2 ? 1 : -1);
252 if (c1 == '\0')
253 return 0;
255 return 0;
259 /* Main scanner initialization. */
261 void
262 gfc_scanner_init_1 (void)
264 file_head = NULL;
265 line_head = NULL;
266 line_tail = NULL;
268 continue_count = 0;
269 continue_line = 0;
271 end_flag = 0;
275 /* Main scanner destructor. */
277 void
278 gfc_scanner_done_1 (void)
280 gfc_linebuf *lb;
281 gfc_file *f;
283 while(line_head != NULL)
285 lb = line_head->next;
286 free (line_head);
287 line_head = lb;
290 while(file_head != NULL)
292 f = file_head->next;
293 free (file_head->filename);
294 free (file_head);
295 file_head = f;
300 /* Adds path to the list pointed to by list. */
302 static void
303 add_path_to_list (gfc_directorylist **list, const char *path,
304 bool use_for_modules, bool head, bool warn)
306 gfc_directorylist *dir;
307 const char *p;
308 char *q;
309 struct stat st;
310 size_t len;
311 int i;
313 p = path;
314 while (*p == ' ' || *p == '\t') /* someone might do "-I include" */
315 if (*p++ == '\0')
316 return;
318 /* Strip trailing directory separators from the path, as this
319 will confuse Windows systems. */
320 len = strlen (p);
321 q = (char *) alloca (len + 1);
322 memcpy (q, p, len + 1);
323 i = len - 1;
324 while (i >=0 && IS_DIR_SEPARATOR (q[i]))
325 q[i--] = '\0';
327 if (stat (q, &st))
329 if (errno != ENOENT)
330 gfc_warning_now (0, "Include directory %qs: %s", path,
331 xstrerror(errno));
332 else if (warn)
333 gfc_warning_now (OPT_Wmissing_include_dirs,
334 "Nonexistent include directory %qs", path);
335 return;
337 else if (!S_ISDIR (st.st_mode))
339 gfc_fatal_error ("%qs is not a directory", path);
340 return;
343 if (head || *list == NULL)
345 dir = XCNEW (gfc_directorylist);
346 if (!head)
347 *list = dir;
349 else
351 dir = *list;
352 while (dir->next)
353 dir = dir->next;
355 dir->next = XCNEW (gfc_directorylist);
356 dir = dir->next;
359 dir->next = head ? *list : NULL;
360 if (head)
361 *list = dir;
362 dir->use_for_modules = use_for_modules;
363 dir->path = XCNEWVEC (char, strlen (p) + 2);
364 strcpy (dir->path, p);
365 strcat (dir->path, "/"); /* make '/' last character */
369 void
370 gfc_add_include_path (const char *path, bool use_for_modules, bool file_dir,
371 bool warn)
373 add_path_to_list (&include_dirs, path, use_for_modules, file_dir, warn);
375 /* For '#include "..."' these directories are automatically searched. */
376 if (!file_dir)
377 gfc_cpp_add_include_path (xstrdup(path), true);
381 void
382 gfc_add_intrinsic_modules_path (const char *path)
384 add_path_to_list (&intrinsic_modules_dirs, path, true, false, false);
388 /* Release resources allocated for options. */
390 void
391 gfc_release_include_path (void)
393 gfc_directorylist *p;
395 while (include_dirs != NULL)
397 p = include_dirs;
398 include_dirs = include_dirs->next;
399 free (p->path);
400 free (p);
403 while (intrinsic_modules_dirs != NULL)
405 p = intrinsic_modules_dirs;
406 intrinsic_modules_dirs = intrinsic_modules_dirs->next;
407 free (p->path);
408 free (p);
411 free (gfc_option.module_dir);
415 static FILE *
416 open_included_file (const char *name, gfc_directorylist *list,
417 bool module, bool system)
419 char *fullname;
420 gfc_directorylist *p;
421 FILE *f;
423 for (p = list; p; p = p->next)
425 if (module && !p->use_for_modules)
426 continue;
428 fullname = (char *) alloca(strlen (p->path) + strlen (name) + 1);
429 strcpy (fullname, p->path);
430 strcat (fullname, name);
432 f = gfc_open_file (fullname);
433 if (f != NULL)
435 if (gfc_cpp_makedep ())
436 gfc_cpp_add_dep (fullname, system);
438 return f;
442 return NULL;
446 /* Opens file for reading, searching through the include directories
447 given if necessary. If the include_cwd argument is true, we try
448 to open the file in the current directory first. */
450 FILE *
451 gfc_open_included_file (const char *name, bool include_cwd, bool module)
453 FILE *f = NULL;
455 if (IS_ABSOLUTE_PATH (name) || include_cwd)
457 f = gfc_open_file (name);
458 if (f && gfc_cpp_makedep ())
459 gfc_cpp_add_dep (name, false);
462 if (!f)
463 f = open_included_file (name, include_dirs, module, false);
465 return f;
469 /* Test to see if we're at the end of the main source file. */
472 gfc_at_end (void)
474 return end_flag;
478 /* Test to see if we're at the end of the current file. */
481 gfc_at_eof (void)
483 if (gfc_at_end ())
484 return 1;
486 if (line_head == NULL)
487 return 1; /* Null file */
489 if (gfc_current_locus.lb == NULL)
490 return 1;
492 return 0;
496 /* Test to see if we're at the beginning of a new line. */
499 gfc_at_bol (void)
501 if (gfc_at_eof ())
502 return 1;
504 return (gfc_current_locus.nextc == gfc_current_locus.lb->line);
508 /* Test to see if we're at the end of a line. */
511 gfc_at_eol (void)
513 if (gfc_at_eof ())
514 return 1;
516 return (*gfc_current_locus.nextc == '\0');
519 static void
520 add_file_change (const char *filename, int line)
522 if (file_changes_count == file_changes_allocated)
524 if (file_changes_allocated)
525 file_changes_allocated *= 2;
526 else
527 file_changes_allocated = 16;
528 file_changes = XRESIZEVEC (struct gfc_file_change, file_changes,
529 file_changes_allocated);
531 file_changes[file_changes_count].filename = filename;
532 file_changes[file_changes_count].lb = NULL;
533 file_changes[file_changes_count++].line = line;
536 static void
537 report_file_change (gfc_linebuf *lb)
539 size_t c = file_changes_cur;
540 while (c < file_changes_count
541 && file_changes[c].lb == lb)
543 if (file_changes[c].filename)
544 (*debug_hooks->start_source_file) (file_changes[c].line,
545 file_changes[c].filename);
546 else
547 (*debug_hooks->end_source_file) (file_changes[c].line);
548 ++c;
550 file_changes_cur = c;
553 void
554 gfc_start_source_files (void)
556 /* If the debugger wants the name of the main source file,
557 we give it. */
558 if (debug_hooks->start_end_main_source_file)
559 (*debug_hooks->start_source_file) (0, gfc_source_file);
561 file_changes_cur = 0;
562 report_file_change (gfc_current_locus.lb);
565 void
566 gfc_end_source_files (void)
568 report_file_change (NULL);
570 if (debug_hooks->start_end_main_source_file)
571 (*debug_hooks->end_source_file) (0);
574 /* Advance the current line pointer to the next line. */
576 void
577 gfc_advance_line (void)
579 if (gfc_at_end ())
580 return;
582 if (gfc_current_locus.lb == NULL)
584 end_flag = 1;
585 return;
588 if (gfc_current_locus.lb->next
589 && !gfc_current_locus.lb->next->dbg_emitted)
591 report_file_change (gfc_current_locus.lb->next);
592 gfc_current_locus.lb->next->dbg_emitted = true;
595 gfc_current_locus.lb = gfc_current_locus.lb->next;
597 if (gfc_current_locus.lb != NULL)
598 gfc_current_locus.nextc = gfc_current_locus.lb->line;
599 else
601 gfc_current_locus.nextc = NULL;
602 end_flag = 1;
607 /* Get the next character from the input, advancing gfc_current_file's
608 locus. When we hit the end of the line or the end of the file, we
609 start returning a '\n' in order to complete the current statement.
610 No Fortran line conventions are implemented here.
612 Requiring explicit advances to the next line prevents the parse
613 pointer from being on the wrong line if the current statement ends
614 prematurely. */
616 static gfc_char_t
617 next_char (void)
619 gfc_char_t c;
621 if (gfc_current_locus.nextc == NULL)
622 return '\n';
624 c = *gfc_current_locus.nextc++;
625 if (c == '\0')
627 gfc_current_locus.nextc--; /* Remain on this line. */
628 c = '\n';
631 return c;
/* Skip a comment.  On entry the parse pointer is positioned immediately
   after the comment character; the rest of the line is consumed and
   the locus is advanced to the next line.  If compiler directives
   within comments are ever implemented, this is where they would be
   parsed.  */

static void
skip_comment_line (void)
{
  /* At least one character is always read.  */
  while (next_char () != '\n')
    continue;

  gfc_advance_line ();
}
656 gfc_define_undef_line (void)
658 char *tmp;
660 /* All lines beginning with '#' are either #define or #undef. */
661 if (debug_info_level != DINFO_LEVEL_VERBOSE || gfc_peek_ascii_char () != '#')
662 return 0;
664 if (wide_strncmp (gfc_current_locus.nextc, "#define ", 8) == 0)
666 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[8], -1);
667 (*debug_hooks->define) (gfc_linebuf_linenum (gfc_current_locus.lb),
668 tmp);
669 free (tmp);
672 if (wide_strncmp (gfc_current_locus.nextc, "#undef ", 7) == 0)
674 tmp = gfc_widechar_to_char (&gfc_current_locus.nextc[7], -1);
675 (*debug_hooks->undef) (gfc_linebuf_linenum (gfc_current_locus.lb),
676 tmp);
677 free (tmp);
680 /* Skip the rest of the line. */
681 skip_comment_line ();
683 return 1;
687 /* Return true if GCC$ was matched. */
688 static bool
689 skip_gcc_attribute (locus start)
691 bool r = false;
692 char c;
693 locus old_loc = gfc_current_locus;
695 if ((c = next_char ()) == 'g' || c == 'G')
696 if ((c = next_char ()) == 'c' || c == 'C')
697 if ((c = next_char ()) == 'c' || c == 'C')
698 if ((c = next_char ()) == '$')
699 r = true;
701 if (r == false)
702 gfc_current_locus = old_loc;
703 else
705 gcc_attribute_flag = 1;
706 gcc_attribute_locus = old_loc;
707 gfc_current_locus = start;
710 return r;
713 /* Return true if CC was matched. */
714 static bool
715 skip_free_oacc_sentinel (locus start, locus old_loc)
717 bool r = false;
718 char c;
720 if ((c = next_char ()) == 'c' || c == 'C')
721 if ((c = next_char ()) == 'c' || c == 'C')
722 r = true;
724 if (r)
726 if ((c = next_char ()) == ' ' || c == '\t'
727 || continue_flag)
729 while (gfc_is_whitespace (c))
730 c = next_char ();
731 if (c != '\n' && c != '!')
733 openacc_flag = 1;
734 openacc_locus = old_loc;
735 gfc_current_locus = start;
737 else
738 r = false;
740 else
742 gfc_warning_now (0, "!$ACC at %C starts a commented "
743 "line as it neither is followed "
744 "by a space nor is a "
745 "continuation line");
746 r = false;
750 return r;
753 /* Return true if MP was matched. */
754 static bool
755 skip_free_omp_sentinel (locus start, locus old_loc)
757 bool r = false;
758 char c;
760 if ((c = next_char ()) == 'm' || c == 'M')
761 if ((c = next_char ()) == 'p' || c == 'P')
762 r = true;
764 if (r)
766 if ((c = next_char ()) == ' ' || c == '\t'
767 || continue_flag)
769 while (gfc_is_whitespace (c))
770 c = next_char ();
771 if (c != '\n' && c != '!')
773 openmp_flag = 1;
774 openmp_locus = old_loc;
775 gfc_current_locus = start;
777 else
778 r = false;
780 else
782 gfc_warning_now (0, "!$OMP at %C starts a commented "
783 "line as it neither is followed "
784 "by a space nor is a "
785 "continuation line");
786 r = false;
790 return r;
793 /* Comment lines are null lines, lines containing only blanks or lines
794 on which the first nonblank character is a '!'.
795 Return true if !$ openmp or openacc conditional compilation sentinel was
796 seen. */
/* Locus on return:
   - true: positioned just past the "!$" of the conditional compilation
     line, with the corresponding openmp/openacc flag(s) cleared;
   - false from inside the loop: a !GCC$ line or an !$omp / !$acc
     directive was recognized and the helper that matched it has reset
     the locus to the start of that line;
   - false at the bottom: the locus is reset to the start of the first
     line that is not a comment.  */
798 static bool
799 skip_free_comments (void)
801 locus start;
802 gfc_char_t c;
803 int at_bol;
805 for (;;)
/* Remember where this line starts so the locus can be restored.  */
807 at_bol = gfc_at_bol ();
808 start = gfc_current_locus;
809 if (gfc_at_eof ())
810 break;
/* Skip leading whitespace; C ends up as the first nonblank character.  */
813 c = next_char ();
814 while (gfc_is_whitespace (c));
/* A blank line: move on to the next one.  */
816 if (c == '\n')
818 gfc_advance_line ();
819 continue;
822 if (c == '!')
824 /* Keep the !GCC$ line. */
825 if (at_bol && skip_gcc_attribute (start))
826 return false;
828 /* If -fopenmp/-fopenacc, we need to handle here 2 things:
829 1) don't treat !$omp/!$acc as comments, but directives
830 2) handle OpenMP/OpenACC conditional compilation, where
831 !$ should be treated as 2 spaces (for initial lines
832 only if followed by space). */
833 if (at_bol)
/* Case 1: both OpenMP (or OpenMP SIMD) and OpenACC are enabled.  */
835 if ((flag_openmp || flag_openmp_simd)
836 && flag_openacc)
/* OLD_LOC points just past the '!'.  */
838 locus old_loc = gfc_current_locus;
839 if (next_char () == '$')
841 c = next_char ();
842 if (c == 'o' || c == 'O')
844 if (skip_free_omp_sentinel (start, old_loc))
845 return false;
/* Not a directive: rewind to just past "!$" and re-read the
   character that follows it.  */
846 gfc_current_locus = old_loc;
847 next_char ();
848 c = next_char ();
850 else if (c == 'a' || c == 'A')
852 if (skip_free_oacc_sentinel (start, old_loc))
853 return false;
854 gfc_current_locus = old_loc;
855 next_char ();
856 c = next_char ();
/* "!$" followed by a blank (or on a continuation line) is a
   conditional compilation line.  */
858 if (continue_flag || c == ' ' || c == '\t')
860 gfc_current_locus = old_loc;
861 next_char ();
862 openmp_flag = openacc_flag = 0;
863 return true;
866 gfc_current_locus = old_loc;
/* Case 2: only OpenMP (or OpenMP SIMD) is enabled.  */
868 else if ((flag_openmp || flag_openmp_simd)
869 && !flag_openacc)
871 locus old_loc = gfc_current_locus;
872 if (next_char () == '$')
874 c = next_char ();
875 if (c == 'o' || c == 'O')
877 if (skip_free_omp_sentinel (start, old_loc))
878 return false;
879 gfc_current_locus = old_loc;
880 next_char ();
881 c = next_char ();
883 if (continue_flag || c == ' ' || c == '\t')
885 gfc_current_locus = old_loc;
886 next_char ();
887 openmp_flag = 0;
888 return true;
891 gfc_current_locus = old_loc;
/* Case 3: only OpenACC is enabled.  */
893 else if (flag_openacc
894 && !(flag_openmp || flag_openmp_simd))
896 locus old_loc = gfc_current_locus;
897 if (next_char () == '$')
899 c = next_char ();
900 if (c == 'a' || c == 'A')
902 if (skip_free_oacc_sentinel (start, old_loc))
903 return false;
904 gfc_current_locus = old_loc;
905 next_char();
906 c = next_char();
908 if (continue_flag || c == ' ' || c == '\t')
910 gfc_current_locus = old_loc;
911 next_char();
912 openacc_flag = 0;
913 return true;
916 gfc_current_locus = old_loc;
/* An ordinary comment: discard the rest of the line.  */
919 skip_comment_line ();
920 continue;
/* First nonblank character is not '!': this is not a comment line.  */
923 break;
/* A non-comment line that starts at the beginning of a line ends any
   directive that was in progress.  */
926 if (openmp_flag && at_bol)
927 openmp_flag = 0;
929 if (openacc_flag && at_bol)
930 openacc_flag = 0;
932 gcc_attribute_flag = 0;
933 gfc_current_locus = start;
934 return false;
937 /* Return true if MP was matched in fixed form. */
938 static bool
939 skip_fixed_omp_sentinel (locus *start)
941 gfc_char_t c;
942 if (((c = next_char ()) == 'm' || c == 'M')
943 && ((c = next_char ()) == 'p' || c == 'P'))
945 c = next_char ();
946 if (c != '\n'
947 && (continue_flag
948 || c == ' ' || c == '\t' || c == '0'))
951 c = next_char ();
952 while (gfc_is_whitespace (c));
953 if (c != '\n' && c != '!')
955 /* Canonicalize to *$omp. */
956 *start->nextc = '*';
957 openmp_flag = 1;
958 gfc_current_locus = *start;
959 return true;
963 return false;
966 /* Return true if CC was matched in fixed form. */
967 static bool
968 skip_fixed_oacc_sentinel (locus *start)
970 gfc_char_t c;
971 if (((c = next_char ()) == 'c' || c == 'C')
972 && ((c = next_char ()) == 'c' || c == 'C'))
974 c = next_char ();
975 if (c != '\n'
976 && (continue_flag
977 || c == ' ' || c == '\t' || c == '0'))
980 c = next_char ();
981 while (gfc_is_whitespace (c));
982 if (c != '\n' && c != '!')
984 /* Canonicalize to *$acc. */
985 *start->nextc = '*';
986 openacc_flag = 1;
987 gfc_current_locus = *start;
988 return true;
992 return false;
995 /* Skip comment lines in fixed source mode. We have the same rules as
996 in skip_free_comments(), except that we can have a 'c', 'C' or '*'
997 in column 1, and a '!' cannot be in column 6. Also, we deal with
998 lines with 'd' or 'D' in column 1, if the user requested this. */
/* On a normal exit the openmp, openacc and gcc-attribute flags are
   cleared and the locus is reset to the start of the first line that
   is not a comment.  The early returns leave the locus where the
   sentinel / attribute helper put it (the start of the directive
   line).  */
1000 static void
1001 skip_fixed_comments (void)
1003 locus start;
1004 int col;
1005 gfc_char_t c;
/* Called in the middle of a line: only the remainder of this line can
   be skipped, and only if it is blank or a '!' comment.  */
1007 if (! gfc_at_bol ())
1009 start = gfc_current_locus;
1010 if (! gfc_at_eof ())
1013 c = next_char ();
1014 while (gfc_is_whitespace (c));
1016 if (c == '\n')
1017 gfc_advance_line ();
1018 else if (c == '!')
1019 skip_comment_line ();
/* Still not at the beginning of a line: nothing was skipped, so put
   the locus back and stop.  */
1022 if (! gfc_at_bol ())
1024 gfc_current_locus = start;
1025 return;
1029 for (;;)
1031 start = gfc_current_locus;
1032 if (gfc_at_eof ())
1033 break;
1035 c = next_char ();
1036 if (c == '\n')
1038 gfc_advance_line ();
1039 continue;
/* A comment character in column 1.  */
1042 if (c == '!' || c == 'c' || c == 'C' || c == '*')
1044 if (skip_gcc_attribute (start))
1046 /* Canonicalize the comment character of the GCC$ line to '*'. */
1047 *start.nextc = '*';
1048 return;
1051 /* If -fopenmp/-fopenacc, we need to handle here 2 things:
1052 1) don't treat !$omp/!$acc|c$omp/c$acc|*$omp / *$acc as comments,
1053 but directives
1054 2) handle OpenMP/OpenACC conditional compilation, where
1055 !$|c$|*$ should be treated as 2 spaces if the characters
1056 in columns 3 to 6 are valid fixed form label columns
1057 characters. */
1058 if (gfc_current_locus.lb != NULL
1059 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1060 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
/* Only OpenMP (or OpenMP SIMD) enabled.  */
1062 if ((flag_openmp || flag_openmp_simd) && !flag_openacc)
1064 if (next_char () == '$')
1066 c = next_char ();
1067 if (c == 'o' || c == 'O')
1069 if (skip_fixed_omp_sentinel (&start))
1070 return;
1072 else
1073 goto check_for_digits;
1075 gfc_current_locus = start;
/* Only OpenACC enabled.  */
1078 if (flag_openacc && !(flag_openmp || flag_openmp_simd))
1080 if (next_char () == '$')
1082 c = next_char ();
1083 if (c == 'a' || c == 'A')
1085 if (skip_fixed_oacc_sentinel (&start))
1086 return;
1088 else
1089 goto check_for_digits;
1091 gfc_current_locus = start;
/* Any of the three options enabled: accept either sentinel.  */
1094 if (flag_openacc || flag_openmp || flag_openmp_simd)
1096 if (next_char () == '$')
1098 c = next_char ();
1099 if (c == 'a' || c == 'A')
1101 if (skip_fixed_oacc_sentinel (&start))
1102 return;
1104 else if (c == 'o' || c == 'O')
1106 if (skip_fixed_omp_sentinel (&start))
1107 return;
1109 else
1110 goto check_for_digits;
1112 gfc_current_locus = start;
/* An ordinary comment line.  */
1115 skip_comment_line ();
1116 continue;
/* The block below is only entered through the gotos above.  */
1118 gcc_unreachable ();
1119 check_for_digits:
/* Conditional compilation check: columns 3 to 5 may hold only blanks
   and digits (a tab jumps straight to column 6).  */
1121 int digit_seen = 0;
1123 for (col = 3; col < 6; col++, c = next_char ())
1124 if (c == ' ')
1125 continue;
1126 else if (c == '\t')
1128 col = 6;
1129 break;
1131 else if (c < '0' || c > '9')
1132 break;
1133 else
1134 digit_seen = 1;
/* Valid conditional compilation line: blank out the two sentinel
   characters and rescan the line as ordinary source.  */
1136 if (col == 6 && c != '\n'
1137 && ((continue_flag && !digit_seen)
1138 || c == ' ' || c == '\t' || c == '0'))
1140 gfc_current_locus = start;
1141 start.nextc[0] = ' ';
1142 start.nextc[1] = ' ';
1143 continue;
1146 skip_comment_line ();
1147 continue;
/* 'd' / 'D' lines: skipped when flag_d_lines is 0, otherwise the
   letter is replaced by a blank; -1 disables this handling.  */
1150 if (gfc_option.flag_d_lines != -1 && (c == 'd' || c == 'D'))
1152 if (gfc_option.flag_d_lines == 0)
1154 skip_comment_line ();
1155 continue;
1157 else
1158 *start.nextc = c = ' ';
/* Skip leading whitespace, counting columns.  */
1161 col = 1;
1163 while (gfc_is_whitespace (c))
1165 c = next_char ();
1166 col++;
1169 if (c == '\n')
1171 gfc_advance_line ();
1172 continue;
/* A '!' anywhere but column 6 starts a comment.  */
1175 if (col != 6 && c == '!')
1177 if (gfc_current_locus.lb != NULL
1178 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1179 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
1180 skip_comment_line ();
1181 continue;
1184 break;
1187 openmp_flag = 0;
1188 openacc_flag = 0;
1189 gcc_attribute_flag = 0;
1190 gfc_current_locus = start;
1194 /* Skips the current line if it is a comment. */
1196 void
1197 gfc_skip_comments (void)
1199 if (gfc_current_form == FORM_FREE)
1200 skip_free_comments ();
1201 else
1202 skip_fixed_comments ();
1206 /* Get the next character from the input, taking continuation lines
1207 and end-of-line comments into account. This implies that comment
1208 lines between continued lines must be eaten here. For higher-level
1209 subroutines, this flattens continued lines into a single logical
1210 line. The in_string flag denotes whether we're inside a character
1211 context or not. */
/* IN_STRING: when nonzero, a '!' in free form is returned as an
   ordinary character instead of starting a comment; in fixed form the
   '!' is only kept when IN_STRING is INSTRING_WARN.  INSTRING_WARN
   also enables the "Missing '&'" warning for continued character
   constants.

   Returns the character read.  '\n' marks the end of the logical line;
   returning it also resets continue_count.  continue_flag is always
   cleared before returning through the "done" label.  */
1213 gfc_char_t
1214 gfc_next_char_literal (gfc_instring in_string)
1216 locus old_loc;
1217 int i, prev_openmp_flag, prev_openacc_flag;
1218 gfc_char_t c;
1220 continue_flag = 0;
1221 prev_openacc_flag = prev_openmp_flag = 0;
/* Fixed-form continuation jumps back here to read the first character
   of the continuation line.  */
1223 restart:
1224 c = next_char ();
1225 if (gfc_at_end ())
1227 continue_count = 0;
1228 return c;
1231 if (gfc_current_form == FORM_FREE)
1233 bool openmp_cond_flag;
1235 if (!in_string && c == '!')
/* The '!' that begins a recognized !GCC$, !$omp or !$acc line is
   returned as is; the recorded loci identify it.  */
1237 if (gcc_attribute_flag
1238 && memcmp (&gfc_current_locus, &gcc_attribute_locus,
1239 sizeof (gfc_current_locus)) == 0)
1240 goto done;
1242 if (openmp_flag
1243 && memcmp (&gfc_current_locus, &openmp_locus,
1244 sizeof (gfc_current_locus)) == 0)
1245 goto done;
1247 if (openacc_flag
1248 && memcmp (&gfc_current_locus, &openacc_locus,
1249 sizeof (gfc_current_locus)) == 0)
1250 goto done;
1252 /* This line can't be continued */
1255 c = next_char ();
1257 while (c != '\n');
1259 /* Avoid truncation warnings for comment ending lines. */
1260 gfc_current_locus.lb->truncated = 0;
1262 goto done;
1265 /* Check to see if the continuation line was truncated. */
1266 if (warn_line_truncation && gfc_current_locus.lb != NULL
1267 && gfc_current_locus.lb->truncated)
1269 int maxlen = flag_free_line_length;
1270 gfc_char_t *current_nextc = gfc_current_locus.nextc;
/* Temporarily point the locus at the truncation column so the warning
   is reported there, then restore it.  */
1272 gfc_current_locus.lb->truncated = 0;
1273 gfc_current_locus.nextc = gfc_current_locus.lb->line + maxlen;
1274 gfc_warning_now (OPT_Wline_truncation,
1275 "Line truncated at %L", &gfc_current_locus);
1276 gfc_current_locus.nextc = current_nextc;
1279 if (c != '&')
1280 goto done;
1282 /* If the next nonblank character is a ! or \n, we've got a
1283 continuation line. */
1284 old_loc = gfc_current_locus;
1286 c = next_char ();
1287 while (gfc_is_whitespace (c))
1288 c = next_char ();
1290 /* Character constants to be continued cannot have commentary
1291 after the '&'. However, there are cases where we may think we
1292 are still in a string and we are looking for a possible
1293 doubled quote and we end up here. See PR64506. */
1295 if (in_string && c != '\n')
1297 gfc_current_locus = old_loc;
1298 c = '&';
1299 goto done;
/* The '&' is followed by other text on the same line: it is an
   ordinary character, not a continuation marker.  */
1302 if (c != '!' && c != '\n')
1304 gfc_current_locus = old_loc;
1305 c = '&';
1306 goto done;
/* Remember the directive state of the continued line so a change of
   state on the next line can be detected below.  */
1309 if (flag_openmp)
1310 prev_openmp_flag = openmp_flag;
1311 if (flag_openacc)
1312 prev_openacc_flag = openacc_flag;
1314 continue_flag = 1;
1315 if (c == '!')
1316 skip_comment_line ();
1317 else
1318 gfc_advance_line ();
1320 if (gfc_at_eof ())
1321 goto not_continuation;
1323 /* We've got a continuation line. If we are on the very next line after
1324 the last continuation, increment the continuation line count and
1325 check whether the limit has been exceeded. */
1326 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
1328 if (++continue_count == gfc_option.max_continue_free)
1330 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1331 gfc_warning (0, "Limit of %d continuations exceeded in "
1332 "statement at %C", gfc_option.max_continue_free);
1336 /* Now find where it continues. First eat any comment lines. */
1337 openmp_cond_flag = skip_free_comments ();
1339 if (gfc_current_locus.lb != NULL
1340 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1341 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
/* The directive state changed between the two lines: the next line
   does not continue this one, so hand back the '&' itself.  */
1343 if (flag_openmp)
1344 if (prev_openmp_flag != openmp_flag && !openacc_flag)
1346 gfc_current_locus = old_loc;
1347 openmp_flag = prev_openmp_flag;
1348 c = '&';
1349 goto done;
1352 if (flag_openacc)
1353 if (prev_openacc_flag != openacc_flag && !openmp_flag)
1355 gfc_current_locus = old_loc;
1356 openacc_flag = prev_openacc_flag;
1357 c = '&';
1358 goto done;
1361 /* Now that we have a non-comment line, probe ahead for the
1362 first non-whitespace character. If it is another '&', then
1363 reading starts at the next character, otherwise we must back
1364 up to where the whitespace started and resume from there. */
1366 old_loc = gfc_current_locus;
1368 c = next_char ();
1369 while (gfc_is_whitespace (c))
1370 c = next_char ();
/* Step over the "!$omp" sentinel of a continued OpenMP directive.  */
1372 if (openmp_flag && !openacc_flag)
1374 for (i = 0; i < 5; i++, c = next_char ())
1376 gcc_assert (gfc_wide_tolower (c) == (unsigned char) "!$omp"[i]);
1377 if (i == 4)
1378 old_loc = gfc_current_locus;
1380 while (gfc_is_whitespace (c))
1381 c = next_char ();
/* Step over the "!$acc" sentinel of a continued OpenACC directive.  */
1383 if (openacc_flag && !openmp_flag)
1385 for (i = 0; i < 5; i++, c = next_char ())
1387 gcc_assert (gfc_wide_tolower (c) == (unsigned char) "!$acc"[i]);
1388 if (i == 4)
1389 old_loc = gfc_current_locus;
1391 while (gfc_is_whitespace (c))
1392 c = next_char ();
1395 /* In case we have an OpenMP directive continued by OpenACC
1396 sentinel, or vice versa, we get both openmp_flag and
1397 openacc_flag on. */
1399 if (openacc_flag && openmp_flag)
1401 int is_openmp = 0;
1402 for (i = 0; i < 5; i++, c = next_char ())
1404 if (gfc_wide_tolower (c) != (unsigned char) "!$acc"[i])
1405 is_openmp = 1;
1406 if (i == 4)
1407 old_loc = gfc_current_locus;
1409 gfc_error (is_openmp
1410 ? G_("Wrong OpenACC continuation at %C: "
1411 "expected !$ACC, got !$OMP")
1412 : G_("Wrong OpenMP continuation at %C: "
1413 "expected !$OMP, got !$ACC"));
/* The continuation line does not start with '&'.  */
1416 if (c != '&')
1418 if (in_string && gfc_current_locus.nextc)
/* Un-read the character so the restart picks it up again.  */
1420 gfc_current_locus.nextc--;
1421 if (warn_ampersand && in_string == INSTRING_WARN)
1422 gfc_warning (OPT_Wampersand,
1423 "Missing %<&%> in continued character "
1424 "constant at %C");
1426 else if (!in_string && (c == '\'' || c == '"'))
1427 goto done;
1428 /* Both !$omp and !$ -fopenmp continuation lines have & on the
1429 continuation line only optionally. */
1430 else if (openmp_flag || openacc_flag || openmp_cond_flag)
1432 if (gfc_current_locus.nextc)
1433 gfc_current_locus.nextc--;
1435 else
/* Plain continuation without a leading '&': return a blank and resume
   from where the leading whitespace began.  */
1437 c = ' ';
1438 gfc_current_locus = old_loc;
1439 goto done;
1443 else /* Fixed form. */
1445 /* Fixed form continuation. */
1446 if (in_string != INSTRING_WARN && c == '!')
1448 /* Skip comment at end of line. */
1451 c = next_char ();
1453 while (c != '\n');
1455 /* Avoid truncation warnings for comment ending lines. */
1456 gfc_current_locus.lb->truncated = 0;
/* Only the end of a line can be followed by a continuation.  */
1459 if (c != '\n')
1460 goto done;
1462 /* Check to see if the continuation line was truncated. */
1463 if (warn_line_truncation && gfc_current_locus.lb != NULL
1464 && gfc_current_locus.lb->truncated)
1466 gfc_current_locus.lb->truncated = 0;
1467 gfc_warning_now (OPT_Wline_truncation,
1468 "Line truncated at %L", &gfc_current_locus);
1471 if (flag_openmp)
1472 prev_openmp_flag = openmp_flag;
1473 if (flag_openacc)
1474 prev_openacc_flag = openacc_flag;
/* OLD_LOC is where to return to if the next line turns out not to be
   a continuation.  */
1476 continue_flag = 1;
1477 old_loc = gfc_current_locus;
1479 gfc_advance_line ();
1480 skip_fixed_comments ();
1482 /* See if this line is a continuation line. */
1483 if (flag_openmp && openmp_flag != prev_openmp_flag && !openacc_flag)
1485 openmp_flag = prev_openmp_flag;
1486 goto not_continuation;
1488 if (flag_openacc && openacc_flag != prev_openacc_flag && !openmp_flag)
1490 openacc_flag = prev_openacc_flag;
1491 goto not_continuation;
1494 /* In case we have an OpenMP directive continued by OpenACC
1495 sentinel, or vice versa, we get both openmp_flag and
1496 openacc_flag on. */
1497 if (openacc_flag && openmp_flag)
1499 int is_openmp = 0;
1500 for (i = 0; i < 5; i++)
1502 c = next_char ();
1503 if (gfc_wide_tolower (c) != (unsigned char) "*$acc"[i])
1504 is_openmp = 1;
1506 gfc_error (is_openmp
1507 ? G_("Wrong OpenACC continuation at %C: "
1508 "expected !$ACC, got !$OMP")
1509 : G_("Wrong OpenMP continuation at %C: "
1510 "expected !$OMP, got !$ACC"));
/* Ordinary source: columns 1 to 5 of a continuation line must all be
   blanks.  */
1512 else if (!openmp_flag && !openacc_flag)
1513 for (i = 0; i < 5; i++)
1515 c = next_char ();
1516 if (c != ' ')
1517 goto not_continuation;
/* Directive lines: columns 1 to 5 must hold the canonicalized
   sentinel.  */
1519 else if (openmp_flag)
1520 for (i = 0; i < 5; i++)
1522 c = next_char ();
1523 if (gfc_wide_tolower (c) != (unsigned char) "*$omp"[i])
1524 goto not_continuation;
1526 else if (openacc_flag)
1527 for (i = 0; i < 5; i++)
1529 c = next_char ();
1530 if (gfc_wide_tolower (c) != (unsigned char) "*$acc"[i])
1531 goto not_continuation;
/* Column 6: '0', a blank or end of line means an initial line, not a
   continuation.  */
1534 c = next_char ();
1535 if (c == '0' || c == ' ' || c == '\n')
1536 goto not_continuation;
1538 /* We've got a continuation line. If we are on the very next line after
1539 the last continuation, increment the continuation line count and
1540 check whether the limit has been exceeded. */
1541 if (gfc_linebuf_linenum (gfc_current_locus.lb) == continue_line + 1)
1543 if (++continue_count == gfc_option.max_continue_fixed)
1545 if (gfc_notification_std (GFC_STD_GNU) || pedantic)
1546 gfc_warning (0, "Limit of %d continuations exceeded in "
1547 "statement at %C",
1548 gfc_option.max_continue_fixed);
1552 if (gfc_current_locus.lb != NULL
1553 && continue_line < gfc_linebuf_linenum (gfc_current_locus.lb))
1554 continue_line = gfc_linebuf_linenum (gfc_current_locus.lb);
1557 /* Ready to read first character of continuation line, which might
1558 be another continuation line! */
1559 goto restart;
/* The following line does not continue this one: report end of line
   and go back to where the probing started.  end_flag is cleared
   because the probing may have set it.  */
1561 not_continuation:
1562 c = '\n';
1563 gfc_current_locus = old_loc;
1564 end_flag = 0;
1566 done:
1567 if (c == '\n')
1568 continue_count = 0;
1569 continue_flag = 0;
1570 return c;
1574 /* Get the next character of input, folded to lowercase. In fixed
1575 form mode, we also ignore spaces. When matcher subroutines are
1576 parsing character literals, they have to call
1577 gfc_next_char_literal(). */
1579 gfc_char_t
1580 gfc_next_char (void)
1582 gfc_char_t c;
1586 c = gfc_next_char_literal (NONSTRING);
1588 while (gfc_current_form == FORM_FIXED && gfc_is_whitespace (c));
1590 return gfc_wide_tolower (c);
1593 char
1594 gfc_next_ascii_char (void)
1596 gfc_char_t c = gfc_next_char ();
1598 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1599 : (unsigned char) UCHAR_MAX);
1603 gfc_char_t
1604 gfc_peek_char (void)
1606 locus old_loc;
1607 gfc_char_t c;
1609 old_loc = gfc_current_locus;
1610 c = gfc_next_char ();
1611 gfc_current_locus = old_loc;
1613 return c;
1617 char
1618 gfc_peek_ascii_char (void)
1620 gfc_char_t c = gfc_peek_char ();
1622 return (gfc_wide_fits_in_byte (c) ? (unsigned char) c
1623 : (unsigned char) UCHAR_MAX);
1627 /* Recover from an error. We try to get past the current statement
1628 and get lined up for the next. The next statement follows a '\n'
1629 or a ';'. We also assume that we are not within a character
1630 constant, and deal with finding a '\'' or '"'. */
1632 void
1633 gfc_error_recovery (void)
1635 gfc_char_t c, delim;
1637 if (gfc_at_eof ())
1638 return;
1640 for (;;)
1642 c = gfc_next_char ();
1643 if (c == '\n' || c == ';')
1644 break;
1646 if (c != '\'' && c != '"')
1648 if (gfc_at_eof ())
1649 break;
1650 continue;
1652 delim = c;
1654 for (;;)
1656 c = next_char ();
1658 if (c == delim)
1659 break;
1660 if (c == '\n')
1661 return;
1662 if (c == '\\')
1664 c = next_char ();
1665 if (c == '\n')
1666 return;
1669 if (gfc_at_eof ())
1670 break;
1675 /* Read ahead until the next character to be read is not whitespace. */
1677 void
1678 gfc_gobble_whitespace (void)
1680 static int linenum = 0;
1681 locus old_loc;
1682 gfc_char_t c;
1686 old_loc = gfc_current_locus;
1687 c = gfc_next_char_literal (NONSTRING);
1688 /* Issue a warning for nonconforming tabs. We keep track of the line
1689 number because the Fortran matchers will often back up and the same
1690 line will be scanned multiple times. */
1691 if (warn_tabs && c == '\t')
1693 int cur_linenum = LOCATION_LINE (gfc_current_locus.lb->location);
1694 if (cur_linenum != linenum)
1696 linenum = cur_linenum;
1697 gfc_warning_now (OPT_Wtabs, "Nonconforming tab character at %C");
1701 while (gfc_is_whitespace (c));
1703 gfc_current_locus = old_loc;
1707 /* Load a single line into pbuf.
1709 If pbuf points to a NULL pointer, it is allocated.
1710 We truncate lines that are too long, unless we're dealing with
1711 preprocessor lines or if the option -ffixed-line-length-none is set,
1712 in which case we reallocate the buffer to fit the entire line, if
1713 need be.
1714 In fixed mode, we expand a tab that occurs within the statement
1715 label region to expand to spaces that leave the next character in
1716 the source region.
1718 If first_char is not NULL, it's a pointer to a single char value holding
1719 the first character of the line, which has already been read by the
1720 caller. This avoids the use of ungetc().
1722 load_line returns whether the line was truncated.
1724 NOTE: The error machinery isn't available at this point, so we can't
1725 easily report line and column numbers consistent with other
1726 parts of gfortran. */
1728 static int
1729 load_line (FILE *input, gfc_char_t **pbuf, int *pbuflen, const int *first_char)
1731 static int linenum = 0, current_line = 1;
1732 int c, maxlen, i, preprocessor_flag, buflen = *pbuflen;
1733 int trunc_flag = 0, seen_comment = 0;
1734 int seen_printable = 0, seen_ampersand = 0, quoted = ' ';
1735 gfc_char_t *buffer;
1736 bool found_tab = false;
1738 /* Determine the maximum allowed line length. */
1739 if (gfc_current_form == FORM_FREE)
1740 maxlen = flag_free_line_length;
1741 else if (gfc_current_form == FORM_FIXED)
1742 maxlen = flag_fixed_line_length;
1743 else
1744 maxlen = 72;
1746 if (*pbuf == NULL)
1748 /* Allocate the line buffer, storing its length into buflen.
1749 Note that if maxlen==0, indicating that arbitrary-length lines
1750 are allowed, the buffer will be reallocated if this length is
1751 insufficient; since 132 characters is the length of a standard
1752 free-form line, we use that as a starting guess. */
1753 if (maxlen > 0)
1754 buflen = maxlen;
1755 else
1756 buflen = 132;
1758 *pbuf = gfc_get_wide_string (buflen + 1);
1761 i = 0;
1762 buffer = *pbuf;
1764 if (first_char)
1765 c = *first_char;
1766 else
1767 c = getc (input);
1769 /* In order to not truncate preprocessor lines, we have to
1770 remember that this is one. */
1771 preprocessor_flag = (c == '#' ? 1 : 0);
1773 for (;;)
1775 if (c == EOF)
1776 break;
1778 if (c == '\n')
1780 /* Check for illegal use of ampersand. See F95 Standard 3.3.1.3. */
1781 if (gfc_current_form == FORM_FREE
1782 && !seen_printable && seen_ampersand)
1784 if (pedantic)
1785 gfc_error_now ("%<&%> not allowed by itself in line %d",
1786 current_line);
1787 else
1788 gfc_warning_now (0, "%<&%> not allowed by itself in line %d",
1789 current_line);
1791 break;
1794 if (c == '\r' || c == '\0')
1795 goto next_char; /* Gobble characters. */
1797 if (c == '&')
1799 if (seen_ampersand)
1801 seen_ampersand = 0;
1802 seen_printable = 1;
1804 else
1805 seen_ampersand = 1;
1808 if ((c != '&' && c != '!' && c != ' ') || (c == '!' && !seen_ampersand))
1809 seen_printable = 1;
1811 /* Is this a fixed-form comment? */
1812 if (gfc_current_form == FORM_FIXED && i == 0
1813 && (c == '*' || c == 'c' || c == 'd'))
1814 seen_comment = 1;
1816 if (quoted == ' ')
1818 if (c == '\'' || c == '"')
1819 quoted = c;
1821 else if (c == quoted)
1822 quoted = ' ';
1824 /* Is this a free-form comment? */
1825 if (c == '!' && quoted == ' ')
1826 seen_comment = 1;
1828 /* Vendor extension: "<tab>1" marks a continuation line. */
1829 if (found_tab)
1831 found_tab = false;
1832 if (c >= '1' && c <= '9')
1834 *(buffer-1) = c;
1835 goto next_char;
1839 if (gfc_current_form == FORM_FIXED && c == '\t' && i < 6)
1841 found_tab = true;
1843 if (warn_tabs && seen_comment == 0 && current_line != linenum)
1845 linenum = current_line;
1846 gfc_warning_now (OPT_Wtabs,
1847 "Nonconforming tab character in column %d "
1848 "of line %d", i+1, linenum);
1851 while (i < 6)
1853 *buffer++ = ' ';
1854 i++;
1857 goto next_char;
1860 *buffer++ = c;
1861 i++;
1863 if (maxlen == 0 || preprocessor_flag)
1865 if (i >= buflen)
1867 /* Reallocate line buffer to double size to hold the
1868 overlong line. */
1869 buflen = buflen * 2;
1870 *pbuf = XRESIZEVEC (gfc_char_t, *pbuf, (buflen + 1));
1871 buffer = (*pbuf) + i;
1874 else if (i >= maxlen)
1876 bool trunc_warn = true;
1878 /* Enhancement, if the very next non-space character is an ampersand
1879 or comment that we would otherwise warn about, don't mark as
1880 truncated. */
1882 /* Truncate the rest of the line. */
1883 for (;;)
1885 c = getc (input);
1886 if (c == '\r' || c == ' ')
1887 continue;
1889 if (c == '\n' || c == EOF)
1890 break;
1892 if (!trunc_warn && c != '!')
1893 trunc_warn = true;
1895 if (trunc_warn && ((gfc_current_form == FORM_FIXED && c == '&')
1896 || c == '!'))
1897 trunc_warn = false;
1899 if (c == '!')
1900 seen_comment = 1;
1902 if (trunc_warn && !seen_comment)
1903 trunc_flag = 1;
1906 c = '\n';
1907 continue;
1910 next_char:
1911 c = getc (input);
1914 /* Pad lines to the selected line length in fixed form. */
1915 if (gfc_current_form == FORM_FIXED
1916 && flag_fixed_line_length != 0
1917 && !preprocessor_flag
1918 && c != EOF)
1920 while (i++ < maxlen)
1921 *buffer++ = ' ';
1924 *buffer = '\0';
1925 *pbuflen = buflen;
1926 current_line++;
1928 return trunc_flag;
1932 /* Get a gfc_file structure, initialize it and add it to
1933 the file stack. */
1935 static gfc_file *
1936 get_file (const char *name, enum lc_reason reason ATTRIBUTE_UNUSED)
1938 gfc_file *f;
1940 f = XCNEW (gfc_file);
1942 f->filename = xstrdup (name);
1944 f->next = file_head;
1945 file_head = f;
1947 f->up = current_file;
1948 if (current_file != NULL)
1949 f->inclusion_line = current_file->line;
1951 linemap_add (line_table, reason, false, f->filename, 1);
1953 return f;
1957 /* Deal with a line from the C preprocessor. The
1958 initial octothorp has already been seen. */
1960 static void
1961 preprocessor_line (gfc_char_t *c)
1963 bool flag[5];
1964 int i, line;
1965 gfc_char_t *wide_filename;
1966 gfc_file *f;
1967 int escaped, unescape;
1968 char *filename;
1970 c++;
1971 while (*c == ' ' || *c == '\t')
1972 c++;
1974 if (*c < '0' || *c > '9')
1975 goto bad_cpp_line;
1977 line = wide_atoi (c);
1979 c = wide_strchr (c, ' ');
1980 if (c == NULL)
1982 /* No file name given. Set new line number. */
1983 current_file->line = line;
1984 return;
1987 /* Skip spaces. */
1988 while (*c == ' ' || *c == '\t')
1989 c++;
1991 /* Skip quote. */
1992 if (*c != '"')
1993 goto bad_cpp_line;
1994 ++c;
1996 wide_filename = c;
1998 /* Make filename end at quote. */
1999 unescape = 0;
2000 escaped = false;
2001 while (*c && ! (!escaped && *c == '"'))
2003 if (escaped)
2004 escaped = false;
2005 else if (*c == '\\')
2007 escaped = true;
2008 unescape++;
2010 ++c;
2013 if (! *c)
2014 /* Preprocessor line has no closing quote. */
2015 goto bad_cpp_line;
2017 *c++ = '\0';
2019 /* Undo effects of cpp_quote_string. */
2020 if (unescape)
2022 gfc_char_t *s = wide_filename;
2023 gfc_char_t *d = gfc_get_wide_string (c - wide_filename - unescape);
2025 wide_filename = d;
2026 while (*s)
2028 if (*s == '\\')
2029 *d++ = *++s;
2030 else
2031 *d++ = *s;
2032 s++;
2034 *d = '\0';
2037 /* Get flags. */
2039 flag[1] = flag[2] = flag[3] = flag[4] = false;
2041 for (;;)
2043 c = wide_strchr (c, ' ');
2044 if (c == NULL)
2045 break;
2047 c++;
2048 i = wide_atoi (c);
2050 if (1 <= i && i <= 4)
2051 flag[i] = true;
2054 /* Convert the filename in wide characters into a filename in narrow
2055 characters. */
2056 filename = gfc_widechar_to_char (wide_filename, -1);
2058 /* Interpret flags. */
2060 if (flag[1]) /* Starting new file. */
2062 f = get_file (filename, LC_RENAME);
2063 add_file_change (f->filename, f->inclusion_line);
2064 current_file = f;
2067 if (flag[2]) /* Ending current file. */
2069 if (!current_file->up
2070 || filename_cmp (current_file->up->filename, filename) != 0)
2072 linemap_line_start (line_table, current_file->line, 80);
2073 /* ??? One could compute the exact column where the filename
2074 starts and compute the exact location here. */
2075 gfc_warning_now_at (linemap_position_for_column (line_table, 1),
2076 0, "file %qs left but not entered",
2077 filename);
2078 current_file->line++;
2079 if (unescape)
2080 free (wide_filename);
2081 free (filename);
2082 return;
2085 add_file_change (NULL, line);
2086 current_file = current_file->up;
2087 linemap_add (line_table, LC_RENAME, false, current_file->filename,
2088 current_file->line);
2091 /* The name of the file can be a temporary file produced by
2092 cpp. Replace the name if it is different. */
2094 if (filename_cmp (current_file->filename, filename) != 0)
2096 /* FIXME: we leak the old filename because a pointer to it may be stored
2097 in the linemap. Alternative could be using GC or updating linemap to
2098 point to the new name, but there is no API for that currently. */
2099 current_file->filename = xstrdup (filename);
2102 /* Set new line number. */
2103 current_file->line = line;
2104 if (unescape)
2105 free (wide_filename);
2106 free (filename);
2107 return;
2109 bad_cpp_line:
2110 linemap_line_start (line_table, current_file->line, 80);
2111 /* ??? One could compute the exact column where the directive
2112 starts and compute the exact location here. */
2113 gfc_warning_now_at (linemap_position_for_column (line_table, 2), 0,
2114 "Illegal preprocessor directive");
2115 current_file->line++;
2119 static bool load_file (const char *, const char *, bool);
2121 /* include_line()-- Checks a line buffer to see if it is an include
2122 line. If so, we call load_file() recursively to load the included
2123 file. We never return a syntax error because a statement like
2124 "include = 5" is perfectly legal. We return false if no include was
2125 processed or true if we matched an include. */
2127 static bool
2128 include_line (gfc_char_t *line)
2130 gfc_char_t quote, *c, *begin, *stop;
2131 char *filename;
2133 c = line;
2135 if (flag_openmp || flag_openmp_simd)
2137 if (gfc_current_form == FORM_FREE)
2139 while (*c == ' ' || *c == '\t')
2140 c++;
2141 if (*c == '!' && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
2142 c += 3;
2144 else
2146 if ((*c == '!' || *c == 'c' || *c == 'C' || *c == '*')
2147 && c[1] == '$' && (c[2] == ' ' || c[2] == '\t'))
2148 c += 3;
2152 while (*c == ' ' || *c == '\t')
2153 c++;
2155 if (gfc_wide_strncasecmp (c, "include", 7))
2156 return false;
2158 c += 7;
2159 while (*c == ' ' || *c == '\t')
2160 c++;
2162 /* Find filename between quotes. */
2164 quote = *c++;
2165 if (quote != '"' && quote != '\'')
2166 return false;
2168 begin = c;
2170 while (*c != quote && *c != '\0')
2171 c++;
2173 if (*c == '\0')
2174 return false;
2176 stop = c++;
2178 while (*c == ' ' || *c == '\t')
2179 c++;
2181 if (*c != '\0' && *c != '!')
2182 return false;
2184 /* We have an include line at this point. */
2186 *stop = '\0'; /* It's ok to trash the buffer, as this line won't be
2187 read by anything else. */
2189 filename = gfc_widechar_to_char (begin, -1);
2190 if (!load_file (filename, NULL, false))
2191 exit (FATAL_EXIT_CODE);
2193 free (filename);
2194 return true;
2198 /* Load a file into memory by calling load_line until the file ends. */
2200 static bool
2201 load_file (const char *realfilename, const char *displayedname, bool initial)
2203 gfc_char_t *line;
2204 gfc_linebuf *b;
2205 gfc_file *f;
2206 FILE *input;
2207 int len, line_len;
2208 bool first_line;
2209 struct stat st;
2210 int stat_result;
2211 const char *filename;
2212 /* If realfilename and displayedname are different and non-null then
2213 surely realfilename is the preprocessed form of
2214 displayedname. */
2215 bool preprocessed_p = (realfilename && displayedname
2216 && strcmp (realfilename, displayedname));
2218 filename = displayedname ? displayedname : realfilename;
2220 for (f = current_file; f; f = f->up)
2221 if (filename_cmp (filename, f->filename) == 0)
2223 fprintf (stderr, "%s:%d: Error: File '%s' is being included "
2224 "recursively\n", current_file->filename, current_file->line,
2225 filename);
2226 return false;
2229 if (initial)
2231 if (gfc_src_file)
2233 input = gfc_src_file;
2234 gfc_src_file = NULL;
2236 else
2237 input = gfc_open_file (realfilename);
2239 if (input == NULL)
2241 gfc_error_now ("Can't open file %qs", filename);
2242 return false;
2245 else
2247 input = gfc_open_included_file (realfilename, false, false);
2248 if (input == NULL)
2250 fprintf (stderr, "%s:%d: Error: Can't open included file '%s'\n",
2251 current_file->filename, current_file->line, filename);
2252 return false;
2254 stat_result = stat (realfilename, &st);
2255 if (stat_result == 0 && !S_ISREG(st.st_mode))
2257 fprintf (stderr, "%s:%d: Error: Included path '%s'"
2258 " is not a regular file\n",
2259 current_file->filename, current_file->line, filename);
2260 fclose (input);
2261 return false;
2265 /* Load the file.
2267 A "non-initial" file means a file that is being included. In
2268 that case we are creating an LC_ENTER map.
2270 An "initial" file means a main file; one that is not included.
2271 That file has already got at least one (surely more) line map(s)
2272 created by gfc_init. So the subsequent map created in that case
2273 must have LC_RENAME reason.
2275 This latter case is not true for a preprocessed file. In that
2276 case, although the file is "initial", the line maps created by
2277 gfc_init was used during the preprocessing of the file. Now that
2278 the preprocessing is over and we are being fed the result of that
2279 preprocessing, we need to create a brand new line map for the
2280 preprocessed file, so the reason is going to be LC_ENTER. */
2282 f = get_file (filename, (initial && !preprocessed_p) ? LC_RENAME : LC_ENTER);
2283 if (!initial)
2284 add_file_change (f->filename, f->inclusion_line);
2285 current_file = f;
2286 current_file->line = 1;
2287 line = NULL;
2288 line_len = 0;
2289 first_line = true;
2291 if (initial && gfc_src_preprocessor_lines[0])
2293 preprocessor_line (gfc_src_preprocessor_lines[0]);
2294 free (gfc_src_preprocessor_lines[0]);
2295 gfc_src_preprocessor_lines[0] = NULL;
2296 if (gfc_src_preprocessor_lines[1])
2298 preprocessor_line (gfc_src_preprocessor_lines[1]);
2299 free (gfc_src_preprocessor_lines[1]);
2300 gfc_src_preprocessor_lines[1] = NULL;
2304 for (;;)
2306 int trunc = load_line (input, &line, &line_len, NULL);
2308 len = gfc_wide_strlen (line);
2309 if (feof (input) && len == 0)
2310 break;
2312 /* If this is the first line of the file, it can contain a byte
2313 order mark (BOM), which we will ignore:
2314 FF FE is UTF-16 little endian,
2315 FE FF is UTF-16 big endian,
2316 EF BB BF is UTF-8. */
2317 if (first_line
2318 && ((line_len >= 2 && line[0] == (unsigned char) '\xFF'
2319 && line[1] == (unsigned char) '\xFE')
2320 || (line_len >= 2 && line[0] == (unsigned char) '\xFE'
2321 && line[1] == (unsigned char) '\xFF')
2322 || (line_len >= 3 && line[0] == (unsigned char) '\xEF'
2323 && line[1] == (unsigned char) '\xBB'
2324 && line[2] == (unsigned char) '\xBF')))
2326 int n = line[1] == (unsigned char) '\xBB' ? 3 : 2;
2327 gfc_char_t *new_char = gfc_get_wide_string (line_len);
2329 wide_strcpy (new_char, &line[n]);
2330 free (line);
2331 line = new_char;
2332 len -= n;
2335 /* There are three things this line can be: a line of Fortran
2336 source, an include line or a C preprocessor directive. */
2338 if (line[0] == '#')
2340 /* When -g3 is specified, it's possible that we emit #define
2341 and #undef lines, which we need to pass to the middle-end
2342 so that it can emit correct debug info. */
2343 if (debug_info_level == DINFO_LEVEL_VERBOSE
2344 && (wide_strncmp (line, "#define ", 8) == 0
2345 || wide_strncmp (line, "#undef ", 7) == 0))
2347 else
2349 preprocessor_line (line);
2350 continue;
2354 /* Preprocessed files have preprocessor lines added before the byte
2355 order mark, so first_line is not about the first line of the file
2356 but the first line that's not a preprocessor line. */
2357 first_line = false;
2359 if (include_line (line))
2361 current_file->line++;
2362 continue;
2365 /* Add line. */
2367 b = XCNEWVAR (gfc_linebuf, gfc_linebuf_header_size
2368 + (len + 1) * sizeof (gfc_char_t));
2371 b->location
2372 = linemap_line_start (line_table, current_file->line++, len);
2373 /* ??? We add the location for the maximum column possible here,
2374 because otherwise if the next call creates a new line-map, it
2375 will not reserve space for any offset. */
2376 if (len > 0)
2377 linemap_position_for_column (line_table, len);
2379 b->file = current_file;
2380 b->truncated = trunc;
2381 wide_strcpy (b->line, line);
2383 if (line_head == NULL)
2384 line_head = b;
2385 else
2386 line_tail->next = b;
2388 line_tail = b;
2390 while (file_changes_cur < file_changes_count)
2391 file_changes[file_changes_cur++].lb = b;
2394 /* Release the line buffer allocated in load_line. */
2395 free (line);
2397 fclose (input);
2399 if (!initial)
2400 add_file_change (NULL, current_file->inclusion_line + 1);
2401 current_file = current_file->up;
2402 linemap_add (line_table, LC_LEAVE, 0, NULL, 0);
2403 return true;
2407 /* Open a new file and start scanning from that file. Returns true
2408 if everything went OK, false otherwise. If form == FORM_UNKNOWN
2409 it tries to determine the source form from the filename, defaulting
2410 to free form. */
2412 bool
2413 gfc_new_file (void)
2415 bool result;
2417 if (gfc_cpp_enabled ())
2419 result = gfc_cpp_preprocess (gfc_source_file);
2420 if (!gfc_cpp_preprocess_only ())
2421 result = load_file (gfc_cpp_temporary_file (), gfc_source_file, true);
2423 else
2424 result = load_file (gfc_source_file, NULL, true);
2426 gfc_current_locus.lb = line_head;
2427 gfc_current_locus.nextc = (line_head == NULL) ? NULL : line_head->line;
2429 #if 0 /* Debugging aid. */
2430 for (; line_head; line_head = line_head->next)
2431 printf ("%s:%3d %s\n", LOCATION_FILE (line_head->location),
2432 LOCATION_LINE (line_head->location), line_head->line);
2434 exit (SUCCESS_EXIT_CODE);
2435 #endif
2437 return result;
2440 static char *
2441 unescape_filename (const char *ptr)
2443 const char *p = ptr, *s;
2444 char *d, *ret;
2445 int escaped, unescape = 0;
2447 /* Make filename end at quote. */
2448 escaped = false;
2449 while (*p && ! (! escaped && *p == '"'))
2451 if (escaped)
2452 escaped = false;
2453 else if (*p == '\\')
2455 escaped = true;
2456 unescape++;
2458 ++p;
2461 if (!*p || p[1])
2462 return NULL;
2464 /* Undo effects of cpp_quote_string. */
2465 s = ptr;
2466 d = XCNEWVEC (char, p + 1 - ptr - unescape);
2467 ret = d;
2469 while (s != p)
2471 if (*s == '\\')
2472 *d++ = *++s;
2473 else
2474 *d++ = *s;
2475 s++;
2477 *d = '\0';
2478 return ret;
2481 /* For preprocessed files, if the first tokens are of the form # NUM.
2482 handle the directives so we know the original file name. */
2484 const char *
2485 gfc_read_orig_filename (const char *filename, const char **canon_source_file)
2487 int c, len;
2488 char *dirname, *tmp;
2490 gfc_src_file = gfc_open_file (filename);
2491 if (gfc_src_file == NULL)
2492 return NULL;
2494 c = getc (gfc_src_file);
2496 if (c != '#')
2497 return NULL;
2499 len = 0;
2500 load_line (gfc_src_file, &gfc_src_preprocessor_lines[0], &len, &c);
2502 if (wide_strncmp (gfc_src_preprocessor_lines[0], "# 1 \"", 5) != 0)
2503 return NULL;
2505 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[0][5], -1);
2506 filename = unescape_filename (tmp);
2507 free (tmp);
2508 if (filename == NULL)
2509 return NULL;
2511 c = getc (gfc_src_file);
2513 if (c != '#')
2514 return filename;
2516 len = 0;
2517 load_line (gfc_src_file, &gfc_src_preprocessor_lines[1], &len, &c);
2519 if (wide_strncmp (gfc_src_preprocessor_lines[1], "# 1 \"", 5) != 0)
2520 return filename;
2522 tmp = gfc_widechar_to_char (&gfc_src_preprocessor_lines[1][5], -1);
2523 dirname = unescape_filename (tmp);
2524 free (tmp);
2525 if (dirname == NULL)
2526 return filename;
2528 len = strlen (dirname);
2529 if (len < 3 || dirname[len - 1] != '/' || dirname[len - 2] != '/')
2531 free (dirname);
2532 return filename;
2534 dirname[len - 2] = '\0';
2535 set_src_pwd (dirname);
2537 if (! IS_ABSOLUTE_PATH (filename))
2539 char *p = XCNEWVEC (char, len + strlen (filename));
2541 memcpy (p, dirname, len - 2);
2542 p[len - 2] = '/';
2543 strcpy (p + len - 1, filename);
2544 *canon_source_file = p;
2547 free (dirname);
2548 return filename;